AMDGPU.h 10 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360
  1. //===--- AMDGPU.h - Declare AMDGPU target feature support -------*- C++ -*-===//
  2. //
  3. // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
  4. // See https://llvm.org/LICENSE.txt for license information.
  5. // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
  6. //
  7. //===----------------------------------------------------------------------===//
  8. //
  9. // This file declares AMDGPU TargetInfo objects.
  10. //
  11. //===----------------------------------------------------------------------===//
  12. #ifndef LLVM_CLANG_LIB_BASIC_TARGETS_AMDGPU_H
  13. #define LLVM_CLANG_LIB_BASIC_TARGETS_AMDGPU_H
  14. #include "clang/Basic/TargetInfo.h"
  15. #include "clang/Basic/TargetOptions.h"
  16. #include "llvm/ADT/StringSet.h"
  17. #include "llvm/ADT/Triple.h"
  18. #include "llvm/Support/Compiler.h"
  19. #include "llvm/Support/TargetParser.h"
  20. namespace clang {
  21. namespace targets {
  22. class LLVM_LIBRARY_VISIBILITY AMDGPUTargetInfo final : public TargetInfo {
  23. static const Builtin::Info BuiltinInfo[];
  24. static const char *const GCCRegNames[];
  25. enum AddrSpace {
  26. Generic = 0,
  27. Global = 1,
  28. Local = 3,
  29. Constant = 4,
  30. Private = 5
  31. };
  32. static const LangASMap AMDGPUDefIsGenMap;
  33. static const LangASMap AMDGPUDefIsPrivMap;
  34. llvm::AMDGPU::GPUKind GPUKind;
  35. unsigned GPUFeatures;
  36. bool hasFP64() const {
  37. return getTriple().getArch() == llvm::Triple::amdgcn ||
  38. !!(GPUFeatures & llvm::AMDGPU::FEATURE_FP64);
  39. }
  40. /// Has fast fma f32
  41. bool hasFastFMAF() const {
  42. return !!(GPUFeatures & llvm::AMDGPU::FEATURE_FAST_FMA_F32);
  43. }
  44. /// Has fast fma f64
  45. bool hasFastFMA() const {
  46. return getTriple().getArch() == llvm::Triple::amdgcn;
  47. }
  48. bool hasFMAF() const {
  49. return getTriple().getArch() == llvm::Triple::amdgcn ||
  50. !!(GPUFeatures & llvm::AMDGPU::FEATURE_FMA);
  51. }
  52. bool hasFullRateDenormalsF32() const {
  53. return !!(GPUFeatures & llvm::AMDGPU::FEATURE_FAST_DENORMAL_F32);
  54. }
  55. bool hasLDEXPF() const {
  56. return getTriple().getArch() == llvm::Triple::amdgcn ||
  57. !!(GPUFeatures & llvm::AMDGPU::FEATURE_LDEXP);
  58. }
  59. static bool isAMDGCN(const llvm::Triple &TT) {
  60. return TT.getArch() == llvm::Triple::amdgcn;
  61. }
  62. static bool isR600(const llvm::Triple &TT) {
  63. return TT.getArch() == llvm::Triple::r600;
  64. }
  65. public:
  66. AMDGPUTargetInfo(const llvm::Triple &Triple, const TargetOptions &Opts);
  67. void setAddressSpaceMap(bool DefaultIsPrivate);
  68. void adjust(LangOptions &Opts) override;
  69. uint64_t getPointerWidthV(unsigned AddrSpace) const override {
  70. if (isR600(getTriple()))
  71. return 32;
  72. if (AddrSpace == Private || AddrSpace == Local)
  73. return 32;
  74. return 64;
  75. }
  76. uint64_t getPointerAlignV(unsigned AddrSpace) const override {
  77. return getPointerWidthV(AddrSpace);
  78. }
  79. uint64_t getMaxPointerWidth() const override {
  80. return getTriple().getArch() == llvm::Triple::amdgcn ? 64 : 32;
  81. }
  82. const char *getClobbers() const override { return ""; }
  83. ArrayRef<const char *> getGCCRegNames() const override;
  84. ArrayRef<TargetInfo::GCCRegAlias> getGCCRegAliases() const override {
  85. return None;
  86. }
  87. /// Accepted register names: (n, m is unsigned integer, n < m)
  88. /// v
  89. /// s
  90. /// {vn}, {v[n]}
  91. /// {sn}, {s[n]}
  92. /// {S} , where S is a special register name
  93. ////{v[n:m]}
  94. /// {s[n:m]}
  95. bool validateAsmConstraint(const char *&Name,
  96. TargetInfo::ConstraintInfo &Info) const override {
  97. static const ::llvm::StringSet<> SpecialRegs({
  98. "exec", "vcc", "flat_scratch", "m0", "scc", "tba", "tma",
  99. "flat_scratch_lo", "flat_scratch_hi", "vcc_lo", "vcc_hi", "exec_lo",
  100. "exec_hi", "tma_lo", "tma_hi", "tba_lo", "tba_hi",
  101. });
  102. StringRef S(Name);
  103. bool HasLeftParen = false;
  104. if (S.front() == '{') {
  105. HasLeftParen = true;
  106. S = S.drop_front();
  107. }
  108. if (S.empty())
  109. return false;
  110. if (S.front() != 'v' && S.front() != 's') {
  111. if (!HasLeftParen)
  112. return false;
  113. auto E = S.find('}');
  114. if (!SpecialRegs.count(S.substr(0, E)))
  115. return false;
  116. S = S.drop_front(E + 1);
  117. if (!S.empty())
  118. return false;
  119. // Found {S} where S is a special register.
  120. Info.setAllowsRegister();
  121. Name = S.data() - 1;
  122. return true;
  123. }
  124. S = S.drop_front();
  125. if (!HasLeftParen) {
  126. if (!S.empty())
  127. return false;
  128. // Found s or v.
  129. Info.setAllowsRegister();
  130. Name = S.data() - 1;
  131. return true;
  132. }
  133. bool HasLeftBracket = false;
  134. if (!S.empty() && S.front() == '[') {
  135. HasLeftBracket = true;
  136. S = S.drop_front();
  137. }
  138. unsigned long long N;
  139. if (S.empty() || consumeUnsignedInteger(S, 10, N))
  140. return false;
  141. if (!S.empty() && S.front() == ':') {
  142. if (!HasLeftBracket)
  143. return false;
  144. S = S.drop_front();
  145. unsigned long long M;
  146. if (consumeUnsignedInteger(S, 10, M) || N >= M)
  147. return false;
  148. }
  149. if (HasLeftBracket) {
  150. if (S.empty() || S.front() != ']')
  151. return false;
  152. S = S.drop_front();
  153. }
  154. if (S.empty() || S.front() != '}')
  155. return false;
  156. S = S.drop_front();
  157. if (!S.empty())
  158. return false;
  159. // Found {vn}, {sn}, {v[n]}, {s[n]}, {v[n:m]}, or {s[n:m]}.
  160. Info.setAllowsRegister();
  161. Name = S.data() - 1;
  162. return true;
  163. }
  164. // \p Constraint will be left pointing at the last character of
  165. // the constraint. In practice, it won't be changed unless the
  166. // constraint is longer than one character.
  167. std::string convertConstraint(const char *&Constraint) const override {
  168. const char *Begin = Constraint;
  169. TargetInfo::ConstraintInfo Info("", "");
  170. if (validateAsmConstraint(Constraint, Info))
  171. return std::string(Begin).substr(0, Constraint - Begin + 1);
  172. Constraint = Begin;
  173. return std::string(1, *Constraint);
  174. }
  175. bool
  176. initFeatureMap(llvm::StringMap<bool> &Features, DiagnosticsEngine &Diags,
  177. StringRef CPU,
  178. const std::vector<std::string> &FeatureVec) const override;
  179. void adjustTargetOptions(const CodeGenOptions &CGOpts,
  180. TargetOptions &TargetOpts) const override;
  181. ArrayRef<Builtin::Info> getTargetBuiltins() const override;
  182. void getTargetDefines(const LangOptions &Opts,
  183. MacroBuilder &Builder) const override;
  184. BuiltinVaListKind getBuiltinVaListKind() const override {
  185. return TargetInfo::CharPtrBuiltinVaList;
  186. }
  187. bool isValidCPUName(StringRef Name) const override {
  188. if (getTriple().getArch() == llvm::Triple::amdgcn)
  189. return llvm::AMDGPU::parseArchAMDGCN(Name) != llvm::AMDGPU::GK_NONE;
  190. return llvm::AMDGPU::parseArchR600(Name) != llvm::AMDGPU::GK_NONE;
  191. }
  192. void fillValidCPUList(SmallVectorImpl<StringRef> &Values) const override;
  193. bool setCPU(const std::string &Name) override {
  194. if (getTriple().getArch() == llvm::Triple::amdgcn) {
  195. GPUKind = llvm::AMDGPU::parseArchAMDGCN(Name);
  196. GPUFeatures = llvm::AMDGPU::getArchAttrAMDGCN(GPUKind);
  197. } else {
  198. GPUKind = llvm::AMDGPU::parseArchR600(Name);
  199. GPUFeatures = llvm::AMDGPU::getArchAttrR600(GPUKind);
  200. }
  201. return GPUKind != llvm::AMDGPU::GK_NONE;
  202. }
  203. void setSupportedOpenCLOpts() override {
  204. auto &Opts = getSupportedOpenCLOpts();
  205. Opts.support("cl_clang_storage_class_specifiers");
  206. Opts.support("cl_khr_icd");
  207. bool IsAMDGCN = isAMDGCN(getTriple());
  208. if (hasFP64())
  209. Opts.support("cl_khr_fp64");
  210. if (IsAMDGCN || GPUKind >= llvm::AMDGPU::GK_CEDAR) {
  211. Opts.support("cl_khr_byte_addressable_store");
  212. Opts.support("cl_khr_global_int32_base_atomics");
  213. Opts.support("cl_khr_global_int32_extended_atomics");
  214. Opts.support("cl_khr_local_int32_base_atomics");
  215. Opts.support("cl_khr_local_int32_extended_atomics");
  216. }
  217. if (IsAMDGCN) {
  218. Opts.support("cl_khr_fp16");
  219. Opts.support("cl_khr_int64_base_atomics");
  220. Opts.support("cl_khr_int64_extended_atomics");
  221. Opts.support("cl_khr_mipmap_image");
  222. Opts.support("cl_khr_subgroups");
  223. Opts.support("cl_khr_3d_image_writes");
  224. Opts.support("cl_amd_media_ops");
  225. Opts.support("cl_amd_media_ops2");
  226. }
  227. }
  228. LangAS getOpenCLTypeAddrSpace(OpenCLTypeKind TK) const override {
  229. switch (TK) {
  230. case OCLTK_Image:
  231. return LangAS::opencl_constant;
  232. case OCLTK_ClkEvent:
  233. case OCLTK_Queue:
  234. case OCLTK_ReserveID:
  235. return LangAS::opencl_global;
  236. default:
  237. return TargetInfo::getOpenCLTypeAddrSpace(TK);
  238. }
  239. }
  240. LangAS getOpenCLBuiltinAddressSpace(unsigned AS) const override {
  241. switch (AS) {
  242. case 0:
  243. return LangAS::opencl_generic;
  244. case 1:
  245. return LangAS::opencl_global;
  246. case 3:
  247. return LangAS::opencl_local;
  248. case 4:
  249. return LangAS::opencl_constant;
  250. case 5:
  251. return LangAS::opencl_private;
  252. default:
  253. return getLangASFromTargetAS(AS);
  254. }
  255. }
  256. LangAS getCUDABuiltinAddressSpace(unsigned AS) const override {
  257. return LangAS::Default;
  258. }
  259. llvm::Optional<LangAS> getConstantAddressSpace() const override {
  260. return getLangASFromTargetAS(Constant);
  261. }
  262. /// \returns Target specific vtbl ptr address space.
  263. unsigned getVtblPtrAddressSpace() const override {
  264. return static_cast<unsigned>(Constant);
  265. }
  266. /// \returns If a target requires an address within a target specific address
  267. /// space \p AddressSpace to be converted in order to be used, then return the
  268. /// corresponding target specific DWARF address space.
  269. ///
  270. /// \returns Otherwise return None and no conversion will be emitted in the
  271. /// DWARF.
  272. Optional<unsigned>
  273. getDWARFAddressSpace(unsigned AddressSpace) const override {
  274. const unsigned DWARF_Private = 1;
  275. const unsigned DWARF_Local = 2;
  276. if (AddressSpace == Private) {
  277. return DWARF_Private;
  278. } else if (AddressSpace == Local) {
  279. return DWARF_Local;
  280. } else {
  281. return None;
  282. }
  283. }
  284. CallingConvCheckResult checkCallingConvention(CallingConv CC) const override {
  285. switch (CC) {
  286. default:
  287. return CCCR_Warning;
  288. case CC_C:
  289. case CC_OpenCLKernel:
  290. return CCCR_OK;
  291. }
  292. }
  293. // In amdgcn target the null pointer in global, constant, and generic
  294. // address space has value 0 but in private and local address space has
  295. // value ~0.
  296. uint64_t getNullPointerValue(LangAS AS) const override {
  297. return AS == LangAS::opencl_local ? ~0 : 0;
  298. }
  299. void setAuxTarget(const TargetInfo *Aux) override;
  300. };
  301. } // namespace targets
  302. } // namespace clang
  303. #endif // LLVM_CLANG_LIB_BASIC_TARGETS_AMDGPU_H