Cuda.cpp 11 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401
  1. #include "clang/Basic/Cuda.h"
  2. #include "llvm/ADT/StringRef.h"
  3. #include "llvm/ADT/StringSwitch.h"
  4. #include "llvm/Support/ErrorHandling.h"
  5. #include "llvm/Support/VersionTuple.h"
  6. namespace clang {
  7. const char *CudaVersionToString(CudaVersion V) {
  8. switch (V) {
  9. case CudaVersion::UNKNOWN:
  10. return "unknown";
  11. case CudaVersion::CUDA_70:
  12. return "7.0";
  13. case CudaVersion::CUDA_75:
  14. return "7.5";
  15. case CudaVersion::CUDA_80:
  16. return "8.0";
  17. case CudaVersion::CUDA_90:
  18. return "9.0";
  19. case CudaVersion::CUDA_91:
  20. return "9.1";
  21. case CudaVersion::CUDA_92:
  22. return "9.2";
  23. case CudaVersion::CUDA_100:
  24. return "10.0";
  25. case CudaVersion::CUDA_101:
  26. return "10.1";
  27. }
  28. llvm_unreachable("invalid enum");
  29. }
  30. CudaVersion CudaStringToVersion(llvm::StringRef S) {
  31. return llvm::StringSwitch<CudaVersion>(S)
  32. .Case("7.0", CudaVersion::CUDA_70)
  33. .Case("7.5", CudaVersion::CUDA_75)
  34. .Case("8.0", CudaVersion::CUDA_80)
  35. .Case("9.0", CudaVersion::CUDA_90)
  36. .Case("9.1", CudaVersion::CUDA_91)
  37. .Case("9.2", CudaVersion::CUDA_92)
  38. .Case("10.0", CudaVersion::CUDA_100)
  39. .Case("10.1", CudaVersion::CUDA_101);
  40. }
  41. const char *CudaArchToString(CudaArch A) {
  42. switch (A) {
  43. case CudaArch::LAST:
  44. break;
  45. case CudaArch::UNKNOWN:
  46. return "unknown";
  47. case CudaArch::SM_20:
  48. return "sm_20";
  49. case CudaArch::SM_21:
  50. return "sm_21";
  51. case CudaArch::SM_30:
  52. return "sm_30";
  53. case CudaArch::SM_32:
  54. return "sm_32";
  55. case CudaArch::SM_35:
  56. return "sm_35";
  57. case CudaArch::SM_37:
  58. return "sm_37";
  59. case CudaArch::SM_50:
  60. return "sm_50";
  61. case CudaArch::SM_52:
  62. return "sm_52";
  63. case CudaArch::SM_53:
  64. return "sm_53";
  65. case CudaArch::SM_60:
  66. return "sm_60";
  67. case CudaArch::SM_61:
  68. return "sm_61";
  69. case CudaArch::SM_62:
  70. return "sm_62";
  71. case CudaArch::SM_70:
  72. return "sm_70";
  73. case CudaArch::SM_72:
  74. return "sm_72";
  75. case CudaArch::SM_75:
  76. return "sm_75";
  77. case CudaArch::GFX600: // tahiti
  78. return "gfx600";
  79. case CudaArch::GFX601: // pitcairn, verde, oland,hainan
  80. return "gfx601";
  81. case CudaArch::GFX700: // kaveri
  82. return "gfx700";
  83. case CudaArch::GFX701: // hawaii
  84. return "gfx701";
  85. case CudaArch::GFX702: // 290,290x,R390,R390x
  86. return "gfx702";
  87. case CudaArch::GFX703: // kabini mullins
  88. return "gfx703";
  89. case CudaArch::GFX704: // bonaire
  90. return "gfx704";
  91. case CudaArch::GFX801: // carrizo
  92. return "gfx801";
  93. case CudaArch::GFX802: // tonga,iceland
  94. return "gfx802";
  95. case CudaArch::GFX803: // fiji,polaris10
  96. return "gfx803";
  97. case CudaArch::GFX810: // stoney
  98. return "gfx810";
  99. case CudaArch::GFX900: // vega, instinct
  100. return "gfx900";
  101. case CudaArch::GFX902: // TBA
  102. return "gfx902";
  103. case CudaArch::GFX904: // TBA
  104. return "gfx904";
  105. case CudaArch::GFX906: // TBA
  106. return "gfx906";
  107. case CudaArch::GFX908: // TBA
  108. return "gfx908";
  109. case CudaArch::GFX909: // TBA
  110. return "gfx909";
  111. case CudaArch::GFX1010: // TBA
  112. return "gfx1010";
  113. case CudaArch::GFX1011: // TBA
  114. return "gfx1011";
  115. case CudaArch::GFX1012: // TBA
  116. return "gfx1012";
  117. }
  118. llvm_unreachable("invalid enum");
  119. }
  120. CudaArch StringToCudaArch(llvm::StringRef S) {
  121. return llvm::StringSwitch<CudaArch>(S)
  122. .Case("sm_20", CudaArch::SM_20)
  123. .Case("sm_21", CudaArch::SM_21)
  124. .Case("sm_30", CudaArch::SM_30)
  125. .Case("sm_32", CudaArch::SM_32)
  126. .Case("sm_35", CudaArch::SM_35)
  127. .Case("sm_37", CudaArch::SM_37)
  128. .Case("sm_50", CudaArch::SM_50)
  129. .Case("sm_52", CudaArch::SM_52)
  130. .Case("sm_53", CudaArch::SM_53)
  131. .Case("sm_60", CudaArch::SM_60)
  132. .Case("sm_61", CudaArch::SM_61)
  133. .Case("sm_62", CudaArch::SM_62)
  134. .Case("sm_70", CudaArch::SM_70)
  135. .Case("sm_72", CudaArch::SM_72)
  136. .Case("sm_75", CudaArch::SM_75)
  137. .Case("gfx600", CudaArch::GFX600)
  138. .Case("gfx601", CudaArch::GFX601)
  139. .Case("gfx700", CudaArch::GFX700)
  140. .Case("gfx701", CudaArch::GFX701)
  141. .Case("gfx702", CudaArch::GFX702)
  142. .Case("gfx703", CudaArch::GFX703)
  143. .Case("gfx704", CudaArch::GFX704)
  144. .Case("gfx801", CudaArch::GFX801)
  145. .Case("gfx802", CudaArch::GFX802)
  146. .Case("gfx803", CudaArch::GFX803)
  147. .Case("gfx810", CudaArch::GFX810)
  148. .Case("gfx900", CudaArch::GFX900)
  149. .Case("gfx902", CudaArch::GFX902)
  150. .Case("gfx904", CudaArch::GFX904)
  151. .Case("gfx906", CudaArch::GFX906)
  152. .Case("gfx908", CudaArch::GFX908)
  153. .Case("gfx909", CudaArch::GFX909)
  154. .Case("gfx1010", CudaArch::GFX1010)
  155. .Case("gfx1011", CudaArch::GFX1011)
  156. .Case("gfx1012", CudaArch::GFX1012)
  157. .Default(CudaArch::UNKNOWN);
  158. }
  159. const char *CudaVirtualArchToString(CudaVirtualArch A) {
  160. switch (A) {
  161. case CudaVirtualArch::UNKNOWN:
  162. return "unknown";
  163. case CudaVirtualArch::COMPUTE_20:
  164. return "compute_20";
  165. case CudaVirtualArch::COMPUTE_30:
  166. return "compute_30";
  167. case CudaVirtualArch::COMPUTE_32:
  168. return "compute_32";
  169. case CudaVirtualArch::COMPUTE_35:
  170. return "compute_35";
  171. case CudaVirtualArch::COMPUTE_37:
  172. return "compute_37";
  173. case CudaVirtualArch::COMPUTE_50:
  174. return "compute_50";
  175. case CudaVirtualArch::COMPUTE_52:
  176. return "compute_52";
  177. case CudaVirtualArch::COMPUTE_53:
  178. return "compute_53";
  179. case CudaVirtualArch::COMPUTE_60:
  180. return "compute_60";
  181. case CudaVirtualArch::COMPUTE_61:
  182. return "compute_61";
  183. case CudaVirtualArch::COMPUTE_62:
  184. return "compute_62";
  185. case CudaVirtualArch::COMPUTE_70:
  186. return "compute_70";
  187. case CudaVirtualArch::COMPUTE_72:
  188. return "compute_72";
  189. case CudaVirtualArch::COMPUTE_75:
  190. return "compute_75";
  191. case CudaVirtualArch::COMPUTE_AMDGCN:
  192. return "compute_amdgcn";
  193. }
  194. llvm_unreachable("invalid enum");
  195. }
  196. CudaVirtualArch StringToCudaVirtualArch(llvm::StringRef S) {
  197. return llvm::StringSwitch<CudaVirtualArch>(S)
  198. .Case("compute_20", CudaVirtualArch::COMPUTE_20)
  199. .Case("compute_30", CudaVirtualArch::COMPUTE_30)
  200. .Case("compute_32", CudaVirtualArch::COMPUTE_32)
  201. .Case("compute_35", CudaVirtualArch::COMPUTE_35)
  202. .Case("compute_37", CudaVirtualArch::COMPUTE_37)
  203. .Case("compute_50", CudaVirtualArch::COMPUTE_50)
  204. .Case("compute_52", CudaVirtualArch::COMPUTE_52)
  205. .Case("compute_53", CudaVirtualArch::COMPUTE_53)
  206. .Case("compute_60", CudaVirtualArch::COMPUTE_60)
  207. .Case("compute_61", CudaVirtualArch::COMPUTE_61)
  208. .Case("compute_62", CudaVirtualArch::COMPUTE_62)
  209. .Case("compute_70", CudaVirtualArch::COMPUTE_70)
  210. .Case("compute_72", CudaVirtualArch::COMPUTE_72)
  211. .Case("compute_75", CudaVirtualArch::COMPUTE_75)
  212. .Case("compute_amdgcn", CudaVirtualArch::COMPUTE_AMDGCN)
  213. .Default(CudaVirtualArch::UNKNOWN);
  214. }
  215. CudaVirtualArch VirtualArchForCudaArch(CudaArch A) {
  216. switch (A) {
  217. case CudaArch::LAST:
  218. break;
  219. case CudaArch::UNKNOWN:
  220. return CudaVirtualArch::UNKNOWN;
  221. case CudaArch::SM_20:
  222. case CudaArch::SM_21:
  223. return CudaVirtualArch::COMPUTE_20;
  224. case CudaArch::SM_30:
  225. return CudaVirtualArch::COMPUTE_30;
  226. case CudaArch::SM_32:
  227. return CudaVirtualArch::COMPUTE_32;
  228. case CudaArch::SM_35:
  229. return CudaVirtualArch::COMPUTE_35;
  230. case CudaArch::SM_37:
  231. return CudaVirtualArch::COMPUTE_37;
  232. case CudaArch::SM_50:
  233. return CudaVirtualArch::COMPUTE_50;
  234. case CudaArch::SM_52:
  235. return CudaVirtualArch::COMPUTE_52;
  236. case CudaArch::SM_53:
  237. return CudaVirtualArch::COMPUTE_53;
  238. case CudaArch::SM_60:
  239. return CudaVirtualArch::COMPUTE_60;
  240. case CudaArch::SM_61:
  241. return CudaVirtualArch::COMPUTE_61;
  242. case CudaArch::SM_62:
  243. return CudaVirtualArch::COMPUTE_62;
  244. case CudaArch::SM_70:
  245. return CudaVirtualArch::COMPUTE_70;
  246. case CudaArch::SM_72:
  247. return CudaVirtualArch::COMPUTE_72;
  248. case CudaArch::SM_75:
  249. return CudaVirtualArch::COMPUTE_75;
  250. case CudaArch::GFX600:
  251. case CudaArch::GFX601:
  252. case CudaArch::GFX700:
  253. case CudaArch::GFX701:
  254. case CudaArch::GFX702:
  255. case CudaArch::GFX703:
  256. case CudaArch::GFX704:
  257. case CudaArch::GFX801:
  258. case CudaArch::GFX802:
  259. case CudaArch::GFX803:
  260. case CudaArch::GFX810:
  261. case CudaArch::GFX900:
  262. case CudaArch::GFX902:
  263. case CudaArch::GFX904:
  264. case CudaArch::GFX906:
  265. case CudaArch::GFX908:
  266. case CudaArch::GFX909:
  267. case CudaArch::GFX1010:
  268. case CudaArch::GFX1011:
  269. case CudaArch::GFX1012:
  270. return CudaVirtualArch::COMPUTE_AMDGCN;
  271. }
  272. llvm_unreachable("invalid enum");
  273. }
  274. CudaVersion MinVersionForCudaArch(CudaArch A) {
  275. switch (A) {
  276. case CudaArch::LAST:
  277. break;
  278. case CudaArch::UNKNOWN:
  279. return CudaVersion::UNKNOWN;
  280. case CudaArch::SM_20:
  281. case CudaArch::SM_21:
  282. case CudaArch::SM_30:
  283. case CudaArch::SM_32:
  284. case CudaArch::SM_35:
  285. case CudaArch::SM_37:
  286. case CudaArch::SM_50:
  287. case CudaArch::SM_52:
  288. case CudaArch::SM_53:
  289. return CudaVersion::CUDA_70;
  290. case CudaArch::SM_60:
  291. case CudaArch::SM_61:
  292. case CudaArch::SM_62:
  293. return CudaVersion::CUDA_80;
  294. case CudaArch::SM_70:
  295. return CudaVersion::CUDA_90;
  296. case CudaArch::SM_72:
  297. return CudaVersion::CUDA_91;
  298. case CudaArch::SM_75:
  299. return CudaVersion::CUDA_100;
  300. case CudaArch::GFX600:
  301. case CudaArch::GFX601:
  302. case CudaArch::GFX700:
  303. case CudaArch::GFX701:
  304. case CudaArch::GFX702:
  305. case CudaArch::GFX703:
  306. case CudaArch::GFX704:
  307. case CudaArch::GFX801:
  308. case CudaArch::GFX802:
  309. case CudaArch::GFX803:
  310. case CudaArch::GFX810:
  311. case CudaArch::GFX900:
  312. case CudaArch::GFX902:
  313. case CudaArch::GFX904:
  314. case CudaArch::GFX906:
  315. case CudaArch::GFX908:
  316. case CudaArch::GFX909:
  317. case CudaArch::GFX1010:
  318. case CudaArch::GFX1011:
  319. case CudaArch::GFX1012:
  320. return CudaVersion::CUDA_70;
  321. }
  322. llvm_unreachable("invalid enum");
  323. }
  324. CudaVersion MaxVersionForCudaArch(CudaArch A) {
  325. switch (A) {
  326. case CudaArch::UNKNOWN:
  327. return CudaVersion::UNKNOWN;
  328. case CudaArch::SM_20:
  329. case CudaArch::SM_21:
  330. case CudaArch::GFX600:
  331. case CudaArch::GFX601:
  332. case CudaArch::GFX700:
  333. case CudaArch::GFX701:
  334. case CudaArch::GFX702:
  335. case CudaArch::GFX703:
  336. case CudaArch::GFX704:
  337. case CudaArch::GFX801:
  338. case CudaArch::GFX802:
  339. case CudaArch::GFX803:
  340. case CudaArch::GFX810:
  341. case CudaArch::GFX900:
  342. case CudaArch::GFX902:
  343. case CudaArch::GFX1010:
  344. case CudaArch::GFX1011:
  345. case CudaArch::GFX1012:
  346. return CudaVersion::CUDA_80;
  347. default:
  348. return CudaVersion::LATEST;
  349. }
  350. }
  351. static CudaVersion ToCudaVersion(llvm::VersionTuple Version) {
  352. int IVer =
  353. Version.getMajor() * 10 + Version.getMinor().getValueOr(0);
  354. switch(IVer) {
  355. case 70:
  356. return CudaVersion::CUDA_70;
  357. case 75:
  358. return CudaVersion::CUDA_75;
  359. case 80:
  360. return CudaVersion::CUDA_80;
  361. case 90:
  362. return CudaVersion::CUDA_90;
  363. case 91:
  364. return CudaVersion::CUDA_91;
  365. case 92:
  366. return CudaVersion::CUDA_92;
  367. case 100:
  368. return CudaVersion::CUDA_100;
  369. case 101:
  370. return CudaVersion::CUDA_101;
  371. default:
  372. return CudaVersion::UNKNOWN;
  373. }
  374. }
  375. bool CudaFeatureEnabled(llvm::VersionTuple Version, CudaFeature Feature) {
  376. return CudaFeatureEnabled(ToCudaVersion(Version), Feature);
  377. }
  378. bool CudaFeatureEnabled(CudaVersion Version, CudaFeature Feature) {
  379. switch (Feature) {
  380. case CudaFeature::CUDA_USES_NEW_LAUNCH:
  381. return Version >= CudaVersion::CUDA_92;
  382. case CudaFeature::CUDA_USES_FATBIN_REGISTER_END:
  383. return Version >= CudaVersion::CUDA_101;
  384. }
  385. llvm_unreachable("Unknown CUDA feature.");
  386. }
  387. } // namespace clang