IRObjectFile.cpp 9.8 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331
  1. //===- IRObjectFile.cpp - IR object file implementation ---------*- C++ -*-===//
  2. //
  3. // The LLVM Compiler Infrastructure
  4. //
  5. // This file is distributed under the University of Illinois Open Source
  6. // License. See LICENSE.TXT for details.
  7. //
  8. //===----------------------------------------------------------------------===//
  9. //
  10. // Part of the IRObjectFile class implementation.
  11. //
  12. //===----------------------------------------------------------------------===//
  13. #include "llvm/Object/IRObjectFile.h"
  14. #include "RecordStreamer.h"
  15. #include "llvm/ADT/STLExtras.h"
  16. #include "llvm/Bitcode/ReaderWriter.h"
  17. #include "llvm/IR/GVMaterializer.h"
  18. #include "llvm/IR/LLVMContext.h"
  19. #include "llvm/IR/Mangler.h"
  20. #include "llvm/IR/Module.h"
  21. #include "llvm/MC/MCAsmInfo.h"
  22. #include "llvm/MC/MCContext.h"
  23. #include "llvm/MC/MCInstrInfo.h"
  24. #include "llvm/MC/MCObjectFileInfo.h"
  25. #include "llvm/MC/MCParser/MCAsmParser.h"
  26. #include "llvm/MC/MCParser/MCTargetAsmParser.h"
  27. #include "llvm/MC/MCRegisterInfo.h"
  28. #include "llvm/MC/MCSubtargetInfo.h"
  29. #include "llvm/Object/ObjectFile.h"
  30. #include "llvm/Support/MemoryBuffer.h"
  31. #include "llvm/Support/SourceMgr.h"
  32. #include "llvm/Support/TargetRegistry.h"
  33. #include "llvm/Support/raw_ostream.h"
  34. using namespace llvm;
  35. using namespace object;
  36. IRObjectFile::IRObjectFile(MemoryBufferRef Object, std::unique_ptr<Module> Mod)
  37. : SymbolicFile(Binary::ID_IR, Object), M(std::move(Mod)) {
  38. Mang.reset(new Mangler());
  39. CollectAsmUndefinedRefs(Triple(M->getTargetTriple()), M->getModuleInlineAsm(),
  40. [this](StringRef Name, BasicSymbolRef::Flags Flags) {
  41. AsmSymbols.emplace_back(Name, std::move(Flags));
  42. });
  43. }
  44. // Parse inline ASM and collect the list of symbols that are not defined in
  45. // the current module. This is inspired from IRObjectFile.
  46. void IRObjectFile::CollectAsmUndefinedRefs(
  47. const Triple &TT, StringRef InlineAsm,
  48. function_ref<void(StringRef, BasicSymbolRef::Flags)> AsmUndefinedRefs) {
  49. if (InlineAsm.empty())
  50. return;
  51. std::string Err;
  52. const Target *T = TargetRegistry::lookupTarget(TT.str(), Err);
  53. if (!T)
  54. return;
  55. std::unique_ptr<MCRegisterInfo> MRI(T->createMCRegInfo(TT.str()));
  56. if (!MRI)
  57. return;
  58. std::unique_ptr<MCAsmInfo> MAI(T->createMCAsmInfo(*MRI, TT.str()));
  59. if (!MAI)
  60. return;
  61. std::unique_ptr<MCSubtargetInfo> STI(
  62. T->createMCSubtargetInfo(TT.str(), "", ""));
  63. if (!STI)
  64. return;
  65. std::unique_ptr<MCInstrInfo> MCII(T->createMCInstrInfo());
  66. if (!MCII)
  67. return;
  68. MCObjectFileInfo MOFI;
  69. MCContext MCCtx(MAI.get(), MRI.get(), &MOFI);
  70. MOFI.InitMCObjectFileInfo(TT, /*PIC*/ false, CodeModel::Default, MCCtx);
  71. std::unique_ptr<RecordStreamer> Streamer(new RecordStreamer(MCCtx));
  72. T->createNullTargetStreamer(*Streamer);
  73. std::unique_ptr<MemoryBuffer> Buffer(MemoryBuffer::getMemBuffer(InlineAsm));
  74. SourceMgr SrcMgr;
  75. SrcMgr.AddNewSourceBuffer(std::move(Buffer), SMLoc());
  76. std::unique_ptr<MCAsmParser> Parser(
  77. createMCAsmParser(SrcMgr, MCCtx, *Streamer, *MAI));
  78. MCTargetOptions MCOptions;
  79. std::unique_ptr<MCTargetAsmParser> TAP(
  80. T->createMCAsmParser(*STI, *Parser, *MCII, MCOptions));
  81. if (!TAP)
  82. return;
  83. Parser->setTargetParser(*TAP);
  84. if (Parser->Run(false))
  85. return;
  86. for (auto &KV : *Streamer) {
  87. StringRef Key = KV.first();
  88. RecordStreamer::State Value = KV.second;
  89. uint32_t Res = BasicSymbolRef::SF_None;
  90. switch (Value) {
  91. case RecordStreamer::NeverSeen:
  92. llvm_unreachable("NeverSeen should have been replaced earlier");
  93. case RecordStreamer::DefinedGlobal:
  94. Res |= BasicSymbolRef::SF_Global;
  95. break;
  96. case RecordStreamer::Defined:
  97. break;
  98. case RecordStreamer::Global:
  99. case RecordStreamer::Used:
  100. Res |= BasicSymbolRef::SF_Undefined;
  101. Res |= BasicSymbolRef::SF_Global;
  102. break;
  103. case RecordStreamer::DefinedWeak:
  104. Res |= BasicSymbolRef::SF_Weak;
  105. Res |= BasicSymbolRef::SF_Global;
  106. break;
  107. case RecordStreamer::UndefinedWeak:
  108. Res |= BasicSymbolRef::SF_Weak;
  109. Res |= BasicSymbolRef::SF_Undefined;
  110. }
  111. AsmUndefinedRefs(Key, BasicSymbolRef::Flags(Res));
  112. }
  113. }
  114. IRObjectFile::~IRObjectFile() {
  115. }
  116. static GlobalValue *getGV(DataRefImpl &Symb) {
  117. if ((Symb.p & 3) == 3)
  118. return nullptr;
  119. return reinterpret_cast<GlobalValue*>(Symb.p & ~uintptr_t(3));
  120. }
  121. static uintptr_t skipEmpty(Module::const_alias_iterator I, const Module &M) {
  122. if (I == M.alias_end())
  123. return 3;
  124. const GlobalValue *GV = &*I;
  125. return reinterpret_cast<uintptr_t>(GV) | 2;
  126. }
  127. static uintptr_t skipEmpty(Module::const_global_iterator I, const Module &M) {
  128. if (I == M.global_end())
  129. return skipEmpty(M.alias_begin(), M);
  130. const GlobalValue *GV = &*I;
  131. return reinterpret_cast<uintptr_t>(GV) | 1;
  132. }
  133. static uintptr_t skipEmpty(Module::const_iterator I, const Module &M) {
  134. if (I == M.end())
  135. return skipEmpty(M.global_begin(), M);
  136. const GlobalValue *GV = &*I;
  137. return reinterpret_cast<uintptr_t>(GV) | 0;
  138. }
  139. static unsigned getAsmSymIndex(DataRefImpl Symb) {
  140. assert((Symb.p & uintptr_t(3)) == 3);
  141. uintptr_t Index = Symb.p & ~uintptr_t(3);
  142. Index >>= 2;
  143. return Index;
  144. }
  145. void IRObjectFile::moveSymbolNext(DataRefImpl &Symb) const {
  146. const GlobalValue *GV = getGV(Symb);
  147. uintptr_t Res;
  148. switch (Symb.p & 3) {
  149. case 0: {
  150. Module::const_iterator Iter(static_cast<const Function*>(GV));
  151. ++Iter;
  152. Res = skipEmpty(Iter, *M);
  153. break;
  154. }
  155. case 1: {
  156. Module::const_global_iterator Iter(static_cast<const GlobalVariable*>(GV));
  157. ++Iter;
  158. Res = skipEmpty(Iter, *M);
  159. break;
  160. }
  161. case 2: {
  162. Module::const_alias_iterator Iter(static_cast<const GlobalAlias*>(GV));
  163. ++Iter;
  164. Res = skipEmpty(Iter, *M);
  165. break;
  166. }
  167. case 3: {
  168. unsigned Index = getAsmSymIndex(Symb);
  169. assert(Index < AsmSymbols.size());
  170. ++Index;
  171. Res = (Index << 2) | 3;
  172. break;
  173. }
  174. default:
  175. llvm_unreachable("unreachable case");
  176. }
  177. Symb.p = Res;
  178. }
  179. std::error_code IRObjectFile::printSymbolName(raw_ostream &OS,
  180. DataRefImpl Symb) const {
  181. const GlobalValue *GV = getGV(Symb);
  182. if (!GV) {
  183. unsigned Index = getAsmSymIndex(Symb);
  184. assert(Index <= AsmSymbols.size());
  185. OS << AsmSymbols[Index].first;
  186. return std::error_code();
  187. }
  188. if (GV->hasDLLImportStorageClass())
  189. OS << "__imp_";
  190. if (Mang)
  191. Mang->getNameWithPrefix(OS, GV, false);
  192. else
  193. OS << GV->getName();
  194. return std::error_code();
  195. }
  196. uint32_t IRObjectFile::getSymbolFlags(DataRefImpl Symb) const {
  197. const GlobalValue *GV = getGV(Symb);
  198. if (!GV) {
  199. unsigned Index = getAsmSymIndex(Symb);
  200. assert(Index <= AsmSymbols.size());
  201. return AsmSymbols[Index].second;
  202. }
  203. uint32_t Res = BasicSymbolRef::SF_None;
  204. if (GV->isDeclarationForLinker())
  205. Res |= BasicSymbolRef::SF_Undefined;
  206. else if (GV->hasHiddenVisibility() && !GV->hasLocalLinkage())
  207. Res |= BasicSymbolRef::SF_Hidden;
  208. if (const GlobalVariable *GVar = dyn_cast<GlobalVariable>(GV)) {
  209. if (GVar->isConstant())
  210. Res |= BasicSymbolRef::SF_Const;
  211. }
  212. if (GV->hasPrivateLinkage())
  213. Res |= BasicSymbolRef::SF_FormatSpecific;
  214. if (!GV->hasLocalLinkage())
  215. Res |= BasicSymbolRef::SF_Global;
  216. if (GV->hasCommonLinkage())
  217. Res |= BasicSymbolRef::SF_Common;
  218. if (GV->hasLinkOnceLinkage() || GV->hasWeakLinkage() ||
  219. GV->hasExternalWeakLinkage())
  220. Res |= BasicSymbolRef::SF_Weak;
  221. if (GV->getName().startswith("llvm."))
  222. Res |= BasicSymbolRef::SF_FormatSpecific;
  223. else if (auto *Var = dyn_cast<GlobalVariable>(GV)) {
  224. if (Var->getSection() == "llvm.metadata")
  225. Res |= BasicSymbolRef::SF_FormatSpecific;
  226. }
  227. return Res;
  228. }
  229. GlobalValue *IRObjectFile::getSymbolGV(DataRefImpl Symb) { return getGV(Symb); }
  230. std::unique_ptr<Module> IRObjectFile::takeModule() { return std::move(M); }
  231. basic_symbol_iterator IRObjectFile::symbol_begin_impl() const {
  232. Module::const_iterator I = M->begin();
  233. DataRefImpl Ret;
  234. Ret.p = skipEmpty(I, *M);
  235. return basic_symbol_iterator(BasicSymbolRef(Ret, this));
  236. }
  237. basic_symbol_iterator IRObjectFile::symbol_end_impl() const {
  238. DataRefImpl Ret;
  239. uint64_t NumAsm = AsmSymbols.size();
  240. NumAsm <<= 2;
  241. Ret.p = 3 | NumAsm;
  242. return basic_symbol_iterator(BasicSymbolRef(Ret, this));
  243. }
  244. ErrorOr<MemoryBufferRef> IRObjectFile::findBitcodeInObject(const ObjectFile &Obj) {
  245. for (const SectionRef &Sec : Obj.sections()) {
  246. if (Sec.isBitcode()) {
  247. StringRef SecContents;
  248. if (std::error_code EC = Sec.getContents(SecContents))
  249. return EC;
  250. return MemoryBufferRef(SecContents, Obj.getFileName());
  251. }
  252. }
  253. return object_error::bitcode_section_not_found;
  254. }
  255. ErrorOr<MemoryBufferRef> IRObjectFile::findBitcodeInMemBuffer(MemoryBufferRef Object) {
  256. sys::fs::file_magic Type = sys::fs::identify_magic(Object.getBuffer());
  257. switch (Type) {
  258. case sys::fs::file_magic::bitcode:
  259. return Object;
  260. case sys::fs::file_magic::elf_relocatable:
  261. case sys::fs::file_magic::macho_object:
  262. case sys::fs::file_magic::coff_object: {
  263. Expected<std::unique_ptr<ObjectFile>> ObjFile =
  264. ObjectFile::createObjectFile(Object, Type);
  265. if (!ObjFile)
  266. return errorToErrorCode(ObjFile.takeError());
  267. return findBitcodeInObject(*ObjFile->get());
  268. }
  269. default:
  270. return object_error::invalid_file_type;
  271. }
  272. }
  273. ErrorOr<std::unique_ptr<IRObjectFile>>
  274. llvm::object::IRObjectFile::create(MemoryBufferRef Object,
  275. LLVMContext &Context) {
  276. ErrorOr<MemoryBufferRef> BCOrErr = findBitcodeInMemBuffer(Object);
  277. if (!BCOrErr)
  278. return BCOrErr.getError();
  279. std::unique_ptr<MemoryBuffer> Buff =
  280. MemoryBuffer::getMemBuffer(BCOrErr.get(), false);
  281. ErrorOr<std::unique_ptr<Module>> MOrErr =
  282. getLazyBitcodeModule(std::move(Buff), Context,
  283. /*ShouldLazyLoadMetadata*/ true);
  284. if (std::error_code EC = MOrErr.getError())
  285. return EC;
  286. std::unique_ptr<Module> &M = MOrErr.get();
  287. return llvm::make_unique<IRObjectFile>(BCOrErr.get(), std::move(M));
  288. }