//===- ModuleSymbolTable.cpp - symbol table for in-memory IR --------------===//
//
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//
//===----------------------------------------------------------------------===//
//
// This class represents a symbol table built from in-memory IR. It provides
// access to GlobalValues and should only be used if such access is required
// (e.g. in the LTO implementation).
//
//===----------------------------------------------------------------------===//
1409467b48Spatrick 
1509467b48Spatrick #include "llvm/Object/ModuleSymbolTable.h"
1609467b48Spatrick #include "RecordStreamer.h"
1709467b48Spatrick #include "llvm/ADT/STLExtras.h"
1809467b48Spatrick #include "llvm/ADT/StringMap.h"
1909467b48Spatrick #include "llvm/ADT/StringRef.h"
2009467b48Spatrick #include "llvm/ADT/Triple.h"
2109467b48Spatrick #include "llvm/IR/Function.h"
2209467b48Spatrick #include "llvm/IR/GlobalAlias.h"
2309467b48Spatrick #include "llvm/IR/GlobalValue.h"
2409467b48Spatrick #include "llvm/IR/GlobalVariable.h"
25097a140dSpatrick #include "llvm/IR/InlineAsm.h"
2609467b48Spatrick #include "llvm/IR/Module.h"
2709467b48Spatrick #include "llvm/MC/MCAsmInfo.h"
2809467b48Spatrick #include "llvm/MC/MCContext.h"
2909467b48Spatrick #include "llvm/MC/MCInstrInfo.h"
3009467b48Spatrick #include "llvm/MC/MCObjectFileInfo.h"
3109467b48Spatrick #include "llvm/MC/MCParser/MCAsmParser.h"
3209467b48Spatrick #include "llvm/MC/MCParser/MCTargetAsmParser.h"
3309467b48Spatrick #include "llvm/MC/MCRegisterInfo.h"
3409467b48Spatrick #include "llvm/MC/MCSubtargetInfo.h"
3509467b48Spatrick #include "llvm/MC/MCSymbol.h"
3609467b48Spatrick #include "llvm/MC/MCTargetOptions.h"
37*d415bd75Srobert #include "llvm/MC/TargetRegistry.h"
3809467b48Spatrick #include "llvm/Object/SymbolicFile.h"
3909467b48Spatrick #include "llvm/Support/Casting.h"
4009467b48Spatrick #include "llvm/Support/ErrorHandling.h"
4109467b48Spatrick #include "llvm/Support/MemoryBuffer.h"
4209467b48Spatrick #include "llvm/Support/SMLoc.h"
4309467b48Spatrick #include "llvm/Support/SourceMgr.h"
4409467b48Spatrick #include "llvm/Support/raw_ostream.h"
4509467b48Spatrick #include <algorithm>
4609467b48Spatrick #include <cassert>
4709467b48Spatrick #include <cstdint>
4809467b48Spatrick #include <memory>
4909467b48Spatrick #include <string>
5009467b48Spatrick 
5109467b48Spatrick using namespace llvm;
5209467b48Spatrick using namespace object;
5309467b48Spatrick 
addModule(Module * M)5409467b48Spatrick void ModuleSymbolTable::addModule(Module *M) {
5509467b48Spatrick   if (FirstMod)
5609467b48Spatrick     assert(FirstMod->getTargetTriple() == M->getTargetTriple());
5709467b48Spatrick   else
5809467b48Spatrick     FirstMod = M;
5909467b48Spatrick 
6009467b48Spatrick   for (GlobalValue &GV : M->global_values())
6109467b48Spatrick     SymTab.push_back(&GV);
6209467b48Spatrick 
6309467b48Spatrick   CollectAsmSymbols(*M, [this](StringRef Name, BasicSymbolRef::Flags Flags) {
64097a140dSpatrick     SymTab.push_back(new (AsmSymbols.Allocate())
65097a140dSpatrick                          AsmSymbol(std::string(Name), Flags));
6609467b48Spatrick   });
6709467b48Spatrick }
6809467b48Spatrick 
6909467b48Spatrick static void
initializeRecordStreamer(const Module & M,function_ref<void (RecordStreamer &)> Init)7009467b48Spatrick initializeRecordStreamer(const Module &M,
7109467b48Spatrick                          function_ref<void(RecordStreamer &)> Init) {
7209467b48Spatrick   StringRef InlineAsm = M.getModuleInlineAsm();
7309467b48Spatrick   if (InlineAsm.empty())
7409467b48Spatrick     return;
7509467b48Spatrick 
7609467b48Spatrick   std::string Err;
7709467b48Spatrick   const Triple TT(M.getTargetTriple());
7809467b48Spatrick   const Target *T = TargetRegistry::lookupTarget(TT.str(), Err);
7909467b48Spatrick   assert(T && T->hasMCAsmParser());
8009467b48Spatrick 
8109467b48Spatrick   std::unique_ptr<MCRegisterInfo> MRI(T->createMCRegInfo(TT.str()));
8209467b48Spatrick   if (!MRI)
8309467b48Spatrick     return;
8409467b48Spatrick 
8509467b48Spatrick   MCTargetOptions MCOptions;
8609467b48Spatrick   std::unique_ptr<MCAsmInfo> MAI(T->createMCAsmInfo(*MRI, TT.str(), MCOptions));
8709467b48Spatrick   if (!MAI)
8809467b48Spatrick     return;
8909467b48Spatrick 
9009467b48Spatrick   std::unique_ptr<MCSubtargetInfo> STI(
9109467b48Spatrick       T->createMCSubtargetInfo(TT.str(), "", ""));
9209467b48Spatrick   if (!STI)
9309467b48Spatrick     return;
9409467b48Spatrick 
9509467b48Spatrick   std::unique_ptr<MCInstrInfo> MCII(T->createMCInstrInfo());
9609467b48Spatrick   if (!MCII)
9709467b48Spatrick     return;
9809467b48Spatrick 
9909467b48Spatrick   std::unique_ptr<MemoryBuffer> Buffer(MemoryBuffer::getMemBuffer(InlineAsm));
10009467b48Spatrick   SourceMgr SrcMgr;
10109467b48Spatrick   SrcMgr.AddNewSourceBuffer(std::move(Buffer), SMLoc());
10273471bf0Spatrick 
10373471bf0Spatrick   MCContext MCCtx(TT, MAI.get(), MRI.get(), STI.get(), &SrcMgr);
10473471bf0Spatrick   std::unique_ptr<MCObjectFileInfo> MOFI(
10573471bf0Spatrick       T->createMCObjectFileInfo(MCCtx, /*PIC=*/false));
10673471bf0Spatrick   MOFI->setSDKVersion(M.getSDKVersion());
10773471bf0Spatrick   MCCtx.setObjectFileInfo(MOFI.get());
10873471bf0Spatrick   RecordStreamer Streamer(MCCtx, M);
10973471bf0Spatrick   T->createNullTargetStreamer(Streamer);
11073471bf0Spatrick 
11109467b48Spatrick   std::unique_ptr<MCAsmParser> Parser(
11209467b48Spatrick       createMCAsmParser(SrcMgr, MCCtx, Streamer, *MAI));
11309467b48Spatrick 
11409467b48Spatrick   std::unique_ptr<MCTargetAsmParser> TAP(
11509467b48Spatrick       T->createMCAsmParser(*STI, *Parser, *MCII, MCOptions));
11609467b48Spatrick   if (!TAP)
11709467b48Spatrick     return;
11809467b48Spatrick 
119097a140dSpatrick   // Module-level inline asm is assumed to use At&t syntax (see
120097a140dSpatrick   // AsmPrinter::doInitialization()).
121097a140dSpatrick   Parser->setAssemblerDialect(InlineAsm::AD_ATT);
122097a140dSpatrick 
12309467b48Spatrick   Parser->setTargetParser(*TAP);
12409467b48Spatrick   if (Parser->Run(false))
12509467b48Spatrick     return;
12609467b48Spatrick 
12709467b48Spatrick   Init(Streamer);
12809467b48Spatrick }
12909467b48Spatrick 
CollectAsmSymbols(const Module & M,function_ref<void (StringRef,BasicSymbolRef::Flags)> AsmSymbol)13009467b48Spatrick void ModuleSymbolTable::CollectAsmSymbols(
13109467b48Spatrick     const Module &M,
13209467b48Spatrick     function_ref<void(StringRef, BasicSymbolRef::Flags)> AsmSymbol) {
13309467b48Spatrick   initializeRecordStreamer(M, [&](RecordStreamer &Streamer) {
13409467b48Spatrick     Streamer.flushSymverDirectives();
13509467b48Spatrick 
13609467b48Spatrick     for (auto &KV : Streamer) {
13709467b48Spatrick       StringRef Key = KV.first();
13809467b48Spatrick       RecordStreamer::State Value = KV.second;
13909467b48Spatrick       // FIXME: For now we just assume that all asm symbols are executable.
14009467b48Spatrick       uint32_t Res = BasicSymbolRef::SF_Executable;
14109467b48Spatrick       switch (Value) {
14209467b48Spatrick       case RecordStreamer::NeverSeen:
14309467b48Spatrick         llvm_unreachable("NeverSeen should have been replaced earlier");
14409467b48Spatrick       case RecordStreamer::DefinedGlobal:
14509467b48Spatrick         Res |= BasicSymbolRef::SF_Global;
14609467b48Spatrick         break;
14709467b48Spatrick       case RecordStreamer::Defined:
14809467b48Spatrick         break;
14909467b48Spatrick       case RecordStreamer::Global:
15009467b48Spatrick       case RecordStreamer::Used:
15109467b48Spatrick         Res |= BasicSymbolRef::SF_Undefined;
15209467b48Spatrick         Res |= BasicSymbolRef::SF_Global;
15309467b48Spatrick         break;
15409467b48Spatrick       case RecordStreamer::DefinedWeak:
15509467b48Spatrick         Res |= BasicSymbolRef::SF_Weak;
15609467b48Spatrick         Res |= BasicSymbolRef::SF_Global;
15709467b48Spatrick         break;
15809467b48Spatrick       case RecordStreamer::UndefinedWeak:
15909467b48Spatrick         Res |= BasicSymbolRef::SF_Weak;
16009467b48Spatrick         Res |= BasicSymbolRef::SF_Undefined;
16109467b48Spatrick       }
16209467b48Spatrick       AsmSymbol(Key, BasicSymbolRef::Flags(Res));
16309467b48Spatrick     }
16409467b48Spatrick   });
16509467b48Spatrick }
16609467b48Spatrick 
CollectAsmSymvers(const Module & M,function_ref<void (StringRef,StringRef)> AsmSymver)16709467b48Spatrick void ModuleSymbolTable::CollectAsmSymvers(
16809467b48Spatrick     const Module &M, function_ref<void(StringRef, StringRef)> AsmSymver) {
16909467b48Spatrick   initializeRecordStreamer(M, [&](RecordStreamer &Streamer) {
17009467b48Spatrick     for (auto &KV : Streamer.symverAliases())
17109467b48Spatrick       for (auto &Alias : KV.second)
17209467b48Spatrick         AsmSymver(KV.first->getName(), Alias);
17309467b48Spatrick   });
17409467b48Spatrick }
17509467b48Spatrick 
printSymbolName(raw_ostream & OS,Symbol S) const17609467b48Spatrick void ModuleSymbolTable::printSymbolName(raw_ostream &OS, Symbol S) const {
17709467b48Spatrick   if (S.is<AsmSymbol *>()) {
17809467b48Spatrick     OS << S.get<AsmSymbol *>()->first;
17909467b48Spatrick     return;
18009467b48Spatrick   }
18109467b48Spatrick 
18209467b48Spatrick   auto *GV = S.get<GlobalValue *>();
18309467b48Spatrick   if (GV->hasDLLImportStorageClass())
18409467b48Spatrick     OS << "__imp_";
18509467b48Spatrick 
18609467b48Spatrick   Mang.getNameWithPrefix(OS, GV, false);
18709467b48Spatrick }
18809467b48Spatrick 
getSymbolFlags(Symbol S) const18909467b48Spatrick uint32_t ModuleSymbolTable::getSymbolFlags(Symbol S) const {
19009467b48Spatrick   if (S.is<AsmSymbol *>())
19109467b48Spatrick     return S.get<AsmSymbol *>()->second;
19209467b48Spatrick 
19309467b48Spatrick   auto *GV = S.get<GlobalValue *>();
19409467b48Spatrick 
19509467b48Spatrick   uint32_t Res = BasicSymbolRef::SF_None;
19609467b48Spatrick   if (GV->isDeclarationForLinker())
19709467b48Spatrick     Res |= BasicSymbolRef::SF_Undefined;
19809467b48Spatrick   else if (GV->hasHiddenVisibility() && !GV->hasLocalLinkage())
19909467b48Spatrick     Res |= BasicSymbolRef::SF_Hidden;
20009467b48Spatrick   if (const GlobalVariable *GVar = dyn_cast<GlobalVariable>(GV)) {
20109467b48Spatrick     if (GVar->isConstant())
20209467b48Spatrick       Res |= BasicSymbolRef::SF_Const;
20309467b48Spatrick   }
204*d415bd75Srobert   if (const GlobalObject *GO = GV->getAliaseeObject())
205*d415bd75Srobert     if (isa<Function>(GO) || isa<GlobalIFunc>(GO))
20609467b48Spatrick       Res |= BasicSymbolRef::SF_Executable;
20709467b48Spatrick   if (isa<GlobalAlias>(GV))
20809467b48Spatrick     Res |= BasicSymbolRef::SF_Indirect;
20909467b48Spatrick   if (GV->hasPrivateLinkage())
21009467b48Spatrick     Res |= BasicSymbolRef::SF_FormatSpecific;
21109467b48Spatrick   if (!GV->hasLocalLinkage())
21209467b48Spatrick     Res |= BasicSymbolRef::SF_Global;
21309467b48Spatrick   if (GV->hasCommonLinkage())
21409467b48Spatrick     Res |= BasicSymbolRef::SF_Common;
21509467b48Spatrick   if (GV->hasLinkOnceLinkage() || GV->hasWeakLinkage() ||
21609467b48Spatrick       GV->hasExternalWeakLinkage())
21709467b48Spatrick     Res |= BasicSymbolRef::SF_Weak;
21809467b48Spatrick 
21909467b48Spatrick   if (GV->getName().startswith("llvm."))
22009467b48Spatrick     Res |= BasicSymbolRef::SF_FormatSpecific;
22109467b48Spatrick   else if (auto *Var = dyn_cast<GlobalVariable>(GV)) {
22209467b48Spatrick     if (Var->getSection() == "llvm.metadata")
22309467b48Spatrick       Res |= BasicSymbolRef::SF_FormatSpecific;
22409467b48Spatrick   }
22509467b48Spatrick 
22609467b48Spatrick   return Res;
22709467b48Spatrick }
228