1 //===- FunctionImport.cpp - ThinLTO Summary-based Function Import ---------===//
2 //
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6 //
7 //===----------------------------------------------------------------------===//
8 //
9 // This file implements Function import based on summaries.
10 //
11 //===----------------------------------------------------------------------===//
12
13 #include "llvm/Transforms/IPO/FunctionImport.h"
14 #include "llvm/ADT/ArrayRef.h"
15 #include "llvm/ADT/STLExtras.h"
16 #include "llvm/ADT/SetVector.h"
17 #include "llvm/ADT/SmallVector.h"
18 #include "llvm/ADT/Statistic.h"
19 #include "llvm/ADT/StringMap.h"
20 #include "llvm/ADT/StringRef.h"
21 #include "llvm/Bitcode/BitcodeReader.h"
22 #include "llvm/IR/AutoUpgrade.h"
23 #include "llvm/IR/Constants.h"
24 #include "llvm/IR/Function.h"
25 #include "llvm/IR/GlobalAlias.h"
26 #include "llvm/IR/GlobalObject.h"
27 #include "llvm/IR/GlobalValue.h"
28 #include "llvm/IR/GlobalVariable.h"
29 #include "llvm/IR/Metadata.h"
30 #include "llvm/IR/Module.h"
31 #include "llvm/IR/ModuleSummaryIndex.h"
32 #include "llvm/IRReader/IRReader.h"
33 #include "llvm/InitializePasses.h"
34 #include "llvm/Linker/IRMover.h"
35 #include "llvm/Pass.h"
36 #include "llvm/Support/Casting.h"
37 #include "llvm/Support/CommandLine.h"
38 #include "llvm/Support/Debug.h"
39 #include "llvm/Support/Errc.h"
40 #include "llvm/Support/Error.h"
41 #include "llvm/Support/ErrorHandling.h"
42 #include "llvm/Support/FileSystem.h"
43 #include "llvm/Support/SourceMgr.h"
44 #include "llvm/Support/raw_ostream.h"
45 #include "llvm/Transforms/IPO/Internalize.h"
46 #include "llvm/Transforms/Utils/Cloning.h"
47 #include "llvm/Transforms/Utils/FunctionImportUtils.h"
48 #include "llvm/Transforms/Utils/ValueMapper.h"
49 #include <cassert>
50 #include <memory>
51 #include <set>
52 #include <string>
53 #include <system_error>
54 #include <tuple>
55 #include <utility>
56
57 using namespace llvm;
58
59 #define DEBUG_TYPE "function-import"
60
61 STATISTIC(NumImportedFunctionsThinLink,
62 "Number of functions thin link decided to import");
63 STATISTIC(NumImportedHotFunctionsThinLink,
64 "Number of hot functions thin link decided to import");
65 STATISTIC(NumImportedCriticalFunctionsThinLink,
66 "Number of critical functions thin link decided to import");
67 STATISTIC(NumImportedGlobalVarsThinLink,
68 "Number of global variables thin link decided to import");
69 STATISTIC(NumImportedFunctions, "Number of functions imported in backend");
70 STATISTIC(NumImportedGlobalVars,
71 "Number of global variables imported in backend");
72 STATISTIC(NumImportedModules, "Number of modules imported from");
73 STATISTIC(NumDeadSymbols, "Number of dead stripped symbols in index");
74 STATISTIC(NumLiveSymbols, "Number of live symbols in index");
75
76 /// Limit on instruction count of imported functions.
77 static cl::opt<unsigned> ImportInstrLimit(
78 "import-instr-limit", cl::init(100), cl::Hidden, cl::value_desc("N"),
79 cl::desc("Only import functions with less than N instructions"));
80
81 static cl::opt<int> ImportCutoff(
82 "import-cutoff", cl::init(-1), cl::Hidden, cl::value_desc("N"),
83 cl::desc("Only import first N functions if N>=0 (default -1)"));
84
85 static cl::opt<bool>
86 ForceImportAll("force-import-all", cl::init(false), cl::Hidden,
87 cl::desc("Import functions with noinline attribute"));
88
89 static cl::opt<float>
90 ImportInstrFactor("import-instr-evolution-factor", cl::init(0.7),
91 cl::Hidden, cl::value_desc("x"),
92 cl::desc("As we import functions, multiply the "
93 "`import-instr-limit` threshold by this factor "
94 "before processing newly imported functions"));
95
96 static cl::opt<float> ImportHotInstrFactor(
97 "import-hot-evolution-factor", cl::init(1.0), cl::Hidden,
98 cl::value_desc("x"),
99 cl::desc("As we import functions called from hot callsite, multiply the "
100 "`import-instr-limit` threshold by this factor "
101 "before processing newly imported functions"));
102
103 static cl::opt<float> ImportHotMultiplier(
104 "import-hot-multiplier", cl::init(10.0), cl::Hidden, cl::value_desc("x"),
105 cl::desc("Multiply the `import-instr-limit` threshold for hot callsites"));
106
107 static cl::opt<float> ImportCriticalMultiplier(
108 "import-critical-multiplier", cl::init(100.0), cl::Hidden,
109 cl::value_desc("x"),
110 cl::desc(
111 "Multiply the `import-instr-limit` threshold for critical callsites"));
112
113 // FIXME: This multiplier was not really tuned up.
114 static cl::opt<float> ImportColdMultiplier(
115 "import-cold-multiplier", cl::init(0), cl::Hidden, cl::value_desc("N"),
116 cl::desc("Multiply the `import-instr-limit` threshold for cold callsites"));
117
118 static cl::opt<bool> PrintImports("print-imports", cl::init(false), cl::Hidden,
119 cl::desc("Print imported functions"));
120
121 static cl::opt<bool> PrintImportFailures(
122 "print-import-failures", cl::init(false), cl::Hidden,
123 cl::desc("Print information for functions rejected for importing"));
124
125 static cl::opt<bool> ComputeDead("compute-dead", cl::init(true), cl::Hidden,
126 cl::desc("Compute dead symbols"));
127
128 static cl::opt<bool> EnableImportMetadata(
129 "enable-import-metadata", cl::init(false), cl::Hidden,
130 cl::desc("Enable import metadata like 'thinlto_src_module'"));
131
132 /// Summary file to use for function importing when using -function-import from
133 /// the command line.
134 static cl::opt<std::string>
135 SummaryFile("summary-file",
136 cl::desc("The summary file to use for function importing."));
137
138 /// Used when testing importing from distributed indexes via opt
139 // -function-import.
140 static cl::opt<bool>
141 ImportAllIndex("import-all-index",
142 cl::desc("Import all external functions in index."));
143
144 // Load lazily a module from \p FileName in \p Context.
loadFile(const std::string & FileName,LLVMContext & Context)145 static std::unique_ptr<Module> loadFile(const std::string &FileName,
146 LLVMContext &Context) {
147 SMDiagnostic Err;
148 LLVM_DEBUG(dbgs() << "Loading '" << FileName << "'\n");
149 // Metadata isn't loaded until functions are imported, to minimize
150 // the memory overhead.
151 std::unique_ptr<Module> Result =
152 getLazyIRFileModule(FileName, Err, Context,
153 /* ShouldLazyLoadMetadata = */ true);
154 if (!Result) {
155 Err.print("function-import", errs());
156 report_fatal_error("Abort");
157 }
158
159 return Result;
160 }
161
162 /// Given a list of possible callee implementation for a call site, select one
163 /// that fits the \p Threshold.
164 ///
165 /// FIXME: select "best" instead of first that fits. But what is "best"?
166 /// - The smallest: more likely to be inlined.
167 /// - The one with the least outgoing edges (already well optimized).
168 /// - One from a module already being imported from in order to reduce the
169 /// number of source modules parsed/linked.
170 /// - One that has PGO data attached.
171 /// - [insert you fancy metric here]
172 static const GlobalValueSummary *
selectCallee(const ModuleSummaryIndex & Index,ArrayRef<std::unique_ptr<GlobalValueSummary>> CalleeSummaryList,unsigned Threshold,StringRef CallerModulePath,FunctionImporter::ImportFailureReason & Reason,GlobalValue::GUID GUID)173 selectCallee(const ModuleSummaryIndex &Index,
174 ArrayRef<std::unique_ptr<GlobalValueSummary>> CalleeSummaryList,
175 unsigned Threshold, StringRef CallerModulePath,
176 FunctionImporter::ImportFailureReason &Reason,
177 GlobalValue::GUID GUID) {
178 Reason = FunctionImporter::ImportFailureReason::None;
179 auto It = llvm::find_if(
180 CalleeSummaryList,
181 [&](const std::unique_ptr<GlobalValueSummary> &SummaryPtr) {
182 auto *GVSummary = SummaryPtr.get();
183 if (!Index.isGlobalValueLive(GVSummary)) {
184 Reason = FunctionImporter::ImportFailureReason::NotLive;
185 return false;
186 }
187
188 if (GlobalValue::isInterposableLinkage(GVSummary->linkage())) {
189 Reason = FunctionImporter::ImportFailureReason::InterposableLinkage;
190 // There is no point in importing these, we can't inline them
191 return false;
192 }
193
194 auto *Summary = cast<FunctionSummary>(GVSummary->getBaseObject());
195
196 // If this is a local function, make sure we import the copy
197 // in the caller's module. The only time a local function can
198 // share an entry in the index is if there is a local with the same name
199 // in another module that had the same source file name (in a different
200 // directory), where each was compiled in their own directory so there
201 // was not distinguishing path.
202 // However, do the import from another module if there is only one
203 // entry in the list - in that case this must be a reference due
204 // to indirect call profile data, since a function pointer can point to
205 // a local in another module.
206 if (GlobalValue::isLocalLinkage(Summary->linkage()) &&
207 CalleeSummaryList.size() > 1 &&
208 Summary->modulePath() != CallerModulePath) {
209 Reason =
210 FunctionImporter::ImportFailureReason::LocalLinkageNotInModule;
211 return false;
212 }
213
214 if ((Summary->instCount() > Threshold) &&
215 !Summary->fflags().AlwaysInline && !ForceImportAll) {
216 Reason = FunctionImporter::ImportFailureReason::TooLarge;
217 return false;
218 }
219
220 // Skip if it isn't legal to import (e.g. may reference unpromotable
221 // locals).
222 if (Summary->notEligibleToImport()) {
223 Reason = FunctionImporter::ImportFailureReason::NotEligible;
224 return false;
225 }
226
227 // Don't bother importing if we can't inline it anyway.
228 if (Summary->fflags().NoInline && !ForceImportAll) {
229 Reason = FunctionImporter::ImportFailureReason::NoInline;
230 return false;
231 }
232
233 return true;
234 });
235 if (It == CalleeSummaryList.end())
236 return nullptr;
237
238 return cast<GlobalValueSummary>(It->get());
239 }
240
241 namespace {
242
243 using EdgeInfo =
244 std::tuple<const GlobalValueSummary *, unsigned /* Threshold */>;
245
246 } // anonymous namespace
247
shouldImportGlobal(const ValueInfo & VI,const GVSummaryMapTy & DefinedGVSummaries)248 static bool shouldImportGlobal(const ValueInfo &VI,
249 const GVSummaryMapTy &DefinedGVSummaries) {
250 const auto &GVS = DefinedGVSummaries.find(VI.getGUID());
251 if (GVS == DefinedGVSummaries.end())
252 return true;
253 // We should not skip import if the module contains a definition with
254 // interposable linkage type. This is required for correctness in
255 // the situation with two following conditions:
256 // * the def with interposable linkage is non-prevailing,
257 // * there is a prevailing def available for import and marked read-only.
258 // In this case, the non-prevailing def will be converted to a declaration,
259 // while the prevailing one becomes internal, thus no definitions will be
260 // available for linking. In order to prevent undefined symbol link error,
261 // the prevailing definition must be imported.
262 // FIXME: Consider adding a check that the suitable prevailing definition
263 // exists and marked read-only.
264 if (VI.getSummaryList().size() > 1 &&
265 GlobalValue::isInterposableLinkage(GVS->second->linkage()))
266 return true;
267
268 return false;
269 }
270
computeImportForReferencedGlobals(const GlobalValueSummary & Summary,const ModuleSummaryIndex & Index,const GVSummaryMapTy & DefinedGVSummaries,SmallVectorImpl<EdgeInfo> & Worklist,FunctionImporter::ImportMapTy & ImportList,StringMap<FunctionImporter::ExportSetTy> * ExportLists)271 static void computeImportForReferencedGlobals(
272 const GlobalValueSummary &Summary, const ModuleSummaryIndex &Index,
273 const GVSummaryMapTy &DefinedGVSummaries,
274 SmallVectorImpl<EdgeInfo> &Worklist,
275 FunctionImporter::ImportMapTy &ImportList,
276 StringMap<FunctionImporter::ExportSetTy> *ExportLists) {
277 for (const auto &VI : Summary.refs()) {
278 if (!shouldImportGlobal(VI, DefinedGVSummaries)) {
279 LLVM_DEBUG(
280 dbgs() << "Ref ignored! Target already in destination module.\n");
281 continue;
282 }
283
284 LLVM_DEBUG(dbgs() << " ref -> " << VI << "\n");
285
286 // If this is a local variable, make sure we import the copy
287 // in the caller's module. The only time a local variable can
288 // share an entry in the index is if there is a local with the same name
289 // in another module that had the same source file name (in a different
290 // directory), where each was compiled in their own directory so there
291 // was not distinguishing path.
292 auto LocalNotInModule = [&](const GlobalValueSummary *RefSummary) -> bool {
293 return GlobalValue::isLocalLinkage(RefSummary->linkage()) &&
294 RefSummary->modulePath() != Summary.modulePath();
295 };
296
297 for (const auto &RefSummary : VI.getSummaryList())
298 if (isa<GlobalVarSummary>(RefSummary.get()) &&
299 Index.canImportGlobalVar(RefSummary.get(), /* AnalyzeRefs */ true) &&
300 !LocalNotInModule(RefSummary.get())) {
301 auto ILI = ImportList[RefSummary->modulePath()].insert(VI.getGUID());
302 // Only update stat and exports if we haven't already imported this
303 // variable.
304 if (!ILI.second)
305 break;
306 NumImportedGlobalVarsThinLink++;
307 // Any references made by this variable will be marked exported later,
308 // in ComputeCrossModuleImport, after import decisions are complete,
309 // which is more efficient than adding them here.
310 if (ExportLists)
311 (*ExportLists)[RefSummary->modulePath()].insert(VI);
312
313 // If variable is not writeonly we attempt to recursively analyze
314 // its references in order to import referenced constants.
315 if (!Index.isWriteOnly(cast<GlobalVarSummary>(RefSummary.get())))
316 Worklist.emplace_back(RefSummary.get(), 0);
317 break;
318 }
319 }
320 }
321
322 static const char *
getFailureName(FunctionImporter::ImportFailureReason Reason)323 getFailureName(FunctionImporter::ImportFailureReason Reason) {
324 switch (Reason) {
325 case FunctionImporter::ImportFailureReason::None:
326 return "None";
327 case FunctionImporter::ImportFailureReason::GlobalVar:
328 return "GlobalVar";
329 case FunctionImporter::ImportFailureReason::NotLive:
330 return "NotLive";
331 case FunctionImporter::ImportFailureReason::TooLarge:
332 return "TooLarge";
333 case FunctionImporter::ImportFailureReason::InterposableLinkage:
334 return "InterposableLinkage";
335 case FunctionImporter::ImportFailureReason::LocalLinkageNotInModule:
336 return "LocalLinkageNotInModule";
337 case FunctionImporter::ImportFailureReason::NotEligible:
338 return "NotEligible";
339 case FunctionImporter::ImportFailureReason::NoInline:
340 return "NoInline";
341 }
342 llvm_unreachable("invalid reason");
343 }
344
345 /// Compute the list of functions to import for a given caller. Mark these
346 /// imported functions and the symbols they reference in their source module as
347 /// exported from their source module.
computeImportForFunction(const FunctionSummary & Summary,const ModuleSummaryIndex & Index,const unsigned Threshold,const GVSummaryMapTy & DefinedGVSummaries,SmallVectorImpl<EdgeInfo> & Worklist,FunctionImporter::ImportMapTy & ImportList,StringMap<FunctionImporter::ExportSetTy> * ExportLists,FunctionImporter::ImportThresholdsTy & ImportThresholds)348 static void computeImportForFunction(
349 const FunctionSummary &Summary, const ModuleSummaryIndex &Index,
350 const unsigned Threshold, const GVSummaryMapTy &DefinedGVSummaries,
351 SmallVectorImpl<EdgeInfo> &Worklist,
352 FunctionImporter::ImportMapTy &ImportList,
353 StringMap<FunctionImporter::ExportSetTy> *ExportLists,
354 FunctionImporter::ImportThresholdsTy &ImportThresholds) {
355 computeImportForReferencedGlobals(Summary, Index, DefinedGVSummaries,
356 Worklist, ImportList, ExportLists);
357 static int ImportCount = 0;
358 for (const auto &Edge : Summary.calls()) {
359 ValueInfo VI = Edge.first;
360 LLVM_DEBUG(dbgs() << " edge -> " << VI << " Threshold:" << Threshold
361 << "\n");
362
363 if (ImportCutoff >= 0 && ImportCount >= ImportCutoff) {
364 LLVM_DEBUG(dbgs() << "ignored! import-cutoff value of " << ImportCutoff
365 << " reached.\n");
366 continue;
367 }
368
369 if (DefinedGVSummaries.count(VI.getGUID())) {
370 // FIXME: Consider not skipping import if the module contains
371 // a non-prevailing def with interposable linkage. The prevailing copy
372 // can safely be imported (see shouldImportGlobal()).
373 LLVM_DEBUG(dbgs() << "ignored! Target already in destination module.\n");
374 continue;
375 }
376
377 auto GetBonusMultiplier = [](CalleeInfo::HotnessType Hotness) -> float {
378 if (Hotness == CalleeInfo::HotnessType::Hot)
379 return ImportHotMultiplier;
380 if (Hotness == CalleeInfo::HotnessType::Cold)
381 return ImportColdMultiplier;
382 if (Hotness == CalleeInfo::HotnessType::Critical)
383 return ImportCriticalMultiplier;
384 return 1.0;
385 };
386
387 const auto NewThreshold =
388 Threshold * GetBonusMultiplier(Edge.second.getHotness());
389
390 auto IT = ImportThresholds.insert(std::make_pair(
391 VI.getGUID(), std::make_tuple(NewThreshold, nullptr, nullptr)));
392 bool PreviouslyVisited = !IT.second;
393 auto &ProcessedThreshold = std::get<0>(IT.first->second);
394 auto &CalleeSummary = std::get<1>(IT.first->second);
395 auto &FailureInfo = std::get<2>(IT.first->second);
396
397 bool IsHotCallsite =
398 Edge.second.getHotness() == CalleeInfo::HotnessType::Hot;
399 bool IsCriticalCallsite =
400 Edge.second.getHotness() == CalleeInfo::HotnessType::Critical;
401
402 const FunctionSummary *ResolvedCalleeSummary = nullptr;
403 if (CalleeSummary) {
404 assert(PreviouslyVisited);
405 // Since the traversal of the call graph is DFS, we can revisit a function
406 // a second time with a higher threshold. In this case, it is added back
407 // to the worklist with the new threshold (so that its own callee chains
408 // can be considered with the higher threshold).
409 if (NewThreshold <= ProcessedThreshold) {
410 LLVM_DEBUG(
411 dbgs() << "ignored! Target was already imported with Threshold "
412 << ProcessedThreshold << "\n");
413 continue;
414 }
415 // Update with new larger threshold.
416 ProcessedThreshold = NewThreshold;
417 ResolvedCalleeSummary = cast<FunctionSummary>(CalleeSummary);
418 } else {
419 // If we already rejected importing a callee at the same or higher
420 // threshold, don't waste time calling selectCallee.
421 if (PreviouslyVisited && NewThreshold <= ProcessedThreshold) {
422 LLVM_DEBUG(
423 dbgs() << "ignored! Target was already rejected with Threshold "
424 << ProcessedThreshold << "\n");
425 if (PrintImportFailures) {
426 assert(FailureInfo &&
427 "Expected FailureInfo for previously rejected candidate");
428 FailureInfo->Attempts++;
429 }
430 continue;
431 }
432
433 FunctionImporter::ImportFailureReason Reason;
434 CalleeSummary = selectCallee(Index, VI.getSummaryList(), NewThreshold,
435 Summary.modulePath(), Reason, VI.getGUID());
436 if (!CalleeSummary) {
437 // Update with new larger threshold if this was a retry (otherwise
438 // we would have already inserted with NewThreshold above). Also
439 // update failure info if requested.
440 if (PreviouslyVisited) {
441 ProcessedThreshold = NewThreshold;
442 if (PrintImportFailures) {
443 assert(FailureInfo &&
444 "Expected FailureInfo for previously rejected candidate");
445 FailureInfo->Reason = Reason;
446 FailureInfo->Attempts++;
447 FailureInfo->MaxHotness =
448 std::max(FailureInfo->MaxHotness, Edge.second.getHotness());
449 }
450 } else if (PrintImportFailures) {
451 assert(!FailureInfo &&
452 "Expected no FailureInfo for newly rejected candidate");
453 FailureInfo = std::make_unique<FunctionImporter::ImportFailureInfo>(
454 VI, Edge.second.getHotness(), Reason, 1);
455 }
456 if (ForceImportAll) {
457 std::string Msg = std::string("Failed to import function ") +
458 VI.name().str() + " due to " +
459 getFailureName(Reason);
460 auto Error = make_error<StringError>(
461 Msg, make_error_code(errc::not_supported));
462 logAllUnhandledErrors(std::move(Error), errs(),
463 "Error importing module: ");
464 break;
465 } else {
466 LLVM_DEBUG(dbgs()
467 << "ignored! No qualifying callee with summary found.\n");
468 continue;
469 }
470 }
471
472 // "Resolve" the summary
473 CalleeSummary = CalleeSummary->getBaseObject();
474 ResolvedCalleeSummary = cast<FunctionSummary>(CalleeSummary);
475
476 assert((ResolvedCalleeSummary->fflags().AlwaysInline || ForceImportAll ||
477 (ResolvedCalleeSummary->instCount() <= NewThreshold)) &&
478 "selectCallee() didn't honor the threshold");
479
480 auto ExportModulePath = ResolvedCalleeSummary->modulePath();
481 auto ILI = ImportList[ExportModulePath].insert(VI.getGUID());
482 // We previously decided to import this GUID definition if it was already
483 // inserted in the set of imports from the exporting module.
484 bool PreviouslyImported = !ILI.second;
485 if (!PreviouslyImported) {
486 NumImportedFunctionsThinLink++;
487 if (IsHotCallsite)
488 NumImportedHotFunctionsThinLink++;
489 if (IsCriticalCallsite)
490 NumImportedCriticalFunctionsThinLink++;
491 }
492
493 // Any calls/references made by this function will be marked exported
494 // later, in ComputeCrossModuleImport, after import decisions are
495 // complete, which is more efficient than adding them here.
496 if (ExportLists)
497 (*ExportLists)[ExportModulePath].insert(VI);
498 }
499
500 auto GetAdjustedThreshold = [](unsigned Threshold, bool IsHotCallsite) {
501 // Adjust the threshold for next level of imported functions.
502 // The threshold is different for hot callsites because we can then
503 // inline chains of hot calls.
504 if (IsHotCallsite)
505 return Threshold * ImportHotInstrFactor;
506 return Threshold * ImportInstrFactor;
507 };
508
509 const auto AdjThreshold = GetAdjustedThreshold(Threshold, IsHotCallsite);
510
511 ImportCount++;
512
513 // Insert the newly imported function to the worklist.
514 Worklist.emplace_back(ResolvedCalleeSummary, AdjThreshold);
515 }
516 }
517
518 /// Given the list of globals defined in a module, compute the list of imports
519 /// as well as the list of "exports", i.e. the list of symbols referenced from
520 /// another module (that may require promotion).
ComputeImportForModule(const GVSummaryMapTy & DefinedGVSummaries,const ModuleSummaryIndex & Index,StringRef ModName,FunctionImporter::ImportMapTy & ImportList,StringMap<FunctionImporter::ExportSetTy> * ExportLists=nullptr)521 static void ComputeImportForModule(
522 const GVSummaryMapTy &DefinedGVSummaries, const ModuleSummaryIndex &Index,
523 StringRef ModName, FunctionImporter::ImportMapTy &ImportList,
524 StringMap<FunctionImporter::ExportSetTy> *ExportLists = nullptr) {
525 // Worklist contains the list of function imported in this module, for which
526 // we will analyse the callees and may import further down the callgraph.
527 SmallVector<EdgeInfo, 128> Worklist;
528 FunctionImporter::ImportThresholdsTy ImportThresholds;
529
530 // Populate the worklist with the import for the functions in the current
531 // module
532 for (const auto &GVSummary : DefinedGVSummaries) {
533 #ifndef NDEBUG
534 // FIXME: Change the GVSummaryMapTy to hold ValueInfo instead of GUID
535 // so this map look up (and possibly others) can be avoided.
536 auto VI = Index.getValueInfo(GVSummary.first);
537 #endif
538 if (!Index.isGlobalValueLive(GVSummary.second)) {
539 LLVM_DEBUG(dbgs() << "Ignores Dead GUID: " << VI << "\n");
540 continue;
541 }
542 auto *FuncSummary =
543 dyn_cast<FunctionSummary>(GVSummary.second->getBaseObject());
544 if (!FuncSummary)
545 // Skip import for global variables
546 continue;
547 LLVM_DEBUG(dbgs() << "Initialize import for " << VI << "\n");
548 computeImportForFunction(*FuncSummary, Index, ImportInstrLimit,
549 DefinedGVSummaries, Worklist, ImportList,
550 ExportLists, ImportThresholds);
551 }
552
553 // Process the newly imported functions and add callees to the worklist.
554 while (!Worklist.empty()) {
555 auto GVInfo = Worklist.pop_back_val();
556 auto *Summary = std::get<0>(GVInfo);
557 auto Threshold = std::get<1>(GVInfo);
558
559 if (auto *FS = dyn_cast<FunctionSummary>(Summary))
560 computeImportForFunction(*FS, Index, Threshold, DefinedGVSummaries,
561 Worklist, ImportList, ExportLists,
562 ImportThresholds);
563 else
564 computeImportForReferencedGlobals(*Summary, Index, DefinedGVSummaries,
565 Worklist, ImportList, ExportLists);
566 }
567
568 // Print stats about functions considered but rejected for importing
569 // when requested.
570 if (PrintImportFailures) {
571 dbgs() << "Missed imports into module " << ModName << "\n";
572 for (auto &I : ImportThresholds) {
573 auto &ProcessedThreshold = std::get<0>(I.second);
574 auto &CalleeSummary = std::get<1>(I.second);
575 auto &FailureInfo = std::get<2>(I.second);
576 if (CalleeSummary)
577 continue; // We are going to import.
578 assert(FailureInfo);
579 FunctionSummary *FS = nullptr;
580 if (!FailureInfo->VI.getSummaryList().empty())
581 FS = dyn_cast<FunctionSummary>(
582 FailureInfo->VI.getSummaryList()[0]->getBaseObject());
583 dbgs() << FailureInfo->VI
584 << ": Reason = " << getFailureName(FailureInfo->Reason)
585 << ", Threshold = " << ProcessedThreshold
586 << ", Size = " << (FS ? (int)FS->instCount() : -1)
587 << ", MaxHotness = " << getHotnessName(FailureInfo->MaxHotness)
588 << ", Attempts = " << FailureInfo->Attempts << "\n";
589 }
590 }
591 }
592
593 #ifndef NDEBUG
isGlobalVarSummary(const ModuleSummaryIndex & Index,ValueInfo VI)594 static bool isGlobalVarSummary(const ModuleSummaryIndex &Index, ValueInfo VI) {
595 auto SL = VI.getSummaryList();
596 return SL.empty()
597 ? false
598 : SL[0]->getSummaryKind() == GlobalValueSummary::GlobalVarKind;
599 }
600
isGlobalVarSummary(const ModuleSummaryIndex & Index,GlobalValue::GUID G)601 static bool isGlobalVarSummary(const ModuleSummaryIndex &Index,
602 GlobalValue::GUID G) {
603 if (const auto &VI = Index.getValueInfo(G))
604 return isGlobalVarSummary(Index, VI);
605 return false;
606 }
607
608 template <class T>
numGlobalVarSummaries(const ModuleSummaryIndex & Index,T & Cont)609 static unsigned numGlobalVarSummaries(const ModuleSummaryIndex &Index,
610 T &Cont) {
611 unsigned NumGVS = 0;
612 for (auto &V : Cont)
613 if (isGlobalVarSummary(Index, V))
614 ++NumGVS;
615 return NumGVS;
616 }
617 #endif
618
619 #ifndef NDEBUG
620 static bool
checkVariableImport(const ModuleSummaryIndex & Index,StringMap<FunctionImporter::ImportMapTy> & ImportLists,StringMap<FunctionImporter::ExportSetTy> & ExportLists)621 checkVariableImport(const ModuleSummaryIndex &Index,
622 StringMap<FunctionImporter::ImportMapTy> &ImportLists,
623 StringMap<FunctionImporter::ExportSetTy> &ExportLists) {
624
625 DenseSet<GlobalValue::GUID> FlattenedImports;
626
627 for (auto &ImportPerModule : ImportLists)
628 for (auto &ExportPerModule : ImportPerModule.second)
629 FlattenedImports.insert(ExportPerModule.second.begin(),
630 ExportPerModule.second.end());
631
632 // Checks that all GUIDs of read/writeonly vars we see in export lists
633 // are also in the import lists. Otherwise we my face linker undefs,
634 // because readonly and writeonly vars are internalized in their
635 // source modules.
636 auto IsReadOrWriteOnlyVar = [&](StringRef ModulePath, const ValueInfo &VI) {
637 auto *GVS = dyn_cast_or_null<GlobalVarSummary>(
638 Index.findSummaryInModule(VI, ModulePath));
639 return GVS && (Index.isReadOnly(GVS) || Index.isWriteOnly(GVS));
640 };
641
642 for (auto &ExportPerModule : ExportLists)
643 for (auto &VI : ExportPerModule.second)
644 if (!FlattenedImports.count(VI.getGUID()) &&
645 IsReadOrWriteOnlyVar(ExportPerModule.first(), VI))
646 return false;
647
648 return true;
649 }
650 #endif
651
652 /// Compute all the import and export for every module using the Index.
ComputeCrossModuleImport(const ModuleSummaryIndex & Index,const StringMap<GVSummaryMapTy> & ModuleToDefinedGVSummaries,StringMap<FunctionImporter::ImportMapTy> & ImportLists,StringMap<FunctionImporter::ExportSetTy> & ExportLists)653 void llvm::ComputeCrossModuleImport(
654 const ModuleSummaryIndex &Index,
655 const StringMap<GVSummaryMapTy> &ModuleToDefinedGVSummaries,
656 StringMap<FunctionImporter::ImportMapTy> &ImportLists,
657 StringMap<FunctionImporter::ExportSetTy> &ExportLists) {
658 // For each module that has function defined, compute the import/export lists.
659 for (const auto &DefinedGVSummaries : ModuleToDefinedGVSummaries) {
660 auto &ImportList = ImportLists[DefinedGVSummaries.first()];
661 LLVM_DEBUG(dbgs() << "Computing import for Module '"
662 << DefinedGVSummaries.first() << "'\n");
663 ComputeImportForModule(DefinedGVSummaries.second, Index,
664 DefinedGVSummaries.first(), ImportList,
665 &ExportLists);
666 }
667
668 // When computing imports we only added the variables and functions being
669 // imported to the export list. We also need to mark any references and calls
670 // they make as exported as well. We do this here, as it is more efficient
671 // since we may import the same values multiple times into different modules
672 // during the import computation.
673 for (auto &ELI : ExportLists) {
674 FunctionImporter::ExportSetTy NewExports;
675 const auto &DefinedGVSummaries =
676 ModuleToDefinedGVSummaries.lookup(ELI.first());
677 for (auto &EI : ELI.second) {
678 // Find the copy defined in the exporting module so that we can mark the
679 // values it references in that specific definition as exported.
680 // Below we will add all references and called values, without regard to
681 // whether they are also defined in this module. We subsequently prune the
682 // list to only include those defined in the exporting module, see comment
683 // there as to why.
684 auto DS = DefinedGVSummaries.find(EI.getGUID());
685 // Anything marked exported during the import computation must have been
686 // defined in the exporting module.
687 assert(DS != DefinedGVSummaries.end());
688 auto *S = DS->getSecond();
689 S = S->getBaseObject();
690 if (auto *GVS = dyn_cast<GlobalVarSummary>(S)) {
691 // Export referenced functions and variables. We don't export/promote
692 // objects referenced by writeonly variable initializer, because
693 // we convert such variables initializers to "zeroinitializer".
694 // See processGlobalForThinLTO.
695 if (!Index.isWriteOnly(GVS))
696 for (const auto &VI : GVS->refs())
697 NewExports.insert(VI);
698 } else {
699 auto *FS = cast<FunctionSummary>(S);
700 for (const auto &Edge : FS->calls())
701 NewExports.insert(Edge.first);
702 for (const auto &Ref : FS->refs())
703 NewExports.insert(Ref);
704 }
705 }
706 // Prune list computed above to only include values defined in the exporting
707 // module. We do this after the above insertion since we may hit the same
708 // ref/call target multiple times in above loop, and it is more efficient to
709 // avoid a set lookup each time.
710 for (auto EI = NewExports.begin(); EI != NewExports.end();) {
711 if (!DefinedGVSummaries.count(EI->getGUID()))
712 NewExports.erase(EI++);
713 else
714 ++EI;
715 }
716 ELI.second.insert(NewExports.begin(), NewExports.end());
717 }
718
719 assert(checkVariableImport(Index, ImportLists, ExportLists));
720 #ifndef NDEBUG
721 LLVM_DEBUG(dbgs() << "Import/Export lists for " << ImportLists.size()
722 << " modules:\n");
723 for (auto &ModuleImports : ImportLists) {
724 auto ModName = ModuleImports.first();
725 auto &Exports = ExportLists[ModName];
726 unsigned NumGVS = numGlobalVarSummaries(Index, Exports);
727 LLVM_DEBUG(dbgs() << "* Module " << ModName << " exports "
728 << Exports.size() - NumGVS << " functions and " << NumGVS
729 << " vars. Imports from " << ModuleImports.second.size()
730 << " modules.\n");
731 for (auto &Src : ModuleImports.second) {
732 auto SrcModName = Src.first();
733 unsigned NumGVSPerMod = numGlobalVarSummaries(Index, Src.second);
734 LLVM_DEBUG(dbgs() << " - " << Src.second.size() - NumGVSPerMod
735 << " functions imported from " << SrcModName << "\n");
736 LLVM_DEBUG(dbgs() << " - " << NumGVSPerMod
737 << " global vars imported from " << SrcModName << "\n");
738 }
739 }
740 #endif
741 }
742
743 #ifndef NDEBUG
dumpImportListForModule(const ModuleSummaryIndex & Index,StringRef ModulePath,FunctionImporter::ImportMapTy & ImportList)744 static void dumpImportListForModule(const ModuleSummaryIndex &Index,
745 StringRef ModulePath,
746 FunctionImporter::ImportMapTy &ImportList) {
747 LLVM_DEBUG(dbgs() << "* Module " << ModulePath << " imports from "
748 << ImportList.size() << " modules.\n");
749 for (auto &Src : ImportList) {
750 auto SrcModName = Src.first();
751 unsigned NumGVSPerMod = numGlobalVarSummaries(Index, Src.second);
752 LLVM_DEBUG(dbgs() << " - " << Src.second.size() - NumGVSPerMod
753 << " functions imported from " << SrcModName << "\n");
754 LLVM_DEBUG(dbgs() << " - " << NumGVSPerMod << " vars imported from "
755 << SrcModName << "\n");
756 }
757 }
758 #endif
759
760 /// Compute all the imports for the given module in the Index.
ComputeCrossModuleImportForModule(StringRef ModulePath,const ModuleSummaryIndex & Index,FunctionImporter::ImportMapTy & ImportList)761 void llvm::ComputeCrossModuleImportForModule(
762 StringRef ModulePath, const ModuleSummaryIndex &Index,
763 FunctionImporter::ImportMapTy &ImportList) {
764 // Collect the list of functions this module defines.
765 // GUID -> Summary
766 GVSummaryMapTy FunctionSummaryMap;
767 Index.collectDefinedFunctionsForModule(ModulePath, FunctionSummaryMap);
768
769 // Compute the import list for this module.
770 LLVM_DEBUG(dbgs() << "Computing import for Module '" << ModulePath << "'\n");
771 ComputeImportForModule(FunctionSummaryMap, Index, ModulePath, ImportList);
772
773 #ifndef NDEBUG
774 dumpImportListForModule(Index, ModulePath, ImportList);
775 #endif
776 }
777
778 // Mark all external summaries in Index for import into the given module.
779 // Used for distributed builds using a distributed index.
ComputeCrossModuleImportForModuleFromIndex(StringRef ModulePath,const ModuleSummaryIndex & Index,FunctionImporter::ImportMapTy & ImportList)780 void llvm::ComputeCrossModuleImportForModuleFromIndex(
781 StringRef ModulePath, const ModuleSummaryIndex &Index,
782 FunctionImporter::ImportMapTy &ImportList) {
783 for (const auto &GlobalList : Index) {
784 // Ignore entries for undefined references.
785 if (GlobalList.second.SummaryList.empty())
786 continue;
787
788 auto GUID = GlobalList.first;
789 assert(GlobalList.second.SummaryList.size() == 1 &&
790 "Expected individual combined index to have one summary per GUID");
791 auto &Summary = GlobalList.second.SummaryList[0];
792 // Skip the summaries for the importing module. These are included to
793 // e.g. record required linkage changes.
794 if (Summary->modulePath() == ModulePath)
795 continue;
796 // Add an entry to provoke importing by thinBackend.
797 ImportList[Summary->modulePath()].insert(GUID);
798 }
799 #ifndef NDEBUG
800 dumpImportListForModule(Index, ModulePath, ImportList);
801 #endif
802 }
803
804 // For SamplePGO, the indirect call targets for local functions will
805 // have its original name annotated in profile. We try to find the
806 // corresponding PGOFuncName as the GUID, and fix up the edges
807 // accordingly.
updateValueInfoForIndirectCalls(ModuleSummaryIndex & Index,FunctionSummary * FS)808 void updateValueInfoForIndirectCalls(ModuleSummaryIndex &Index,
809 FunctionSummary *FS) {
810 for (auto &EI : FS->mutableCalls()) {
811 if (!EI.first.getSummaryList().empty())
812 continue;
813 auto GUID = Index.getGUIDFromOriginalID(EI.first.getGUID());
814 if (GUID == 0)
815 continue;
816 // Update the edge to point directly to the correct GUID.
817 auto VI = Index.getValueInfo(GUID);
818 if (llvm::any_of(
819 VI.getSummaryList(),
820 [&](const std::unique_ptr<GlobalValueSummary> &SummaryPtr) {
821 // The mapping from OriginalId to GUID may return a GUID
822 // that corresponds to a static variable. Filter it out here.
823 // This can happen when
824 // 1) There is a call to a library function which is not defined
825 // in the index.
826 // 2) There is a static variable with the OriginalGUID identical
827 // to the GUID of the library function in 1);
828 // When this happens the static variable in 2) will be found,
829 // which needs to be filtered out.
830 return SummaryPtr->getSummaryKind() ==
831 GlobalValueSummary::GlobalVarKind;
832 }))
833 continue;
834 EI.first = VI;
835 }
836 }
837
updateIndirectCalls(ModuleSummaryIndex & Index)838 void llvm::updateIndirectCalls(ModuleSummaryIndex &Index) {
839 for (const auto &Entry : Index) {
840 for (const auto &S : Entry.second.SummaryList) {
841 if (auto *FS = dyn_cast<FunctionSummary>(S.get()))
842 updateValueInfoForIndirectCalls(Index, FS);
843 }
844 }
845 }
846
computeDeadSymbolsAndUpdateIndirectCalls(ModuleSummaryIndex & Index,const DenseSet<GlobalValue::GUID> & GUIDPreservedSymbols,function_ref<PrevailingType (GlobalValue::GUID)> isPrevailing)847 void llvm::computeDeadSymbolsAndUpdateIndirectCalls(
848 ModuleSummaryIndex &Index,
849 const DenseSet<GlobalValue::GUID> &GUIDPreservedSymbols,
850 function_ref<PrevailingType(GlobalValue::GUID)> isPrevailing) {
851 assert(!Index.withGlobalValueDeadStripping());
852 if (!ComputeDead ||
853 // Don't do anything when nothing is live, this is friendly with tests.
854 GUIDPreservedSymbols.empty()) {
855 // Still need to update indirect calls.
856 updateIndirectCalls(Index);
857 return;
858 }
859 unsigned LiveSymbols = 0;
860 SmallVector<ValueInfo, 128> Worklist;
861 Worklist.reserve(GUIDPreservedSymbols.size() * 2);
862 for (auto GUID : GUIDPreservedSymbols) {
863 ValueInfo VI = Index.getValueInfo(GUID);
864 if (!VI)
865 continue;
866 for (const auto &S : VI.getSummaryList())
867 S->setLive(true);
868 }
869
870 // Add values flagged in the index as live roots to the worklist.
871 for (const auto &Entry : Index) {
872 auto VI = Index.getValueInfo(Entry);
873 for (const auto &S : Entry.second.SummaryList) {
874 if (auto *FS = dyn_cast<FunctionSummary>(S.get()))
875 updateValueInfoForIndirectCalls(Index, FS);
876 if (S->isLive()) {
877 LLVM_DEBUG(dbgs() << "Live root: " << VI << "\n");
878 Worklist.push_back(VI);
879 ++LiveSymbols;
880 break;
881 }
882 }
883 }
884
885 // Make value live and add it to the worklist if it was not live before.
886 auto visit = [&](ValueInfo VI, bool IsAliasee) {
887 // FIXME: If we knew which edges were created for indirect call profiles,
888 // we could skip them here. Any that are live should be reached via
889 // other edges, e.g. reference edges. Otherwise, using a profile collected
890 // on a slightly different binary might provoke preserving, importing
891 // and ultimately promoting calls to functions not linked into this
892 // binary, which increases the binary size unnecessarily. Note that
893 // if this code changes, the importer needs to change so that edges
894 // to functions marked dead are skipped.
895
896 if (llvm::any_of(VI.getSummaryList(),
897 [](const std::unique_ptr<llvm::GlobalValueSummary> &S) {
898 return S->isLive();
899 }))
900 return;
901
902 // We only keep live symbols that are known to be non-prevailing if any are
903 // available_externally, linkonceodr, weakodr. Those symbols are discarded
904 // later in the EliminateAvailableExternally pass and setting them to
905 // not-live could break downstreams users of liveness information (PR36483)
906 // or limit optimization opportunities.
907 if (isPrevailing(VI.getGUID()) == PrevailingType::No) {
908 bool KeepAliveLinkage = false;
909 bool Interposable = false;
910 for (const auto &S : VI.getSummaryList()) {
911 if (S->linkage() == GlobalValue::AvailableExternallyLinkage ||
912 S->linkage() == GlobalValue::WeakODRLinkage ||
913 S->linkage() == GlobalValue::LinkOnceODRLinkage)
914 KeepAliveLinkage = true;
915 else if (GlobalValue::isInterposableLinkage(S->linkage()))
916 Interposable = true;
917 }
918
919 if (!IsAliasee) {
920 if (!KeepAliveLinkage)
921 return;
922
923 if (Interposable)
924 report_fatal_error(
925 "Interposable and available_externally/linkonce_odr/weak_odr "
926 "symbol");
927 }
928 }
929
930 for (const auto &S : VI.getSummaryList())
931 S->setLive(true);
932 ++LiveSymbols;
933 Worklist.push_back(VI);
934 };
935
936 while (!Worklist.empty()) {
937 auto VI = Worklist.pop_back_val();
938 for (const auto &Summary : VI.getSummaryList()) {
939 if (auto *AS = dyn_cast<AliasSummary>(Summary.get())) {
940 // If this is an alias, visit the aliasee VI to ensure that all copies
941 // are marked live and it is added to the worklist for further
942 // processing of its references.
943 visit(AS->getAliaseeVI(), true);
944 continue;
945 }
946 for (auto Ref : Summary->refs())
947 visit(Ref, false);
948 if (auto *FS = dyn_cast<FunctionSummary>(Summary.get()))
949 for (auto Call : FS->calls())
950 visit(Call.first, false);
951 }
952 }
953 Index.setWithGlobalValueDeadStripping();
954
955 unsigned DeadSymbols = Index.size() - LiveSymbols;
956 LLVM_DEBUG(dbgs() << LiveSymbols << " symbols Live, and " << DeadSymbols
957 << " symbols Dead \n");
958 NumDeadSymbols += DeadSymbols;
959 NumLiveSymbols += LiveSymbols;
960 }
961
962 // Compute dead symbols and propagate constants in combined index.
computeDeadSymbolsWithConstProp(ModuleSummaryIndex & Index,const DenseSet<GlobalValue::GUID> & GUIDPreservedSymbols,function_ref<PrevailingType (GlobalValue::GUID)> isPrevailing,bool ImportEnabled)963 void llvm::computeDeadSymbolsWithConstProp(
964 ModuleSummaryIndex &Index,
965 const DenseSet<GlobalValue::GUID> &GUIDPreservedSymbols,
966 function_ref<PrevailingType(GlobalValue::GUID)> isPrevailing,
967 bool ImportEnabled) {
968 computeDeadSymbolsAndUpdateIndirectCalls(Index, GUIDPreservedSymbols,
969 isPrevailing);
970 if (ImportEnabled)
971 Index.propagateAttributes(GUIDPreservedSymbols);
972 }
973
974 /// Compute the set of summaries needed for a ThinLTO backend compilation of
975 /// \p ModulePath.
gatherImportedSummariesForModule(StringRef ModulePath,const StringMap<GVSummaryMapTy> & ModuleToDefinedGVSummaries,const FunctionImporter::ImportMapTy & ImportList,std::map<std::string,GVSummaryMapTy> & ModuleToSummariesForIndex)976 void llvm::gatherImportedSummariesForModule(
977 StringRef ModulePath,
978 const StringMap<GVSummaryMapTy> &ModuleToDefinedGVSummaries,
979 const FunctionImporter::ImportMapTy &ImportList,
980 std::map<std::string, GVSummaryMapTy> &ModuleToSummariesForIndex) {
981 // Include all summaries from the importing module.
982 ModuleToSummariesForIndex[std::string(ModulePath)] =
983 ModuleToDefinedGVSummaries.lookup(ModulePath);
984 // Include summaries for imports.
985 for (const auto &ILI : ImportList) {
986 auto &SummariesForIndex =
987 ModuleToSummariesForIndex[std::string(ILI.first())];
988 const auto &DefinedGVSummaries =
989 ModuleToDefinedGVSummaries.lookup(ILI.first());
990 for (const auto &GI : ILI.second) {
991 const auto &DS = DefinedGVSummaries.find(GI);
992 assert(DS != DefinedGVSummaries.end() &&
993 "Expected a defined summary for imported global value");
994 SummariesForIndex[GI] = DS->second;
995 }
996 }
997 }
998
999 /// Emit the files \p ModulePath will import from into \p OutputFilename.
EmitImportsFiles(StringRef ModulePath,StringRef OutputFilename,const std::map<std::string,GVSummaryMapTy> & ModuleToSummariesForIndex)1000 std::error_code llvm::EmitImportsFiles(
1001 StringRef ModulePath, StringRef OutputFilename,
1002 const std::map<std::string, GVSummaryMapTy> &ModuleToSummariesForIndex) {
1003 std::error_code EC;
1004 raw_fd_ostream ImportsOS(OutputFilename, EC, sys::fs::OpenFlags::OF_None);
1005 if (EC)
1006 return EC;
1007 for (const auto &ILI : ModuleToSummariesForIndex)
1008 // The ModuleToSummariesForIndex map includes an entry for the current
1009 // Module (needed for writing out the index files). We don't want to
1010 // include it in the imports file, however, so filter it out.
1011 if (ILI.first != ModulePath)
1012 ImportsOS << ILI.first << "\n";
1013 return std::error_code();
1014 }
1015
convertToDeclaration(GlobalValue & GV)1016 bool llvm::convertToDeclaration(GlobalValue &GV) {
1017 LLVM_DEBUG(dbgs() << "Converting to a declaration: `" << GV.getName()
1018 << "\n");
1019 if (Function *F = dyn_cast<Function>(&GV)) {
1020 F->deleteBody();
1021 F->clearMetadata();
1022 F->setComdat(nullptr);
1023 } else if (GlobalVariable *V = dyn_cast<GlobalVariable>(&GV)) {
1024 V->setInitializer(nullptr);
1025 V->setLinkage(GlobalValue::ExternalLinkage);
1026 V->clearMetadata();
1027 V->setComdat(nullptr);
1028 } else {
1029 GlobalValue *NewGV;
1030 if (GV.getValueType()->isFunctionTy())
1031 NewGV =
1032 Function::Create(cast<FunctionType>(GV.getValueType()),
1033 GlobalValue::ExternalLinkage, GV.getAddressSpace(),
1034 "", GV.getParent());
1035 else
1036 NewGV =
1037 new GlobalVariable(*GV.getParent(), GV.getValueType(),
1038 /*isConstant*/ false, GlobalValue::ExternalLinkage,
1039 /*init*/ nullptr, "",
1040 /*insertbefore*/ nullptr, GV.getThreadLocalMode(),
1041 GV.getType()->getAddressSpace());
1042 NewGV->takeName(&GV);
1043 GV.replaceAllUsesWith(NewGV);
1044 return false;
1045 }
1046 if (!GV.isImplicitDSOLocal())
1047 GV.setDSOLocal(false);
1048 return true;
1049 }
1050
thinLTOFinalizeInModule(Module & TheModule,const GVSummaryMapTy & DefinedGlobals,bool PropagateAttrs)1051 void llvm::thinLTOFinalizeInModule(Module &TheModule,
1052 const GVSummaryMapTy &DefinedGlobals,
1053 bool PropagateAttrs) {
1054 DenseSet<Comdat *> NonPrevailingComdats;
1055 auto FinalizeInModule = [&](GlobalValue &GV, bool Propagate = false) {
1056 // See if the global summary analysis computed a new resolved linkage.
1057 const auto &GS = DefinedGlobals.find(GV.getGUID());
1058 if (GS == DefinedGlobals.end())
1059 return;
1060
1061 if (Propagate)
1062 if (FunctionSummary *FS = dyn_cast<FunctionSummary>(GS->second)) {
1063 if (Function *F = dyn_cast<Function>(&GV)) {
1064 // TODO: propagate ReadNone and ReadOnly.
1065 if (FS->fflags().ReadNone && !F->doesNotAccessMemory())
1066 F->setDoesNotAccessMemory();
1067
1068 if (FS->fflags().ReadOnly && !F->onlyReadsMemory())
1069 F->setOnlyReadsMemory();
1070
1071 if (FS->fflags().NoRecurse && !F->doesNotRecurse())
1072 F->setDoesNotRecurse();
1073
1074 if (FS->fflags().NoUnwind && !F->doesNotThrow())
1075 F->setDoesNotThrow();
1076 }
1077 }
1078
1079 auto NewLinkage = GS->second->linkage();
1080 if (GlobalValue::isLocalLinkage(GV.getLinkage()) ||
1081 // Don't internalize anything here, because the code below
1082 // lacks necessary correctness checks. Leave this job to
1083 // LLVM 'internalize' pass.
1084 GlobalValue::isLocalLinkage(NewLinkage) ||
1085 // In case it was dead and already converted to declaration.
1086 GV.isDeclaration())
1087 return;
1088
1089 // Set the potentially more constraining visibility computed from summaries.
1090 // The DefaultVisibility condition is because older GlobalValueSummary does
1091 // not record DefaultVisibility and we don't want to change protected/hidden
1092 // to default.
1093 if (GS->second->getVisibility() != GlobalValue::DefaultVisibility)
1094 GV.setVisibility(GS->second->getVisibility());
1095
1096 if (NewLinkage == GV.getLinkage())
1097 return;
1098
1099 // Check for a non-prevailing def that has interposable linkage
1100 // (e.g. non-odr weak or linkonce). In that case we can't simply
1101 // convert to available_externally, since it would lose the
1102 // interposable property and possibly get inlined. Simply drop
1103 // the definition in that case.
1104 if (GlobalValue::isAvailableExternallyLinkage(NewLinkage) &&
1105 GlobalValue::isInterposableLinkage(GV.getLinkage())) {
1106 if (!convertToDeclaration(GV))
1107 // FIXME: Change this to collect replaced GVs and later erase
1108 // them from the parent module once thinLTOResolvePrevailingGUID is
1109 // changed to enable this for aliases.
1110 llvm_unreachable("Expected GV to be converted");
1111 } else {
1112 // If all copies of the original symbol had global unnamed addr and
1113 // linkonce_odr linkage, or if all of them had local unnamed addr linkage
1114 // and are constants, then it should be an auto hide symbol. In that case
1115 // the thin link would have marked it as CanAutoHide. Add hidden
1116 // visibility to the symbol to preserve the property.
1117 if (NewLinkage == GlobalValue::WeakODRLinkage &&
1118 GS->second->canAutoHide()) {
1119 assert(GV.canBeOmittedFromSymbolTable());
1120 GV.setVisibility(GlobalValue::HiddenVisibility);
1121 }
1122
1123 LLVM_DEBUG(dbgs() << "ODR fixing up linkage for `" << GV.getName()
1124 << "` from " << GV.getLinkage() << " to " << NewLinkage
1125 << "\n");
1126 GV.setLinkage(NewLinkage);
1127 }
1128 // Remove declarations from comdats, including available_externally
1129 // as this is a declaration for the linker, and will be dropped eventually.
1130 // It is illegal for comdats to contain declarations.
1131 auto *GO = dyn_cast_or_null<GlobalObject>(&GV);
1132 if (GO && GO->isDeclarationForLinker() && GO->hasComdat()) {
1133 if (GO->getComdat()->getName() == GO->getName())
1134 NonPrevailingComdats.insert(GO->getComdat());
1135 GO->setComdat(nullptr);
1136 }
1137 };
1138
1139 // Process functions and global now
1140 for (auto &GV : TheModule)
1141 FinalizeInModule(GV, PropagateAttrs);
1142 for (auto &GV : TheModule.globals())
1143 FinalizeInModule(GV);
1144 for (auto &GV : TheModule.aliases())
1145 FinalizeInModule(GV);
1146
1147 // For a non-prevailing comdat, all its members must be available_externally.
1148 // FinalizeInModule has handled non-local-linkage GlobalValues. Here we handle
1149 // local linkage GlobalValues.
1150 if (NonPrevailingComdats.empty())
1151 return;
1152 for (auto &GO : TheModule.global_objects()) {
1153 if (auto *C = GO.getComdat(); C && NonPrevailingComdats.count(C)) {
1154 GO.setComdat(nullptr);
1155 GO.setLinkage(GlobalValue::AvailableExternallyLinkage);
1156 }
1157 }
1158 bool Changed;
1159 do {
1160 Changed = false;
1161 // If an alias references a GlobalValue in a non-prevailing comdat, change
1162 // it to available_externally. For simplicity we only handle GlobalValue and
1163 // ConstantExpr with a base object. ConstantExpr without a base object is
1164 // unlikely used in a COMDAT.
1165 for (auto &GA : TheModule.aliases()) {
1166 if (GA.hasAvailableExternallyLinkage())
1167 continue;
1168 GlobalObject *Obj = GA.getAliaseeObject();
1169 assert(Obj && "aliasee without an base object is unimplemented");
1170 if (Obj->hasAvailableExternallyLinkage()) {
1171 GA.setLinkage(GlobalValue::AvailableExternallyLinkage);
1172 Changed = true;
1173 }
1174 }
1175 } while (Changed);
1176 }
1177
1178 /// Run internalization on \p TheModule based on symmary analysis.
thinLTOInternalizeModule(Module & TheModule,const GVSummaryMapTy & DefinedGlobals)1179 void llvm::thinLTOInternalizeModule(Module &TheModule,
1180 const GVSummaryMapTy &DefinedGlobals) {
1181 // Declare a callback for the internalize pass that will ask for every
1182 // candidate GlobalValue if it can be internalized or not.
1183 auto MustPreserveGV = [&](const GlobalValue &GV) -> bool {
1184 // It may be the case that GV is on a chain of an ifunc, its alias and
1185 // subsequent aliases. In this case, the summary for the value is not
1186 // available.
1187 if (isa<GlobalIFunc>(&GV) ||
1188 (isa<GlobalAlias>(&GV) &&
1189 isa<GlobalIFunc>(cast<GlobalAlias>(&GV)->getAliaseeObject())))
1190 return true;
1191
1192 // Lookup the linkage recorded in the summaries during global analysis.
1193 auto GS = DefinedGlobals.find(GV.getGUID());
1194 if (GS == DefinedGlobals.end()) {
1195 // Must have been promoted (possibly conservatively). Find original
1196 // name so that we can access the correct summary and see if it can
1197 // be internalized again.
1198 // FIXME: Eventually we should control promotion instead of promoting
1199 // and internalizing again.
1200 StringRef OrigName =
1201 ModuleSummaryIndex::getOriginalNameBeforePromote(GV.getName());
1202 std::string OrigId = GlobalValue::getGlobalIdentifier(
1203 OrigName, GlobalValue::InternalLinkage,
1204 TheModule.getSourceFileName());
1205 GS = DefinedGlobals.find(GlobalValue::getGUID(OrigId));
1206 if (GS == DefinedGlobals.end()) {
1207 // Also check the original non-promoted non-globalized name. In some
1208 // cases a preempted weak value is linked in as a local copy because
1209 // it is referenced by an alias (IRLinker::linkGlobalValueProto).
1210 // In that case, since it was originally not a local value, it was
1211 // recorded in the index using the original name.
1212 // FIXME: This may not be needed once PR27866 is fixed.
1213 GS = DefinedGlobals.find(GlobalValue::getGUID(OrigName));
1214 assert(GS != DefinedGlobals.end());
1215 }
1216 }
1217 return !GlobalValue::isLocalLinkage(GS->second->linkage());
1218 };
1219
1220 // FIXME: See if we can just internalize directly here via linkage changes
1221 // based on the index, rather than invoking internalizeModule.
1222 internalizeModule(TheModule, MustPreserveGV);
1223 }
1224
1225 /// Make alias a clone of its aliasee.
replaceAliasWithAliasee(Module * SrcModule,GlobalAlias * GA)1226 static Function *replaceAliasWithAliasee(Module *SrcModule, GlobalAlias *GA) {
1227 Function *Fn = cast<Function>(GA->getAliaseeObject());
1228
1229 ValueToValueMapTy VMap;
1230 Function *NewFn = CloneFunction(Fn, VMap);
1231 // Clone should use the original alias's linkage, visibility and name, and we
1232 // ensure all uses of alias instead use the new clone (casted if necessary).
1233 NewFn->setLinkage(GA->getLinkage());
1234 NewFn->setVisibility(GA->getVisibility());
1235 GA->replaceAllUsesWith(ConstantExpr::getBitCast(NewFn, GA->getType()));
1236 NewFn->takeName(GA);
1237 return NewFn;
1238 }
1239
1240 // Internalize values that we marked with specific attribute
1241 // in processGlobalForThinLTO.
internalizeGVsAfterImport(Module & M)1242 static void internalizeGVsAfterImport(Module &M) {
1243 for (auto &GV : M.globals())
1244 // Skip GVs which have been converted to declarations
1245 // by dropDeadSymbols.
1246 if (!GV.isDeclaration() && GV.hasAttribute("thinlto-internalize")) {
1247 GV.setLinkage(GlobalValue::InternalLinkage);
1248 GV.setVisibility(GlobalValue::DefaultVisibility);
1249 }
1250 }
1251
1252 // Automatically import functions in Module \p DestModule based on the summaries
1253 // index.
importFunctions(Module & DestModule,const FunctionImporter::ImportMapTy & ImportList)1254 Expected<bool> FunctionImporter::importFunctions(
1255 Module &DestModule, const FunctionImporter::ImportMapTy &ImportList) {
1256 LLVM_DEBUG(dbgs() << "Starting import for Module "
1257 << DestModule.getModuleIdentifier() << "\n");
1258 unsigned ImportedCount = 0, ImportedGVCount = 0;
1259
1260 IRMover Mover(DestModule);
1261 // Do the actual import of functions now, one Module at a time
1262 std::set<StringRef> ModuleNameOrderedList;
1263 for (const auto &FunctionsToImportPerModule : ImportList) {
1264 ModuleNameOrderedList.insert(FunctionsToImportPerModule.first());
1265 }
1266 for (const auto &Name : ModuleNameOrderedList) {
1267 // Get the module for the import
1268 const auto &FunctionsToImportPerModule = ImportList.find(Name);
1269 assert(FunctionsToImportPerModule != ImportList.end());
1270 Expected<std::unique_ptr<Module>> SrcModuleOrErr = ModuleLoader(Name);
1271 if (!SrcModuleOrErr)
1272 return SrcModuleOrErr.takeError();
1273 std::unique_ptr<Module> SrcModule = std::move(*SrcModuleOrErr);
1274 assert(&DestModule.getContext() == &SrcModule->getContext() &&
1275 "Context mismatch");
1276
1277 // If modules were created with lazy metadata loading, materialize it
1278 // now, before linking it (otherwise this will be a noop).
1279 if (Error Err = SrcModule->materializeMetadata())
1280 return std::move(Err);
1281
1282 auto &ImportGUIDs = FunctionsToImportPerModule->second;
1283 // Find the globals to import
1284 SetVector<GlobalValue *> GlobalsToImport;
1285 for (Function &F : *SrcModule) {
1286 if (!F.hasName())
1287 continue;
1288 auto GUID = F.getGUID();
1289 auto Import = ImportGUIDs.count(GUID);
1290 LLVM_DEBUG(dbgs() << (Import ? "Is" : "Not") << " importing function "
1291 << GUID << " " << F.getName() << " from "
1292 << SrcModule->getSourceFileName() << "\n");
1293 if (Import) {
1294 if (Error Err = F.materialize())
1295 return std::move(Err);
1296 if (EnableImportMetadata) {
1297 // Add 'thinlto_src_module' metadata for statistics and debugging.
1298 F.setMetadata(
1299 "thinlto_src_module",
1300 MDNode::get(DestModule.getContext(),
1301 {MDString::get(DestModule.getContext(),
1302 SrcModule->getSourceFileName())}));
1303 }
1304 GlobalsToImport.insert(&F);
1305 }
1306 }
1307 for (GlobalVariable &GV : SrcModule->globals()) {
1308 if (!GV.hasName())
1309 continue;
1310 auto GUID = GV.getGUID();
1311 auto Import = ImportGUIDs.count(GUID);
1312 LLVM_DEBUG(dbgs() << (Import ? "Is" : "Not") << " importing global "
1313 << GUID << " " << GV.getName() << " from "
1314 << SrcModule->getSourceFileName() << "\n");
1315 if (Import) {
1316 if (Error Err = GV.materialize())
1317 return std::move(Err);
1318 ImportedGVCount += GlobalsToImport.insert(&GV);
1319 }
1320 }
1321 for (GlobalAlias &GA : SrcModule->aliases()) {
1322 if (!GA.hasName() || isa<GlobalIFunc>(GA.getAliaseeObject()))
1323 continue;
1324 auto GUID = GA.getGUID();
1325 auto Import = ImportGUIDs.count(GUID);
1326 LLVM_DEBUG(dbgs() << (Import ? "Is" : "Not") << " importing alias "
1327 << GUID << " " << GA.getName() << " from "
1328 << SrcModule->getSourceFileName() << "\n");
1329 if (Import) {
1330 if (Error Err = GA.materialize())
1331 return std::move(Err);
1332 // Import alias as a copy of its aliasee.
1333 GlobalObject *GO = GA.getAliaseeObject();
1334 if (Error Err = GO->materialize())
1335 return std::move(Err);
1336 auto *Fn = replaceAliasWithAliasee(SrcModule.get(), &GA);
1337 LLVM_DEBUG(dbgs() << "Is importing aliasee fn " << GO->getGUID() << " "
1338 << GO->getName() << " from "
1339 << SrcModule->getSourceFileName() << "\n");
1340 if (EnableImportMetadata) {
1341 // Add 'thinlto_src_module' metadata for statistics and debugging.
1342 Fn->setMetadata(
1343 "thinlto_src_module",
1344 MDNode::get(DestModule.getContext(),
1345 {MDString::get(DestModule.getContext(),
1346 SrcModule->getSourceFileName())}));
1347 }
1348 GlobalsToImport.insert(Fn);
1349 }
1350 }
1351
1352 // Upgrade debug info after we're done materializing all the globals and we
1353 // have loaded all the required metadata!
1354 UpgradeDebugInfo(*SrcModule);
1355
1356 // Set the partial sample profile ratio in the profile summary module flag
1357 // of the imported source module, if applicable, so that the profile summary
1358 // module flag will match with that of the destination module when it's
1359 // imported.
1360 SrcModule->setPartialSampleProfileRatio(Index);
1361
1362 // Link in the specified functions.
1363 if (renameModuleForThinLTO(*SrcModule, Index, ClearDSOLocalOnDeclarations,
1364 &GlobalsToImport))
1365 return true;
1366
1367 if (PrintImports) {
1368 for (const auto *GV : GlobalsToImport)
1369 dbgs() << DestModule.getSourceFileName() << ": Import " << GV->getName()
1370 << " from " << SrcModule->getSourceFileName() << "\n";
1371 }
1372
1373 if (Error Err = Mover.move(std::move(SrcModule),
1374 GlobalsToImport.getArrayRef(), nullptr,
1375 /*IsPerformingImport=*/true))
1376 report_fatal_error(Twine("Function Import: link error: ") +
1377 toString(std::move(Err)));
1378
1379 ImportedCount += GlobalsToImport.size();
1380 NumImportedModules++;
1381 }
1382
1383 internalizeGVsAfterImport(DestModule);
1384
1385 NumImportedFunctions += (ImportedCount - ImportedGVCount);
1386 NumImportedGlobalVars += ImportedGVCount;
1387
1388 LLVM_DEBUG(dbgs() << "Imported " << ImportedCount - ImportedGVCount
1389 << " functions for Module "
1390 << DestModule.getModuleIdentifier() << "\n");
1391 LLVM_DEBUG(dbgs() << "Imported " << ImportedGVCount
1392 << " global variables for Module "
1393 << DestModule.getModuleIdentifier() << "\n");
1394 return ImportedCount;
1395 }
1396
doImportingForModule(Module & M)1397 static bool doImportingForModule(Module &M) {
1398 if (SummaryFile.empty())
1399 report_fatal_error("error: -function-import requires -summary-file\n");
1400 Expected<std::unique_ptr<ModuleSummaryIndex>> IndexPtrOrErr =
1401 getModuleSummaryIndexForFile(SummaryFile);
1402 if (!IndexPtrOrErr) {
1403 logAllUnhandledErrors(IndexPtrOrErr.takeError(), errs(),
1404 "Error loading file '" + SummaryFile + "': ");
1405 return false;
1406 }
1407 std::unique_ptr<ModuleSummaryIndex> Index = std::move(*IndexPtrOrErr);
1408
1409 // First step is collecting the import list.
1410 FunctionImporter::ImportMapTy ImportList;
1411 // If requested, simply import all functions in the index. This is used
1412 // when testing distributed backend handling via the opt tool, when
1413 // we have distributed indexes containing exactly the summaries to import.
1414 if (ImportAllIndex)
1415 ComputeCrossModuleImportForModuleFromIndex(M.getModuleIdentifier(), *Index,
1416 ImportList);
1417 else
1418 ComputeCrossModuleImportForModule(M.getModuleIdentifier(), *Index,
1419 ImportList);
1420
1421 // Conservatively mark all internal values as promoted. This interface is
1422 // only used when doing importing via the function importing pass. The pass
1423 // is only enabled when testing importing via the 'opt' tool, which does
1424 // not do the ThinLink that would normally determine what values to promote.
1425 for (auto &I : *Index) {
1426 for (auto &S : I.second.SummaryList) {
1427 if (GlobalValue::isLocalLinkage(S->linkage()))
1428 S->setLinkage(GlobalValue::ExternalLinkage);
1429 }
1430 }
1431
1432 // Next we need to promote to global scope and rename any local values that
1433 // are potentially exported to other modules.
1434 if (renameModuleForThinLTO(M, *Index, /*ClearDSOLocalOnDeclarations=*/false,
1435 /*GlobalsToImport=*/nullptr)) {
1436 errs() << "Error renaming module\n";
1437 return false;
1438 }
1439
1440 // Perform the import now.
1441 auto ModuleLoader = [&M](StringRef Identifier) {
1442 return loadFile(std::string(Identifier), M.getContext());
1443 };
1444 FunctionImporter Importer(*Index, ModuleLoader,
1445 /*ClearDSOLocalOnDeclarations=*/false);
1446 Expected<bool> Result = Importer.importFunctions(M, ImportList);
1447
1448 // FIXME: Probably need to propagate Errors through the pass manager.
1449 if (!Result) {
1450 logAllUnhandledErrors(Result.takeError(), errs(),
1451 "Error importing module: ");
1452 return false;
1453 }
1454
1455 return *Result;
1456 }
1457
run(Module & M,ModuleAnalysisManager & AM)1458 PreservedAnalyses FunctionImportPass::run(Module &M,
1459 ModuleAnalysisManager &AM) {
1460 if (!doImportingForModule(M))
1461 return PreservedAnalyses::all();
1462
1463 return PreservedAnalyses::none();
1464 }
1465