LLVM 22.0.0git
LTO.cpp
Go to the documentation of this file.
1//===-LTO.cpp - LLVM Link Time Optimizer ----------------------------------===//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8//
9// This file implements functions and classes used to support LTO.
10//
11//===----------------------------------------------------------------------===//
12
13#include "llvm/LTO/LTO.h"
14#include "llvm/ADT/ArrayRef.h"
15#include "llvm/ADT/ScopeExit.h"
16#include "llvm/ADT/SmallSet.h"
18#include "llvm/ADT/Statistic.h"
27#include "llvm/Config/llvm-config.h"
28#include "llvm/IR/AutoUpgrade.h"
30#include "llvm/IR/Intrinsics.h"
33#include "llvm/IR/Mangler.h"
34#include "llvm/IR/Metadata.h"
36#include "llvm/LTO/LTOBackend.h"
37#include "llvm/Linker/IRMover.h"
43#include "llvm/Support/Error.h"
45#include "llvm/Support/JSON.h"
47#include "llvm/Support/Path.h"
49#include "llvm/Support/SHA1.h"
56#include "llvm/Support/VCSRevision.h"
59#include "llvm/Transforms/IPO.h"
64
65#include <optional>
66#include <set>
67
68using namespace llvm;
69using namespace lto;
70using namespace object;
71
72#define DEBUG_TYPE "lto"
73
74static cl::opt<bool>
75 DumpThinCGSCCs("dump-thin-cg-sccs", cl::init(false), cl::Hidden,
76 cl::desc("Dump the SCCs in the ThinLTO index's callgraph"));
77
78namespace llvm {
81} // end namespace llvm
82
83namespace llvm {
84/// Enable global value internalization in LTO.
86 "enable-lto-internalization", cl::init(true), cl::Hidden,
87 cl::desc("Enable global value internalization in LTO"));
88
89static cl::opt<bool>
90 LTOKeepSymbolCopies("lto-keep-symbol-copies", cl::init(false), cl::Hidden,
91 cl::desc("Keep copies of symbols in LTO indexing"));
92
93/// Indicate we are linking with an allocator that supports hot/cold operator
94/// new interfaces.
96
97/// Enable MemProf context disambiguation for thin link.
99} // namespace llvm
100
101// Computes a unique hash for the Module considering the current list of
102// export/import and other global analysis results.
103// Returns the hash in its hexadecimal representation.
105 const Config &Conf, const ModuleSummaryIndex &Index, StringRef ModuleID,
106 const FunctionImporter::ImportMapTy &ImportList,
107 const FunctionImporter::ExportSetTy &ExportList,
108 const std::map<GlobalValue::GUID, GlobalValue::LinkageTypes> &ResolvedODR,
109 const GVSummaryMapTy &DefinedGlobals,
110 const DenseSet<GlobalValue::GUID> &CfiFunctionDefs,
111 const DenseSet<GlobalValue::GUID> &CfiFunctionDecls) {
112 // Compute the unique hash for this entry.
113 // This is based on the current compiler version, the module itself, the
114 // export list, the hash for every single module in the import list, the
115 // list of ResolvedODR for the module, and the list of preserved symbols.
116 SHA1 Hasher;
117
118 // Start with the compiler revision
119 Hasher.update(LLVM_VERSION_STRING);
120#ifdef LLVM_REVISION
121 Hasher.update(LLVM_REVISION);
122#endif
123
124 // Include the parts of the LTO configuration that affect code generation.
125 auto AddString = [&](StringRef Str) {
126 Hasher.update(Str);
127 Hasher.update(ArrayRef<uint8_t>{0});
128 };
129 auto AddUnsigned = [&](unsigned I) {
130 uint8_t Data[4];
132 Hasher.update(Data);
133 };
134 auto AddUint64 = [&](uint64_t I) {
135 uint8_t Data[8];
137 Hasher.update(Data);
138 };
139 auto AddUint8 = [&](const uint8_t I) {
140 Hasher.update(ArrayRef<uint8_t>(&I, 1));
141 };
142 AddString(Conf.CPU);
143 // FIXME: Hash more of Options. For now all clients initialize Options from
144 // command-line flags (which is unsupported in production), but may set
145 // X86RelaxRelocations. The clang driver can also pass FunctionSections,
146 // DataSections and DebuggerTuning via command line flags.
147 AddUnsigned(Conf.Options.MCOptions.X86RelaxRelocations);
148 AddUnsigned(Conf.Options.FunctionSections);
149 AddUnsigned(Conf.Options.DataSections);
150 AddUnsigned((unsigned)Conf.Options.DebuggerTuning);
151 for (auto &A : Conf.MAttrs)
152 AddString(A);
153 if (Conf.RelocModel)
154 AddUnsigned(*Conf.RelocModel);
155 else
156 AddUnsigned(-1);
157 if (Conf.CodeModel)
158 AddUnsigned(*Conf.CodeModel);
159 else
160 AddUnsigned(-1);
161 for (const auto &S : Conf.MllvmArgs)
162 AddString(S);
163 AddUnsigned(static_cast<int>(Conf.CGOptLevel));
164 AddUnsigned(static_cast<int>(Conf.CGFileType));
165 AddUnsigned(Conf.OptLevel);
166 AddUnsigned(Conf.Freestanding);
167 AddString(Conf.OptPipeline);
168 AddString(Conf.AAPipeline);
169 AddString(Conf.OverrideTriple);
170 AddString(Conf.DefaultTriple);
171 AddString(Conf.DwoDir);
172 AddUint8(Conf.Dtlto);
173
174 // Include the hash for the current module
175 auto ModHash = Index.getModuleHash(ModuleID);
176 Hasher.update(ArrayRef<uint8_t>((uint8_t *)&ModHash[0], sizeof(ModHash)));
177
178 // TODO: `ExportList` is determined by `ImportList`. Since `ImportList` is
179 // used to compute cache key, we could omit hashing `ExportList` here.
180 std::vector<uint64_t> ExportsGUID;
181 ExportsGUID.reserve(ExportList.size());
182 for (const auto &VI : ExportList)
183 ExportsGUID.push_back(VI.getGUID());
184
185 // Sort the export list elements GUIDs.
186 llvm::sort(ExportsGUID);
187 for (auto GUID : ExportsGUID)
188 Hasher.update(ArrayRef<uint8_t>((uint8_t *)&GUID, sizeof(GUID)));
189
190 // Order using module hash, to be both independent of module name and
191 // module order.
192 auto Comp = [&](const std::pair<StringRef, GlobalValue::GUID> &L,
193 const std::pair<StringRef, GlobalValue::GUID> &R) {
194 return std::make_pair(Index.getModule(L.first)->second, L.second) <
195 std::make_pair(Index.getModule(R.first)->second, R.second);
196 };
197 FunctionImporter::SortedImportList SortedImportList(ImportList, Comp);
198
199 // Count the number of imports for each source module.
200 DenseMap<StringRef, unsigned> ModuleToNumImports;
201 for (const auto &[FromModule, GUID, Type] : SortedImportList)
202 ++ModuleToNumImports[FromModule];
203
204 std::optional<StringRef> LastModule;
205 for (const auto &[FromModule, GUID, Type] : SortedImportList) {
206 if (LastModule != FromModule) {
207 // Include the hash for every module we import functions from. The set of
208 // imported symbols for each module may affect code generation and is
209 // sensitive to link order, so include that as well.
210 LastModule = FromModule;
211 auto ModHash = Index.getModule(FromModule)->second;
212 Hasher.update(ArrayRef<uint8_t>((uint8_t *)&ModHash[0], sizeof(ModHash)));
213 AddUint64(ModuleToNumImports[FromModule]);
214 }
215 AddUint64(GUID);
216 AddUint8(Type);
217 }
218
219 // Include the hash for the resolved ODR.
220 for (auto &Entry : ResolvedODR) {
221 Hasher.update(ArrayRef<uint8_t>((const uint8_t *)&Entry.first,
222 sizeof(GlobalValue::GUID)));
223 Hasher.update(ArrayRef<uint8_t>((const uint8_t *)&Entry.second,
225 }
226
227 // Members of CfiFunctionDefs and CfiFunctionDecls that are referenced or
228 // defined in this module.
229 std::set<GlobalValue::GUID> UsedCfiDefs;
230 std::set<GlobalValue::GUID> UsedCfiDecls;
231
232 // Typeids used in this module.
233 std::set<GlobalValue::GUID> UsedTypeIds;
234
235 auto AddUsedCfiGlobal = [&](GlobalValue::GUID ValueGUID) {
236 if (CfiFunctionDefs.contains(ValueGUID))
237 UsedCfiDefs.insert(ValueGUID);
238 if (CfiFunctionDecls.contains(ValueGUID))
239 UsedCfiDecls.insert(ValueGUID);
240 };
241
242 auto AddUsedThings = [&](GlobalValueSummary *GS) {
243 if (!GS) return;
244 AddUnsigned(GS->getVisibility());
245 AddUnsigned(GS->isLive());
246 AddUnsigned(GS->canAutoHide());
247 for (const ValueInfo &VI : GS->refs()) {
248 AddUnsigned(VI.isDSOLocal(Index.withDSOLocalPropagation()));
249 AddUsedCfiGlobal(VI.getGUID());
250 }
251 if (auto *GVS = dyn_cast<GlobalVarSummary>(GS)) {
252 AddUnsigned(GVS->maybeReadOnly());
253 AddUnsigned(GVS->maybeWriteOnly());
254 }
255 if (auto *FS = dyn_cast<FunctionSummary>(GS)) {
256 for (auto &TT : FS->type_tests())
257 UsedTypeIds.insert(TT);
258 for (auto &TT : FS->type_test_assume_vcalls())
259 UsedTypeIds.insert(TT.GUID);
260 for (auto &TT : FS->type_checked_load_vcalls())
261 UsedTypeIds.insert(TT.GUID);
262 for (auto &TT : FS->type_test_assume_const_vcalls())
263 UsedTypeIds.insert(TT.VFunc.GUID);
264 for (auto &TT : FS->type_checked_load_const_vcalls())
265 UsedTypeIds.insert(TT.VFunc.GUID);
266 for (auto &ET : FS->calls()) {
267 AddUnsigned(ET.first.isDSOLocal(Index.withDSOLocalPropagation()));
268 AddUsedCfiGlobal(ET.first.getGUID());
269 }
270 }
271 };
272
273 // Include the hash for the linkage type to reflect internalization and weak
274 // resolution, and collect any used type identifier resolutions.
275 for (auto &GS : DefinedGlobals) {
276 GlobalValue::LinkageTypes Linkage = GS.second->linkage();
277 Hasher.update(
278 ArrayRef<uint8_t>((const uint8_t *)&Linkage, sizeof(Linkage)));
279 AddUsedCfiGlobal(GS.first);
280 AddUsedThings(GS.second);
281 }
282
283 // Imported functions may introduce new uses of type identifier resolutions,
284 // so we need to collect their used resolutions as well.
285 for (const auto &[FromModule, GUID, Type] : SortedImportList) {
286 GlobalValueSummary *S = Index.findSummaryInModule(GUID, FromModule);
287 AddUsedThings(S);
288 // If this is an alias, we also care about any types/etc. that the aliasee
289 // may reference.
290 if (auto *AS = dyn_cast_or_null<AliasSummary>(S))
291 AddUsedThings(AS->getBaseObject());
292 }
293
294 auto AddTypeIdSummary = [&](StringRef TId, const TypeIdSummary &S) {
295 AddString(TId);
296
297 AddUnsigned(S.TTRes.TheKind);
298 AddUnsigned(S.TTRes.SizeM1BitWidth);
299
300 AddUint64(S.TTRes.AlignLog2);
301 AddUint64(S.TTRes.SizeM1);
302 AddUint64(S.TTRes.BitMask);
303 AddUint64(S.TTRes.InlineBits);
304
305 AddUint64(S.WPDRes.size());
306 for (auto &WPD : S.WPDRes) {
307 AddUnsigned(WPD.first);
308 AddUnsigned(WPD.second.TheKind);
309 AddString(WPD.second.SingleImplName);
310
311 AddUint64(WPD.second.ResByArg.size());
312 for (auto &ByArg : WPD.second.ResByArg) {
313 AddUint64(ByArg.first.size());
314 for (uint64_t Arg : ByArg.first)
315 AddUint64(Arg);
316 AddUnsigned(ByArg.second.TheKind);
317 AddUint64(ByArg.second.Info);
318 AddUnsigned(ByArg.second.Byte);
319 AddUnsigned(ByArg.second.Bit);
320 }
321 }
322 };
323
324 // Include the hash for all type identifiers used by this module.
325 for (GlobalValue::GUID TId : UsedTypeIds) {
326 auto TidIter = Index.typeIds().equal_range(TId);
327 for (const auto &I : make_range(TidIter))
328 AddTypeIdSummary(I.second.first, I.second.second);
329 }
330
331 AddUnsigned(UsedCfiDefs.size());
332 for (auto &V : UsedCfiDefs)
333 AddUint64(V);
334
335 AddUnsigned(UsedCfiDecls.size());
336 for (auto &V : UsedCfiDecls)
337 AddUint64(V);
338
339 if (!Conf.SampleProfile.empty()) {
340 auto FileOrErr = MemoryBuffer::getFile(Conf.SampleProfile);
341 if (FileOrErr) {
342 Hasher.update(FileOrErr.get()->getBuffer());
343
344 if (!Conf.ProfileRemapping.empty()) {
345 FileOrErr = MemoryBuffer::getFile(Conf.ProfileRemapping);
346 if (FileOrErr)
347 Hasher.update(FileOrErr.get()->getBuffer());
348 }
349 }
350 }
351
352 return toHex(Hasher.result());
353}
354
355std::string llvm::recomputeLTOCacheKey(const std::string &Key,
356 StringRef ExtraID) {
357 SHA1 Hasher;
358
359 auto AddString = [&](StringRef Str) {
360 Hasher.update(Str);
361 Hasher.update(ArrayRef<uint8_t>{0});
362 };
363 AddString(Key);
364 AddString(ExtraID);
365
366 return toHex(Hasher.result());
367}
368
370 const Config &C, ValueInfo VI,
371 DenseSet<GlobalValueSummary *> &GlobalInvolvedWithAlias,
373 isPrevailing,
375 recordNewLinkage,
376 const DenseSet<GlobalValue::GUID> &GUIDPreservedSymbols) {
378 C.VisibilityScheme == Config::ELF ? VI.getELFVisibility()
380 for (auto &S : VI.getSummaryList()) {
381 GlobalValue::LinkageTypes OriginalLinkage = S->linkage();
382 // Ignore local and appending linkage values since the linker
383 // doesn't resolve them.
384 if (GlobalValue::isLocalLinkage(OriginalLinkage) ||
386 continue;
387 // We need to emit only one of these. The prevailing module will keep it,
388 // but turned into a weak, while the others will drop it when possible.
389 // This is both a compile-time optimization and a correctness
390 // transformation. This is necessary for correctness when we have exported
391 // a reference - we need to convert the linkonce to weak to
392 // ensure a copy is kept to satisfy the exported reference.
393 // FIXME: We may want to split the compile time and correctness
394 // aspects into separate routines.
395 if (isPrevailing(VI.getGUID(), S.get())) {
396 if (GlobalValue::isLinkOnceLinkage(OriginalLinkage)) {
397 S->setLinkage(GlobalValue::getWeakLinkage(
398 GlobalValue::isLinkOnceODRLinkage(OriginalLinkage)));
399 // The kept copy is eligible for auto-hiding (hidden visibility) if all
400 // copies were (i.e. they were all linkonce_odr global unnamed addr).
401 // If any copy is not (e.g. it was originally weak_odr), then the symbol
402 // must remain externally available (e.g. a weak_odr from an explicitly
403 // instantiated template). Additionally, if it is in the
404 // GUIDPreservedSymbols set, that means that it is visibile outside
405 // the summary (e.g. in a native object or a bitcode file without
406 // summary), and in that case we cannot hide it as it isn't possible to
407 // check all copies.
408 S->setCanAutoHide(VI.canAutoHide() &&
409 !GUIDPreservedSymbols.count(VI.getGUID()));
410 }
411 if (C.VisibilityScheme == Config::FromPrevailing)
412 Visibility = S->getVisibility();
413 }
414 // Alias and aliasee can't be turned into available_externally.
415 // When force-import-all is used, it indicates that object linking is not
416 // supported by the target. In this case, we can't change the linkage as
417 // well in case the global is converted to declaration.
418 else if (!isa<AliasSummary>(S.get()) &&
419 !GlobalInvolvedWithAlias.count(S.get()) && !ForceImportAll)
421
422 // For ELF, set visibility to the computed visibility from summaries. We
423 // don't track visibility from declarations so this may be more relaxed than
424 // the most constraining one.
425 if (C.VisibilityScheme == Config::ELF)
426 S->setVisibility(Visibility);
427
428 if (S->linkage() != OriginalLinkage)
429 recordNewLinkage(S->modulePath(), VI.getGUID(), S->linkage());
430 }
431
432 if (C.VisibilityScheme == Config::FromPrevailing) {
433 for (auto &S : VI.getSummaryList()) {
434 GlobalValue::LinkageTypes OriginalLinkage = S->linkage();
435 if (GlobalValue::isLocalLinkage(OriginalLinkage) ||
437 continue;
438 S->setVisibility(Visibility);
439 }
440 }
441}
442
443/// Resolve linkage for prevailing symbols in the \p Index.
444//
445// We'd like to drop these functions if they are no longer referenced in the
446// current module. However there is a chance that another module is still
447// referencing them because of the import. We make sure we always emit at least
448// one copy.
450 const Config &C, ModuleSummaryIndex &Index,
452 isPrevailing,
454 recordNewLinkage,
455 const DenseSet<GlobalValue::GUID> &GUIDPreservedSymbols) {
456 // We won't optimize the globals that are referenced by an alias for now
457 // Ideally we should turn the alias into a global and duplicate the definition
458 // when needed.
459 DenseSet<GlobalValueSummary *> GlobalInvolvedWithAlias;
460 for (auto &I : Index)
461 for (auto &S : I.second.getSummaryList())
462 if (auto AS = dyn_cast<AliasSummary>(S.get()))
463 GlobalInvolvedWithAlias.insert(&AS->getAliasee());
464
465 for (auto &I : Index)
466 thinLTOResolvePrevailingGUID(C, Index.getValueInfo(I),
467 GlobalInvolvedWithAlias, isPrevailing,
468 recordNewLinkage, GUIDPreservedSymbols);
469}
470
472 ValueInfo VI, function_ref<bool(StringRef, ValueInfo)> isExported,
474 isPrevailing) {
475 // Before performing index-based internalization and promotion for this GUID,
476 // the local flag should be consistent with the summary list linkage types.
477 VI.verifyLocal();
478
479 const bool SingleExternallyVisibleCopy =
480 VI.getSummaryList().size() == 1 &&
481 !GlobalValue::isLocalLinkage(VI.getSummaryList().front()->linkage());
482
483 for (auto &S : VI.getSummaryList()) {
484 // First see if we need to promote an internal value because it is not
485 // exported.
486 if (isExported(S->modulePath(), VI)) {
487 if (GlobalValue::isLocalLinkage(S->linkage()))
488 S->setLinkage(GlobalValue::ExternalLinkage);
489 continue;
490 }
491
492 // Otherwise, see if we can internalize.
494 continue;
495
496 // Non-exported values with external linkage can be internalized.
497 if (GlobalValue::isExternalLinkage(S->linkage())) {
498 S->setLinkage(GlobalValue::InternalLinkage);
499 continue;
500 }
501
502 // Non-exported function and variable definitions with a weak-for-linker
503 // linkage can be internalized in certain cases. The minimum legality
504 // requirements would be that they are not address taken to ensure that we
505 // don't break pointer equality checks, and that variables are either read-
506 // or write-only. For functions, this is the case if either all copies are
507 // [local_]unnamed_addr, or we can propagate reference edge attributes
508 // (which is how this is guaranteed for variables, when analyzing whether
509 // they are read or write-only).
510 //
511 // However, we only get to this code for weak-for-linkage values in one of
512 // two cases:
513 // 1) The prevailing copy is not in IR (it is in native code).
514 // 2) The prevailing copy in IR is not exported from its module.
515 // Additionally, at least for the new LTO API, case 2 will only happen if
516 // there is exactly one definition of the value (i.e. in exactly one
517 // module), as duplicate defs are result in the value being marked exported.
518 // Likely, users of the legacy LTO API are similar, however, currently there
519 // are llvm-lto based tests of the legacy LTO API that do not mark
520 // duplicate linkonce_odr copies as exported via the tool, so we need
521 // to handle that case below by checking the number of copies.
522 //
523 // Generally, we only want to internalize a weak-for-linker value in case
524 // 2, because in case 1 we cannot see how the value is used to know if it
525 // is read or write-only. We also don't want to bloat the binary with
526 // multiple internalized copies of non-prevailing linkonce/weak functions.
527 // Note if we don't internalize, we will convert non-prevailing copies to
528 // available_externally anyway, so that we drop them after inlining. The
529 // only reason to internalize such a function is if we indeed have a single
530 // copy, because internalizing it won't increase binary size, and enables
531 // use of inliner heuristics that are more aggressive in the face of a
532 // single call to a static (local). For variables, internalizing a read or
533 // write only variable can enable more aggressive optimization. However, we
534 // already perform this elsewhere in the ThinLTO backend handling for
535 // read or write-only variables (processGlobalForThinLTO).
536 //
537 // Therefore, only internalize linkonce/weak if there is a single copy, that
538 // is prevailing in this IR module. We can do so aggressively, without
539 // requiring the address to be insignificant, or that a variable be read or
540 // write-only.
541 if (!GlobalValue::isWeakForLinker(S->linkage()) ||
543 continue;
544
545 // We may have a single summary copy that is externally visible but not
546 // prevailing if the prevailing copy is in a native object.
547 if (SingleExternallyVisibleCopy && isPrevailing(VI.getGUID(), S.get()))
548 S->setLinkage(GlobalValue::InternalLinkage);
549 }
550}
551
552// Update the linkages in the given \p Index to mark exported values
553// as external and non-exported values as internal.
555 ModuleSummaryIndex &Index,
556 function_ref<bool(StringRef, ValueInfo)> isExported,
558 isPrevailing) {
559 assert(!Index.withInternalizeAndPromote());
560 for (auto &I : Index)
561 thinLTOInternalizeAndPromoteGUID(Index.getValueInfo(I), isExported,
562 isPrevailing);
563 Index.setWithInternalizeAndPromote();
564}
565
566// Requires a destructor for std::vector<InputModule>.
567InputFile::~InputFile() = default;
568
570 std::unique_ptr<InputFile> File(new InputFile);
571
572 Expected<IRSymtabFile> FOrErr = readIRSymtab(Object);
573 if (!FOrErr)
574 return FOrErr.takeError();
575
576 File->TargetTriple = FOrErr->TheReader.getTargetTriple();
577 File->SourceFileName = FOrErr->TheReader.getSourceFileName();
578 File->COFFLinkerOpts = FOrErr->TheReader.getCOFFLinkerOpts();
579 File->DependentLibraries = FOrErr->TheReader.getDependentLibraries();
580 File->ComdatTable = FOrErr->TheReader.getComdatTable();
581 File->MbRef =
582 Object; // Save a memory buffer reference to an input file object.
583
584 for (unsigned I = 0; I != FOrErr->Mods.size(); ++I) {
585 size_t Begin = File->Symbols.size();
586 for (const irsymtab::Reader::SymbolRef &Sym :
587 FOrErr->TheReader.module_symbols(I))
588 // Skip symbols that are irrelevant to LTO. Note that this condition needs
589 // to match the one in Skip() in LTO::addRegularLTO().
590 if (Sym.isGlobal() && !Sym.isFormatSpecific())
591 File->Symbols.push_back(Sym);
592 File->ModuleSymIndices.push_back({Begin, File->Symbols.size()});
593 }
594
595 File->Mods = FOrErr->Mods;
596 File->Strtab = std::move(FOrErr->Strtab);
597 return std::move(File);
598}
599
601 return Mods[0].getModuleIdentifier();
602}
603
605 assert(Mods.size() == 1 && "Expect only one bitcode module");
606 return Mods[0];
607}
608
609LTO::RegularLTOState::RegularLTOState(unsigned ParallelCodeGenParallelismLevel,
610 const Config &Conf)
611 : ParallelCodeGenParallelismLevel(ParallelCodeGenParallelismLevel),
612 Ctx(Conf), CombinedModule(std::make_unique<Module>("ld-temp.o", Ctx)),
613 Mover(std::make_unique<IRMover>(*CombinedModule)) {}
614
615LTO::ThinLTOState::ThinLTOState(ThinBackend BackendParam)
616 : Backend(std::move(BackendParam)), CombinedIndex(/*HaveGVs*/ false) {
617 if (!Backend.isValid())
618 Backend =
620}
621
623 unsigned ParallelCodeGenParallelismLevel, LTOKind LTOMode)
624 : Conf(std::move(Conf)),
625 RegularLTO(ParallelCodeGenParallelismLevel, this->Conf),
626 ThinLTO(std::move(Backend)),
627 GlobalResolutions(
628 std::make_unique<DenseMap<StringRef, GlobalResolution>>()),
629 LTOMode(LTOMode) {
630 if (Conf.KeepSymbolNameCopies || LTOKeepSymbolCopies) {
631 Alloc = std::make_unique<BumpPtrAllocator>();
632 GlobalResolutionSymbolSaver = std::make_unique<llvm::StringSaver>(*Alloc);
633 }
634}
635
636// Requires a destructor for MapVector<BitcodeModule>.
637LTO::~LTO() = default;
638
639// Add the symbols in the given module to the GlobalResolutions map, and resolve
640// their partitions.
641void LTO::addModuleToGlobalRes(ArrayRef<InputFile::Symbol> Syms,
643 unsigned Partition, bool InSummary) {
644 llvm::TimeTraceScope timeScope("LTO add module to global resolution");
645 auto *ResI = Res.begin();
646 auto *ResE = Res.end();
647 (void)ResE;
648 for (const InputFile::Symbol &Sym : Syms) {
649 assert(ResI != ResE);
650 SymbolResolution Res = *ResI++;
651
652 StringRef SymbolName = Sym.getName();
653 // Keep copies of symbols if the client of LTO says so.
654 if (GlobalResolutionSymbolSaver && !GlobalResolutions->contains(SymbolName))
655 SymbolName = GlobalResolutionSymbolSaver->save(SymbolName);
656
657 auto &GlobalRes = (*GlobalResolutions)[SymbolName];
658 GlobalRes.UnnamedAddr &= Sym.isUnnamedAddr();
659 if (Res.Prevailing) {
660 assert(!GlobalRes.Prevailing &&
661 "Multiple prevailing defs are not allowed");
662 GlobalRes.Prevailing = true;
663 GlobalRes.IRName = std::string(Sym.getIRName());
664 } else if (!GlobalRes.Prevailing && GlobalRes.IRName.empty()) {
665 // Sometimes it can be two copies of symbol in a module and prevailing
666 // symbol can have no IR name. That might happen if symbol is defined in
667 // module level inline asm block. In case we have multiple modules with
668 // the same symbol we want to use IR name of the prevailing symbol.
669 // Otherwise, if we haven't seen a prevailing symbol, set the name so that
670 // we can later use it to check if there is any prevailing copy in IR.
671 GlobalRes.IRName = std::string(Sym.getIRName());
672 }
673
674 // In rare occasion, the symbol used to initialize GlobalRes has a different
675 // IRName from the inspected Symbol. This can happen on macOS + iOS, when a
676 // symbol is referenced through its mangled name, say @"\01_symbol" while
677 // the IRName is @symbol (the prefix underscore comes from MachO mangling).
678 // In that case, we have the same actual Symbol that can get two different
679 // GUID, leading to some invalid internalization. Workaround this by marking
680 // the GlobalRes external.
681
682 // FIXME: instead of this check, it would be desirable to compute GUIDs
683 // based on mangled name, but this requires an access to the Target Triple
684 // and would be relatively invasive on the codebase.
685 if (GlobalRes.IRName != Sym.getIRName()) {
686 GlobalRes.Partition = GlobalResolution::External;
687 GlobalRes.VisibleOutsideSummary = true;
688 }
689
690 // Set the partition to external if we know it is re-defined by the linker
691 // with -defsym or -wrap options, used elsewhere, e.g. it is visible to a
692 // regular object, is referenced from llvm.compiler.used/llvm.used, or was
693 // already recorded as being referenced from a different partition.
694 if (Res.LinkerRedefined || Res.VisibleToRegularObj || Sym.isUsed() ||
695 (GlobalRes.Partition != GlobalResolution::Unknown &&
696 GlobalRes.Partition != Partition)) {
697 GlobalRes.Partition = GlobalResolution::External;
698 } else
699 // First recorded reference, save the current partition.
700 GlobalRes.Partition = Partition;
701
702 // Flag as visible outside of summary if visible from a regular object or
703 // from a module that does not have a summary.
704 GlobalRes.VisibleOutsideSummary |=
705 (Res.VisibleToRegularObj || Sym.isUsed() || !InSummary);
706
707 GlobalRes.ExportDynamic |= Res.ExportDynamic;
708 }
709}
710
711void LTO::releaseGlobalResolutionsMemory() {
712 // Release GlobalResolutions dense-map itself.
713 GlobalResolutions.reset();
714 // Release the string saver memory.
715 GlobalResolutionSymbolSaver.reset();
716 Alloc.reset();
717}
718
721 StringRef Path = Input->getName();
722 OS << Path << '\n';
723 auto ResI = Res.begin();
724 for (const InputFile::Symbol &Sym : Input->symbols()) {
725 assert(ResI != Res.end());
726 SymbolResolution Res = *ResI++;
727
728 OS << "-r=" << Path << ',' << Sym.getName() << ',';
729 if (Res.Prevailing)
730 OS << 'p';
732 OS << 'l';
733 if (Res.VisibleToRegularObj)
734 OS << 'x';
735 if (Res.LinkerRedefined)
736 OS << 'r';
737 OS << '\n';
738 }
739 OS.flush();
740 assert(ResI == Res.end());
741}
742
743Error LTO::add(std::unique_ptr<InputFile> InputPtr,
745 llvm::TimeTraceScope timeScope("LTO add input", InputPtr->getName());
746 assert(!CalledGetMaxTasks);
747
749 addInput(std::move(InputPtr));
750 if (!InputOrErr)
751 return InputOrErr.takeError();
752 InputFile *Input = (*InputOrErr).get();
753
754 if (Conf.ResolutionFile)
755 writeToResolutionFile(*Conf.ResolutionFile, Input, Res);
756
757 if (RegularLTO.CombinedModule->getTargetTriple().empty()) {
758 Triple InputTriple(Input->getTargetTriple());
759 RegularLTO.CombinedModule->setTargetTriple(InputTriple);
760 if (InputTriple.isOSBinFormatELF())
761 Conf.VisibilityScheme = Config::ELF;
762 }
763
764 ArrayRef<SymbolResolution> InputRes = Res;
765 for (unsigned I = 0; I != Input->Mods.size(); ++I) {
766 if (auto Err = addModule(*Input, InputRes, I, Res).moveInto(Res))
767 return Err;
768 }
769
770 assert(Res.empty());
771 return Error::success();
772}
773
775LTO::addModule(InputFile &Input, ArrayRef<SymbolResolution> InputRes,
776 unsigned ModI, ArrayRef<SymbolResolution> Res) {
777 llvm::TimeTraceScope timeScope("LTO add module", Input.getName());
778 Expected<BitcodeLTOInfo> LTOInfo = Input.Mods[ModI].getLTOInfo();
779 if (!LTOInfo)
780 return LTOInfo.takeError();
781
782 if (EnableSplitLTOUnit) {
783 // If only some modules were split, flag this in the index so that
784 // we can skip or error on optimizations that need consistently split
785 // modules (whole program devirt and lower type tests).
786 if (*EnableSplitLTOUnit != LTOInfo->EnableSplitLTOUnit)
787 ThinLTO.CombinedIndex.setPartiallySplitLTOUnits();
788 } else
789 EnableSplitLTOUnit = LTOInfo->EnableSplitLTOUnit;
790
791 BitcodeModule BM = Input.Mods[ModI];
792
793 if ((LTOMode == LTOK_UnifiedRegular || LTOMode == LTOK_UnifiedThin) &&
794 !LTOInfo->UnifiedLTO)
796 "unified LTO compilation must use "
797 "compatible bitcode modules (use -funified-lto)",
799
800 if (LTOInfo->UnifiedLTO && LTOMode == LTOK_Default)
801 LTOMode = LTOK_UnifiedThin;
802
803 bool IsThinLTO = LTOInfo->IsThinLTO && (LTOMode != LTOK_UnifiedRegular);
804 // If any of the modules inside of a input bitcode file was compiled with
805 // ThinLTO, we assume that the whole input file also was compiled with
806 // ThinLTO.
807 Input.IsThinLTO = IsThinLTO;
808
809 auto ModSyms = Input.module_symbols(ModI);
810 addModuleToGlobalRes(ModSyms, Res,
811 IsThinLTO ? ThinLTO.ModuleMap.size() + 1 : 0,
812 LTOInfo->HasSummary);
813
814 if (IsThinLTO)
815 return addThinLTO(BM, ModSyms, Res);
816
817 RegularLTO.EmptyCombinedModule = false;
818 auto ModOrErr = addRegularLTO(Input, InputRes, BM, ModSyms, Res);
819 if (!ModOrErr)
820 return ModOrErr.takeError();
821 Res = ModOrErr->second;
822
823 if (!LTOInfo->HasSummary) {
824 if (Error Err = linkRegularLTO(std::move(ModOrErr->first),
825 /*LivenessFromIndex=*/false))
826 return Err;
827 return Res;
828 }
829
830 // Regular LTO module summaries are added to a dummy module that represents
831 // the combined regular LTO module.
832 if (Error Err = BM.readSummary(ThinLTO.CombinedIndex, ""))
833 return Err;
834 RegularLTO.ModsWithSummaries.push_back(std::move(ModOrErr->first));
835 return Res;
836}
837
838// Checks whether the given global value is in a non-prevailing comdat
839// (comdat containing values the linker indicated were not prevailing,
840// which we then dropped to available_externally), and if so, removes
841// it from the comdat. This is called for all global values to ensure the
842// comdat is empty rather than leaving an incomplete comdat. It is needed for
843// regular LTO modules, in case we are in a mixed-LTO mode (both regular
844// and thin LTO modules) compilation. Since the regular LTO module will be
845// linked first in the final native link, we want to make sure the linker
846// doesn't select any of these incomplete comdats that would be left
847// in the regular LTO module without this cleanup.
848static void
850 std::set<const Comdat *> &NonPrevailingComdats) {
851 Comdat *C = GV.getComdat();
852 if (!C)
853 return;
854
855 if (!NonPrevailingComdats.count(C))
856 return;
857
858 // Additionally need to drop all global values from the comdat to
859 // available_externally, to satisfy the COMDAT requirement that all members
860 // are discarded as a unit. The non-local linkage global values avoid
861 // duplicate definition linker errors.
863
864 if (auto GO = dyn_cast<GlobalObject>(&GV))
865 GO->setComdat(nullptr);
866}
867
868// Add a regular LTO object to the link.
869// The resulting module needs to be linked into the combined LTO module with
870// linkRegularLTO.
871Expected<
872 std::pair<LTO::RegularLTOState::AddedModule, ArrayRef<SymbolResolution>>>
873LTO::addRegularLTO(InputFile &Input, ArrayRef<SymbolResolution> InputRes,
874 BitcodeModule BM, ArrayRef<InputFile::Symbol> Syms,
876 llvm::TimeTraceScope timeScope("LTO add regular LTO");
878 Expected<std::unique_ptr<Module>> MOrErr =
879 BM.getLazyModule(RegularLTO.Ctx, /*ShouldLazyLoadMetadata*/ true,
880 /*IsImporting*/ false);
881 if (!MOrErr)
882 return MOrErr.takeError();
883 Module &M = **MOrErr;
884 Mod.M = std::move(*MOrErr);
885
886 if (Error Err = M.materializeMetadata())
887 return std::move(Err);
888
889 if (LTOMode == LTOK_UnifiedRegular) {
890 // cfi.functions metadata is intended to be used with ThinLTO and may
891 // trigger invalid IR transformations if they are present when doing regular
892 // LTO, so delete it.
893 if (NamedMDNode *CfiFunctionsMD = M.getNamedMetadata("cfi.functions"))
894 M.eraseNamedMetadata(CfiFunctionsMD);
895 } else if (NamedMDNode *AliasesMD = M.getNamedMetadata("aliases")) {
896 // Delete aliases entries for non-prevailing symbols on the ThinLTO side of
897 // this input file.
898 DenseSet<StringRef> Prevailing;
899 for (auto [I, R] : zip(Input.symbols(), InputRes))
900 if (R.Prevailing && !I.getIRName().empty())
901 Prevailing.insert(I.getIRName());
902 std::vector<MDNode *> AliasGroups;
903 for (MDNode *AliasGroup : AliasesMD->operands()) {
904 std::vector<Metadata *> Aliases;
905 for (Metadata *Alias : AliasGroup->operands()) {
906 if (isa<MDString>(Alias) &&
907 Prevailing.count(cast<MDString>(Alias)->getString()))
908 Aliases.push_back(Alias);
909 }
910 if (Aliases.size() > 1)
911 AliasGroups.push_back(MDTuple::get(RegularLTO.Ctx, Aliases));
912 }
913 AliasesMD->clearOperands();
914 for (MDNode *G : AliasGroups)
915 AliasesMD->addOperand(G);
916 }
917
919
920 ModuleSymbolTable SymTab;
921 SymTab.addModule(&M);
922
923 for (GlobalVariable &GV : M.globals())
924 if (GV.hasAppendingLinkage())
925 Mod.Keep.push_back(&GV);
926
927 DenseSet<GlobalObject *> AliasedGlobals;
928 for (auto &GA : M.aliases())
929 if (GlobalObject *GO = GA.getAliaseeObject())
930 AliasedGlobals.insert(GO);
931
932 // In this function we need IR GlobalValues matching the symbols in Syms
933 // (which is not backed by a module), so we need to enumerate them in the same
934 // order. The symbol enumeration order of a ModuleSymbolTable intentionally
935 // matches the order of an irsymtab, but when we read the irsymtab in
936 // InputFile::create we omit some symbols that are irrelevant to LTO. The
937 // Skip() function skips the same symbols from the module as InputFile does
938 // from the symbol table.
939 auto MsymI = SymTab.symbols().begin(), MsymE = SymTab.symbols().end();
940 auto Skip = [&]() {
941 while (MsymI != MsymE) {
942 auto Flags = SymTab.getSymbolFlags(*MsymI);
943 if ((Flags & object::BasicSymbolRef::SF_Global) &&
945 return;
946 ++MsymI;
947 }
948 };
949 Skip();
950
951 std::set<const Comdat *> NonPrevailingComdats;
952 SmallSet<StringRef, 2> NonPrevailingAsmSymbols;
953 for (const InputFile::Symbol &Sym : Syms) {
954 assert(!Res.empty());
955 const SymbolResolution &R = Res.consume_front();
956
957 assert(MsymI != MsymE);
958 ModuleSymbolTable::Symbol Msym = *MsymI++;
959 Skip();
960
961 if (GlobalValue *GV = dyn_cast_if_present<GlobalValue *>(Msym)) {
962 if (R.Prevailing) {
963 if (Sym.isUndefined())
964 continue;
965 Mod.Keep.push_back(GV);
966 // For symbols re-defined with linker -wrap and -defsym options,
967 // set the linkage to weak to inhibit IPO. The linkage will be
968 // restored by the linker.
969 if (R.LinkerRedefined)
970 GV->setLinkage(GlobalValue::WeakAnyLinkage);
971
972 GlobalValue::LinkageTypes OriginalLinkage = GV->getLinkage();
973 if (GlobalValue::isLinkOnceLinkage(OriginalLinkage))
974 GV->setLinkage(GlobalValue::getWeakLinkage(
975 GlobalValue::isLinkOnceODRLinkage(OriginalLinkage)));
976 } else if (isa<GlobalObject>(GV) &&
977 (GV->hasLinkOnceODRLinkage() || GV->hasWeakODRLinkage() ||
978 GV->hasAvailableExternallyLinkage()) &&
979 !AliasedGlobals.count(cast<GlobalObject>(GV))) {
980 // Any of the above three types of linkage indicates that the
981 // chosen prevailing symbol will have the same semantics as this copy of
982 // the symbol, so we may be able to link it with available_externally
983 // linkage. We will decide later whether to do that when we link this
984 // module (in linkRegularLTO), based on whether it is undefined.
985 Mod.Keep.push_back(GV);
987 if (GV->hasComdat())
988 NonPrevailingComdats.insert(GV->getComdat());
989 cast<GlobalObject>(GV)->setComdat(nullptr);
990 }
991
992 // Set the 'local' flag based on the linker resolution for this symbol.
993 if (R.FinalDefinitionInLinkageUnit) {
994 GV->setDSOLocal(true);
995 if (GV->hasDLLImportStorageClass())
996 GV->setDLLStorageClass(GlobalValue::DLLStorageClassTypes::
997 DefaultStorageClass);
998 }
999 } else if (auto *AS =
1001 // Collect non-prevailing symbols.
1002 if (!R.Prevailing)
1003 NonPrevailingAsmSymbols.insert(AS->first);
1004 } else {
1005 llvm_unreachable("unknown symbol type");
1006 }
1007
1008 // Common resolution: collect the maximum size/alignment over all commons.
1009 // We also record if we see an instance of a common as prevailing, so that
1010 // if none is prevailing we can ignore it later.
1011 if (Sym.isCommon()) {
1012 // FIXME: We should figure out what to do about commons defined by asm.
1013 // For now they aren't reported correctly by ModuleSymbolTable.
1014 auto &CommonRes = RegularLTO.Commons[std::string(Sym.getIRName())];
1015 CommonRes.Size = std::max(CommonRes.Size, Sym.getCommonSize());
1016 if (uint32_t SymAlignValue = Sym.getCommonAlignment()) {
1017 CommonRes.Alignment =
1018 std::max(Align(SymAlignValue), CommonRes.Alignment);
1019 }
1020 CommonRes.Prevailing |= R.Prevailing;
1021 }
1022 }
1023
1024 if (!M.getComdatSymbolTable().empty())
1025 for (GlobalValue &GV : M.global_values())
1026 handleNonPrevailingComdat(GV, NonPrevailingComdats);
1027
1028 // Prepend ".lto_discard <sym>, <sym>*" directive to each module inline asm
1029 // block.
1030 if (!M.getModuleInlineAsm().empty()) {
1031 std::string NewIA = ".lto_discard";
1032 if (!NonPrevailingAsmSymbols.empty()) {
1033 // Don't dicard a symbol if there is a live .symver for it.
1035 M, [&](StringRef Name, StringRef Alias) {
1036 if (!NonPrevailingAsmSymbols.count(Alias))
1037 NonPrevailingAsmSymbols.erase(Name);
1038 });
1039 NewIA += " " + llvm::join(NonPrevailingAsmSymbols, ", ");
1040 }
1041 NewIA += "\n";
1042 M.setModuleInlineAsm(NewIA + M.getModuleInlineAsm());
1043 }
1044
1045 assert(MsymI == MsymE);
1046 return std::make_pair(std::move(Mod), Res);
1047}
1048
1049Error LTO::linkRegularLTO(RegularLTOState::AddedModule Mod,
1050 bool LivenessFromIndex) {
1051 llvm::TimeTraceScope timeScope("LTO link regular LTO");
1052 std::vector<GlobalValue *> Keep;
1053 for (GlobalValue *GV : Mod.Keep) {
1054 if (LivenessFromIndex && !ThinLTO.CombinedIndex.isGUIDLive(GV->getGUID())) {
1055 if (Function *F = dyn_cast<Function>(GV)) {
1056 if (DiagnosticOutputFile) {
1057 if (Error Err = F->materialize())
1058 return Err;
1059 OptimizationRemarkEmitter ORE(F, nullptr);
1060 ORE.emit(OptimizationRemark(DEBUG_TYPE, "deadfunction", F)
1061 << ore::NV("Function", F)
1062 << " not added to the combined module ");
1063 }
1064 }
1065 continue;
1066 }
1067
1068 if (!GV->hasAvailableExternallyLinkage()) {
1069 Keep.push_back(GV);
1070 continue;
1071 }
1072
1073 // Only link available_externally definitions if we don't already have a
1074 // definition.
1075 GlobalValue *CombinedGV =
1076 RegularLTO.CombinedModule->getNamedValue(GV->getName());
1077 if (CombinedGV && !CombinedGV->isDeclaration())
1078 continue;
1079
1080 Keep.push_back(GV);
1081 }
1082
1083 return RegularLTO.Mover->move(std::move(Mod.M), Keep, nullptr,
1084 /* IsPerformingImport */ false);
1085}
1086
1087// Add a ThinLTO module to the link.
1088Expected<ArrayRef<SymbolResolution>>
1089LTO::addThinLTO(BitcodeModule BM, ArrayRef<InputFile::Symbol> Syms,
1091 llvm::TimeTraceScope timeScope("LTO add thin LTO");
1092 const auto BMID = BM.getModuleIdentifier();
1093 ArrayRef<SymbolResolution> ResTmp = Res;
1094 for (const InputFile::Symbol &Sym : Syms) {
1095 assert(!ResTmp.empty());
1096 const SymbolResolution &R = ResTmp.consume_front();
1097
1098 if (!Sym.getIRName().empty() && R.Prevailing) {
1100 GlobalValue::getGlobalIdentifier(Sym.getIRName(),
1102 ThinLTO.setPrevailingModuleForGUID(GUID, BMID);
1103 }
1104 }
1105
1106 if (Error Err = BM.readSummary(
1107 ThinLTO.CombinedIndex, BMID, [&](GlobalValue::GUID GUID) {
1108 return ThinLTO.isPrevailingModuleForGUID(GUID, BMID);
1109 }))
1110 return Err;
1111 LLVM_DEBUG(dbgs() << "Module " << BMID << "\n");
1112
1113 for (const InputFile::Symbol &Sym : Syms) {
1114 assert(!Res.empty());
1115 const SymbolResolution &R = Res.consume_front();
1116
1117 if (!Sym.getIRName().empty() &&
1118 (R.Prevailing || R.FinalDefinitionInLinkageUnit)) {
1120 GlobalValue::getGlobalIdentifier(Sym.getIRName(),
1122 if (R.Prevailing) {
1123 assert(ThinLTO.isPrevailingModuleForGUID(GUID, BMID));
1124
1125 // For linker redefined symbols (via --wrap or --defsym) we want to
1126 // switch the linkage to `weak` to prevent IPOs from happening.
1127 // Find the summary in the module for this very GV and record the new
1128 // linkage so that we can switch it when we import the GV.
1129 if (R.LinkerRedefined)
1130 if (auto S = ThinLTO.CombinedIndex.findSummaryInModule(GUID, BMID))
1131 S->setLinkage(GlobalValue::WeakAnyLinkage);
1132 }
1133
1134 // If the linker resolved the symbol to a local definition then mark it
1135 // as local in the summary for the module we are adding.
1136 if (R.FinalDefinitionInLinkageUnit) {
1137 if (auto S = ThinLTO.CombinedIndex.findSummaryInModule(GUID, BMID)) {
1138 S->setDSOLocal(true);
1139 }
1140 }
1141 }
1142 }
1143
1144 if (!ThinLTO.ModuleMap.insert({BMID, BM}).second)
1146 "Expected at most one ThinLTO module per bitcode file",
1148
1149 if (!Conf.ThinLTOModulesToCompile.empty()) {
1150 if (!ThinLTO.ModulesToCompile)
1151 ThinLTO.ModulesToCompile = ModuleMapType();
1152 // This is a fuzzy name matching where only modules with name containing the
1153 // specified switch values are going to be compiled.
1154 for (const std::string &Name : Conf.ThinLTOModulesToCompile) {
1155 if (BMID.contains(Name)) {
1156 ThinLTO.ModulesToCompile->insert({BMID, BM});
1157 LLVM_DEBUG(dbgs() << "[ThinLTO] Selecting " << BMID << " to compile\n");
1158 break;
1159 }
1160 }
1161 }
1162
1163 return Res;
1164}
1165
1166unsigned LTO::getMaxTasks() const {
1167 CalledGetMaxTasks = true;
1168 auto ModuleCount = ThinLTO.ModulesToCompile ? ThinLTO.ModulesToCompile->size()
1169 : ThinLTO.ModuleMap.size();
1170 return RegularLTO.ParallelCodeGenParallelismLevel + ModuleCount;
1171}
1172
1173// If only some of the modules were split, we cannot correctly handle
1174// code that contains type tests or type checked loads.
1175Error LTO::checkPartiallySplit() {
1176 if (!ThinLTO.CombinedIndex.partiallySplitLTOUnits())
1177 return Error::success();
1178
1179 const Module *Combined = RegularLTO.CombinedModule.get();
1180 Function *TypeTestFunc =
1181 Intrinsic::getDeclarationIfExists(Combined, Intrinsic::type_test);
1182 Function *TypeCheckedLoadFunc =
1183 Intrinsic::getDeclarationIfExists(Combined, Intrinsic::type_checked_load);
1184 Function *TypeCheckedLoadRelativeFunc = Intrinsic::getDeclarationIfExists(
1185 Combined, Intrinsic::type_checked_load_relative);
1186
1187 // First check if there are type tests / type checked loads in the
1188 // merged regular LTO module IR.
1189 if ((TypeTestFunc && !TypeTestFunc->use_empty()) ||
1190 (TypeCheckedLoadFunc && !TypeCheckedLoadFunc->use_empty()) ||
1191 (TypeCheckedLoadRelativeFunc &&
1192 !TypeCheckedLoadRelativeFunc->use_empty()))
1194 "inconsistent LTO Unit splitting (recompile with -fsplit-lto-unit)",
1196
1197 // Otherwise check if there are any recorded in the combined summary from the
1198 // ThinLTO modules.
1199 for (auto &P : ThinLTO.CombinedIndex) {
1200 for (auto &S : P.second.getSummaryList()) {
1201 auto *FS = dyn_cast<FunctionSummary>(S.get());
1202 if (!FS)
1203 continue;
1204 if (!FS->type_test_assume_vcalls().empty() ||
1205 !FS->type_checked_load_vcalls().empty() ||
1206 !FS->type_test_assume_const_vcalls().empty() ||
1207 !FS->type_checked_load_const_vcalls().empty() ||
1208 !FS->type_tests().empty())
1210 "inconsistent LTO Unit splitting (recompile with -fsplit-lto-unit)",
1212 }
1213 }
1214 return Error::success();
1215}
1216
1218 if (Error EC = handleArchiveInputs())
1219 return EC;
1220
1221 // Compute "dead" symbols, we don't want to import/export these!
1222 DenseSet<GlobalValue::GUID> GUIDPreservedSymbols;
1223 DenseMap<GlobalValue::GUID, PrevailingType> GUIDPrevailingResolutions;
1224 for (auto &Res : *GlobalResolutions) {
1225 // Normally resolution have IR name of symbol. We can do nothing here
1226 // otherwise. See comments in GlobalResolution struct for more details.
1227 if (Res.second.IRName.empty())
1228 continue;
1229
1231 GlobalValue::dropLLVMManglingEscape(Res.second.IRName));
1232
1233 if (Res.second.VisibleOutsideSummary && Res.second.Prevailing)
1234 GUIDPreservedSymbols.insert(GUID);
1235
1236 if (Res.second.ExportDynamic)
1237 DynamicExportSymbols.insert(GUID);
1238
1239 GUIDPrevailingResolutions[GUID] =
1240 Res.second.Prevailing ? PrevailingType::Yes : PrevailingType::No;
1241 }
1242
1243 auto isPrevailing = [&](GlobalValue::GUID G) {
1244 auto It = GUIDPrevailingResolutions.find(G);
1245 if (It == GUIDPrevailingResolutions.end())
1247 return It->second;
1248 };
1249 computeDeadSymbolsWithConstProp(ThinLTO.CombinedIndex, GUIDPreservedSymbols,
1250 isPrevailing, Conf.OptLevel > 0);
1251
1252 // Setup output file to emit statistics.
1253 auto StatsFileOrErr = setupStatsFile(Conf.StatsFile);
1254 if (!StatsFileOrErr)
1255 return StatsFileOrErr.takeError();
1256 std::unique_ptr<ToolOutputFile> StatsFile = std::move(StatsFileOrErr.get());
1257
1258 // TODO: Ideally this would be controlled automatically by detecting that we
1259 // are linking with an allocator that supports these interfaces, rather than
1260 // an internal option (which would still be needed for tests, however). For
1261 // example, if the library exported a symbol like __malloc_hot_cold the linker
1262 // could recognize that and set a flag in the lto::Config.
1264 ThinLTO.CombinedIndex.setWithSupportsHotColdNew();
1265
1266 Error Result = runRegularLTO(AddStream);
1267 if (!Result)
1268 // This will reset the GlobalResolutions optional once done with it to
1269 // reduce peak memory before importing.
1270 Result = runThinLTO(AddStream, Cache, GUIDPreservedSymbols);
1271
1272 if (StatsFile)
1273 PrintStatisticsJSON(StatsFile->os());
1274
1275 return Result;
1276}
1277
1278Error LTO::runRegularLTO(AddStreamFn AddStream) {
1279 llvm::TimeTraceScope timeScope("Run regular LTO");
1280 LLVMContext &CombinedCtx = RegularLTO.CombinedModule->getContext();
1281 // Setup optimization remarks.
1282 auto DiagFileOrErr = lto::setupLLVMOptimizationRemarks(
1283 CombinedCtx, Conf.RemarksFilename, Conf.RemarksPasses, Conf.RemarksFormat,
1285 LLVM_DEBUG(dbgs() << "Running regular LTO\n");
1286 if (!DiagFileOrErr)
1287 return DiagFileOrErr.takeError();
1288 DiagnosticOutputFile = std::move(*DiagFileOrErr);
1289
1290 // Finalize linking of regular LTO modules containing summaries now that
1291 // we have computed liveness information.
1292 {
1293 llvm::TimeTraceScope timeScope("Link regular LTO");
1294 for (auto &M : RegularLTO.ModsWithSummaries)
1295 if (Error Err = linkRegularLTO(std::move(M), /*LivenessFromIndex=*/true))
1296 return Err;
1297 }
1298
1299 // Ensure we don't have inconsistently split LTO units with type tests.
1300 // FIXME: this checks both LTO and ThinLTO. It happens to work as we take
1301 // this path both cases but eventually this should be split into two and
1302 // do the ThinLTO checks in `runThinLTO`.
1303 if (Error Err = checkPartiallySplit())
1304 return Err;
1305
1306 // Make sure commons have the right size/alignment: we kept the largest from
1307 // all the prevailing when adding the inputs, and we apply it here.
1308 const DataLayout &DL = RegularLTO.CombinedModule->getDataLayout();
1309 for (auto &I : RegularLTO.Commons) {
1310 if (!I.second.Prevailing)
1311 // Don't do anything if no instance of this common was prevailing.
1312 continue;
1313 GlobalVariable *OldGV = RegularLTO.CombinedModule->getNamedGlobal(I.first);
1314 if (OldGV && DL.getTypeAllocSize(OldGV->getValueType()) == I.second.Size) {
1315 // Don't create a new global if the type is already correct, just make
1316 // sure the alignment is correct.
1317 OldGV->setAlignment(I.second.Alignment);
1318 continue;
1319 }
1320 ArrayType *Ty =
1321 ArrayType::get(Type::getInt8Ty(RegularLTO.Ctx), I.second.Size);
1322 auto *GV = new GlobalVariable(*RegularLTO.CombinedModule, Ty, false,
1325 GV->setAlignment(I.second.Alignment);
1326 if (OldGV) {
1327 OldGV->replaceAllUsesWith(GV);
1328 GV->takeName(OldGV);
1329 OldGV->eraseFromParent();
1330 } else {
1331 GV->setName(I.first);
1332 }
1333 }
1334
1335 bool WholeProgramVisibilityEnabledInLTO =
1336 Conf.HasWholeProgramVisibility &&
1337 // If validation is enabled, upgrade visibility only when all vtables
1338 // have typeinfos.
1339 (!Conf.ValidateAllVtablesHaveTypeInfos || Conf.AllVtablesHaveTypeInfos);
1340
1341 // This returns true when the name is local or not defined. Locals are
1342 // expected to be handled separately.
1343 auto IsVisibleToRegularObj = [&](StringRef name) {
1344 auto It = GlobalResolutions->find(name);
1345 return (It == GlobalResolutions->end() ||
1346 It->second.VisibleOutsideSummary || !It->second.Prevailing);
1347 };
1348
1349 // If allowed, upgrade public vcall visibility metadata to linkage unit
1350 // visibility before whole program devirtualization in the optimizer.
1352 *RegularLTO.CombinedModule, WholeProgramVisibilityEnabledInLTO,
1353 DynamicExportSymbols, Conf.ValidateAllVtablesHaveTypeInfos,
1354 IsVisibleToRegularObj);
1355 updatePublicTypeTestCalls(*RegularLTO.CombinedModule,
1356 WholeProgramVisibilityEnabledInLTO);
1357
1358 if (Conf.PreOptModuleHook &&
1359 !Conf.PreOptModuleHook(0, *RegularLTO.CombinedModule))
1360 return finalizeOptimizationRemarks(std::move(DiagnosticOutputFile));
1361
1362 if (!Conf.CodeGenOnly) {
1363 for (const auto &R : *GlobalResolutions) {
1364 GlobalValue *GV =
1365 RegularLTO.CombinedModule->getNamedValue(R.second.IRName);
1366 if (!R.second.isPrevailingIRSymbol())
1367 continue;
1368 if (R.second.Partition != 0 &&
1369 R.second.Partition != GlobalResolution::External)
1370 continue;
1371
1372 // Ignore symbols defined in other partitions.
1373 // Also skip declarations, which are not allowed to have internal linkage.
1374 if (!GV || GV->hasLocalLinkage() || GV->isDeclaration())
1375 continue;
1376
1377 // Symbols that are marked DLLImport or DLLExport should not be
1378 // internalized, as they are either externally visible or referencing
1379 // external symbols. Symbols that have AvailableExternally or Appending
1380 // linkage might be used by future passes and should be kept as is.
1381 // These linkages are seen in Unified regular LTO, because the process
1382 // of creating split LTO units introduces symbols with that linkage into
1383 // one of the created modules. Normally, only the ThinLTO backend would
1384 // compile this module, but Unified Regular LTO processes both
1385 // modules created by the splitting process as regular LTO modules.
1386 if ((LTOMode == LTOKind::LTOK_UnifiedRegular) &&
1389 continue;
1390
1391 GV->setUnnamedAddr(R.second.UnnamedAddr ? GlobalValue::UnnamedAddr::Global
1393 if (EnableLTOInternalization && R.second.Partition == 0)
1395 }
1396
1397 if (Conf.PostInternalizeModuleHook &&
1398 !Conf.PostInternalizeModuleHook(0, *RegularLTO.CombinedModule))
1399 return finalizeOptimizationRemarks(std::move(DiagnosticOutputFile));
1400 }
1401
1402 if (!RegularLTO.EmptyCombinedModule || Conf.AlwaysEmitRegularLTOObj) {
1403 if (Error Err =
1404 backend(Conf, AddStream, RegularLTO.ParallelCodeGenParallelismLevel,
1405 *RegularLTO.CombinedModule, ThinLTO.CombinedIndex))
1406 return Err;
1407 }
1408
1409 return finalizeOptimizationRemarks(std::move(DiagnosticOutputFile));
1410}
1411
1413 RTLIB::RuntimeLibcallsInfo Libcalls(TT);
1414 SmallVector<const char *> LibcallSymbols;
1415 LibcallSymbols.reserve(Libcalls.getNumAvailableLibcallImpls());
1416
1417 for (RTLIB::LibcallImpl Impl : RTLIB::libcall_impls()) {
1418 if (Libcalls.isAvailable(Impl))
1419 LibcallSymbols.push_back(Libcalls.getLibcallImplName(Impl).data());
1420 }
1421
1422 return LibcallSymbols;
1423}
1424
1426 const FunctionImporter::ImportMapTy &ImportList, llvm::StringRef ModulePath,
1427 const std::string &NewModulePath) const {
1428 return emitFiles(ImportList, ModulePath, NewModulePath,
1429 NewModulePath + ".thinlto.bc",
1430 /*ImportsFiles=*/std::nullopt);
1431}
1432
1434 const FunctionImporter::ImportMapTy &ImportList, llvm::StringRef ModulePath,
1435 const std::string &NewModulePath, StringRef SummaryPath,
1436 std::optional<std::reference_wrapper<ImportsFilesContainer>> ImportsFiles)
1437 const {
1438 ModuleToSummariesForIndexTy ModuleToSummariesForIndex;
1439 GVSummaryPtrSet DeclarationSummaries;
1440
1441 std::error_code EC;
1443 ImportList, ModuleToSummariesForIndex,
1444 DeclarationSummaries);
1445
1446 raw_fd_ostream OS(SummaryPath, EC, sys::fs::OpenFlags::OF_None);
1447 if (EC)
1448 return createFileError("cannot open " + Twine(SummaryPath), EC);
1449
1450 writeIndexToFile(CombinedIndex, OS, &ModuleToSummariesForIndex,
1451 &DeclarationSummaries);
1452
1454 Error ImportsFilesError = EmitImportsFiles(
1455 ModulePath, NewModulePath + ".imports", ModuleToSummariesForIndex);
1456 if (ImportsFilesError)
1457 return ImportsFilesError;
1458 }
1459
1460 // Optionally, store the imports files.
1461 if (ImportsFiles)
1463 ModulePath, ModuleToSummariesForIndex,
1464 [&](StringRef M) { ImportsFiles->get().push_back(M.str()); });
1465
1466 return Error::success();
1467}
1468
1469namespace {
1470/// Base class for ThinLTO backends that perform code generation and insert the
1471/// generated files back into the link.
1472class CGThinBackend : public ThinBackendProc {
1473protected:
1474 AddStreamFn AddStream;
1475 DenseSet<GlobalValue::GUID> CfiFunctionDefs;
1476 DenseSet<GlobalValue::GUID> CfiFunctionDecls;
1477 bool ShouldEmitIndexFiles;
1478
1479public:
1480 CGThinBackend(
1481 const Config &Conf, ModuleSummaryIndex &CombinedIndex,
1482 const DenseMap<StringRef, GVSummaryMapTy> &ModuleToDefinedGVSummaries,
1483 AddStreamFn AddStream, lto::IndexWriteCallback OnWrite,
1484 bool ShouldEmitIndexFiles, bool ShouldEmitImportsFiles,
1485 ThreadPoolStrategy ThinLTOParallelism)
1486 : ThinBackendProc(Conf, CombinedIndex, ModuleToDefinedGVSummaries,
1487 OnWrite, ShouldEmitImportsFiles, ThinLTOParallelism),
1488 AddStream(std::move(AddStream)),
1489 ShouldEmitIndexFiles(ShouldEmitIndexFiles) {
1490 auto &Defs = CombinedIndex.cfiFunctionDefs();
1491 CfiFunctionDefs.insert_range(Defs.guids());
1492 auto &Decls = CombinedIndex.cfiFunctionDecls();
1493 CfiFunctionDecls.insert_range(Decls.guids());
1494 }
1495};
1496
1497/// This backend performs code generation by scheduling a job to run on
1498/// an in-process thread when invoked for each task.
1499class InProcessThinBackend : public CGThinBackend {
1500protected:
1501 FileCache Cache;
1502
1503public:
1504 InProcessThinBackend(
1505 const Config &Conf, ModuleSummaryIndex &CombinedIndex,
1506 ThreadPoolStrategy ThinLTOParallelism,
1507 const DenseMap<StringRef, GVSummaryMapTy> &ModuleToDefinedGVSummaries,
1508 AddStreamFn AddStream, FileCache Cache, lto::IndexWriteCallback OnWrite,
1509 bool ShouldEmitIndexFiles, bool ShouldEmitImportsFiles)
1510 : CGThinBackend(Conf, CombinedIndex, ModuleToDefinedGVSummaries,
1511 AddStream, OnWrite, ShouldEmitIndexFiles,
1512 ShouldEmitImportsFiles, ThinLTOParallelism),
1513 Cache(std::move(Cache)) {}
1514
1515 virtual Error runThinLTOBackendThread(
1516 AddStreamFn AddStream, FileCache Cache, unsigned Task, BitcodeModule BM,
1517 ModuleSummaryIndex &CombinedIndex,
1518 const FunctionImporter::ImportMapTy &ImportList,
1519 const FunctionImporter::ExportSetTy &ExportList,
1520 const std::map<GlobalValue::GUID, GlobalValue::LinkageTypes> &ResolvedODR,
1521 const GVSummaryMapTy &DefinedGlobals,
1522 MapVector<StringRef, BitcodeModule> &ModuleMap) {
1523 auto ModuleID = BM.getModuleIdentifier();
1524 llvm::TimeTraceScope timeScope("Run ThinLTO backend thread (in-process)",
1525 ModuleID);
1526 auto RunThinBackend = [&](AddStreamFn AddStream) {
1527 LTOLLVMContext BackendContext(Conf);
1528 Expected<std::unique_ptr<Module>> MOrErr = BM.parseModule(BackendContext);
1529 if (!MOrErr)
1530 return MOrErr.takeError();
1531
1532 return thinBackend(Conf, Task, AddStream, **MOrErr, CombinedIndex,
1533 ImportList, DefinedGlobals, &ModuleMap,
1534 Conf.CodeGenOnly);
1535 };
1536 if (ShouldEmitIndexFiles) {
1537 if (auto E = emitFiles(ImportList, ModuleID, ModuleID.str()))
1538 return E;
1539 }
1540
1541 if (!Cache.isValid() || !CombinedIndex.modulePaths().count(ModuleID) ||
1542 all_of(CombinedIndex.getModuleHash(ModuleID),
1543 [](uint32_t V) { return V == 0; }))
1544 // Cache disabled or no entry for this module in the combined index or
1545 // no module hash.
1546 return RunThinBackend(AddStream);
1547
1548 // The module may be cached, this helps handling it.
1549 std::string Key = computeLTOCacheKey(
1550 Conf, CombinedIndex, ModuleID, ImportList, ExportList, ResolvedODR,
1551 DefinedGlobals, CfiFunctionDefs, CfiFunctionDecls);
1552 Expected<AddStreamFn> CacheAddStreamOrErr = Cache(Task, Key, ModuleID);
1553 if (Error Err = CacheAddStreamOrErr.takeError())
1554 return Err;
1555 AddStreamFn &CacheAddStream = *CacheAddStreamOrErr;
1556 if (CacheAddStream)
1557 return RunThinBackend(CacheAddStream);
1558
1559 return Error::success();
1560 }
1561
1562 Error start(
1563 unsigned Task, BitcodeModule BM,
1564 const FunctionImporter::ImportMapTy &ImportList,
1565 const FunctionImporter::ExportSetTy &ExportList,
1566 const std::map<GlobalValue::GUID, GlobalValue::LinkageTypes> &ResolvedODR,
1567 MapVector<StringRef, BitcodeModule> &ModuleMap) override {
1568 StringRef ModulePath = BM.getModuleIdentifier();
1569 assert(ModuleToDefinedGVSummaries.count(ModulePath));
1570 const GVSummaryMapTy &DefinedGlobals =
1571 ModuleToDefinedGVSummaries.find(ModulePath)->second;
1572 BackendThreadPool.async(
1573 [=](BitcodeModule BM, ModuleSummaryIndex &CombinedIndex,
1574 const FunctionImporter::ImportMapTy &ImportList,
1575 const FunctionImporter::ExportSetTy &ExportList,
1576 const std::map<GlobalValue::GUID, GlobalValue::LinkageTypes>
1577 &ResolvedODR,
1578 const GVSummaryMapTy &DefinedGlobals,
1579 MapVector<StringRef, BitcodeModule> &ModuleMap) {
1580 if (LLVM_ENABLE_THREADS && Conf.TimeTraceEnabled)
1582 "thin backend");
1583 Error E = runThinLTOBackendThread(
1584 AddStream, Cache, Task, BM, CombinedIndex, ImportList, ExportList,
1585 ResolvedODR, DefinedGlobals, ModuleMap);
1586 if (E) {
1587 std::unique_lock<std::mutex> L(ErrMu);
1588 if (Err)
1589 Err = joinErrors(std::move(*Err), std::move(E));
1590 else
1591 Err = std::move(E);
1592 }
1593 if (LLVM_ENABLE_THREADS && Conf.TimeTraceEnabled)
1595 },
1596 BM, std::ref(CombinedIndex), std::ref(ImportList), std::ref(ExportList),
1597 std::ref(ResolvedODR), std::ref(DefinedGlobals), std::ref(ModuleMap));
1598
1599 if (OnWrite)
1600 OnWrite(std::string(ModulePath));
1601 return Error::success();
1602 }
1603};
1604
1605/// This backend is utilized in the first round of a two-codegen round process.
1606/// It first saves optimized bitcode files to disk before the codegen process
1607/// begins. After codegen, it stores the resulting object files in a scratch
1608/// buffer. Note the codegen data stored in the scratch buffer will be extracted
1609/// and merged in the subsequent step.
1610class FirstRoundThinBackend : public InProcessThinBackend {
1611 AddStreamFn IRAddStream;
1612 FileCache IRCache;
1613
1614public:
1615 FirstRoundThinBackend(
1616 const Config &Conf, ModuleSummaryIndex &CombinedIndex,
1617 ThreadPoolStrategy ThinLTOParallelism,
1618 const DenseMap<StringRef, GVSummaryMapTy> &ModuleToDefinedGVSummaries,
1619 AddStreamFn CGAddStream, FileCache CGCache, AddStreamFn IRAddStream,
1620 FileCache IRCache)
1621 : InProcessThinBackend(Conf, CombinedIndex, ThinLTOParallelism,
1622 ModuleToDefinedGVSummaries, std::move(CGAddStream),
1623 std::move(CGCache), /*OnWrite=*/nullptr,
1624 /*ShouldEmitIndexFiles=*/false,
1625 /*ShouldEmitImportsFiles=*/false),
1626 IRAddStream(std::move(IRAddStream)), IRCache(std::move(IRCache)) {}
1627
1628 Error runThinLTOBackendThread(
1629 AddStreamFn CGAddStream, FileCache CGCache, unsigned Task,
1630 BitcodeModule BM, ModuleSummaryIndex &CombinedIndex,
1631 const FunctionImporter::ImportMapTy &ImportList,
1632 const FunctionImporter::ExportSetTy &ExportList,
1633 const std::map<GlobalValue::GUID, GlobalValue::LinkageTypes> &ResolvedODR,
1634 const GVSummaryMapTy &DefinedGlobals,
1635 MapVector<StringRef, BitcodeModule> &ModuleMap) override {
1636 auto ModuleID = BM.getModuleIdentifier();
1637 llvm::TimeTraceScope timeScope("Run ThinLTO backend thread (first round)",
1638 ModuleID);
1639 auto RunThinBackend = [&](AddStreamFn CGAddStream,
1640 AddStreamFn IRAddStream) {
1641 LTOLLVMContext BackendContext(Conf);
1642 Expected<std::unique_ptr<Module>> MOrErr = BM.parseModule(BackendContext);
1643 if (!MOrErr)
1644 return MOrErr.takeError();
1645
1646 return thinBackend(Conf, Task, CGAddStream, **MOrErr, CombinedIndex,
1647 ImportList, DefinedGlobals, &ModuleMap,
1648 Conf.CodeGenOnly, IRAddStream);
1649 };
1650 // Like InProcessThinBackend, we produce index files as needed for
1651 // FirstRoundThinBackend. However, these files are not generated for
1652 // SecondRoundThinBackend.
1653 if (ShouldEmitIndexFiles) {
1654 if (auto E = emitFiles(ImportList, ModuleID, ModuleID.str()))
1655 return E;
1656 }
1657
1658 assert((CGCache.isValid() == IRCache.isValid()) &&
1659 "Both caches for CG and IR should have matching availability");
1660 if (!CGCache.isValid() || !CombinedIndex.modulePaths().count(ModuleID) ||
1661 all_of(CombinedIndex.getModuleHash(ModuleID),
1662 [](uint32_t V) { return V == 0; }))
1663 // Cache disabled or no entry for this module in the combined index or
1664 // no module hash.
1665 return RunThinBackend(CGAddStream, IRAddStream);
1666
1667 // Get CGKey for caching object in CGCache.
1668 std::string CGKey = computeLTOCacheKey(
1669 Conf, CombinedIndex, ModuleID, ImportList, ExportList, ResolvedODR,
1670 DefinedGlobals, CfiFunctionDefs, CfiFunctionDecls);
1671 Expected<AddStreamFn> CacheCGAddStreamOrErr =
1672 CGCache(Task, CGKey, ModuleID);
1673 if (Error Err = CacheCGAddStreamOrErr.takeError())
1674 return Err;
1675 AddStreamFn &CacheCGAddStream = *CacheCGAddStreamOrErr;
1676
1677 // Get IRKey for caching (optimized) IR in IRCache with an extra ID.
1678 std::string IRKey = recomputeLTOCacheKey(CGKey, /*ExtraID=*/"IR");
1679 Expected<AddStreamFn> CacheIRAddStreamOrErr =
1680 IRCache(Task, IRKey, ModuleID);
1681 if (Error Err = CacheIRAddStreamOrErr.takeError())
1682 return Err;
1683 AddStreamFn &CacheIRAddStream = *CacheIRAddStreamOrErr;
1684
1685 // Ideally, both CG and IR caching should be synchronized. However, in
1686 // practice, their availability may differ due to different expiration
1687 // times. Therefore, if either cache is missing, the backend process is
1688 // triggered.
1689 if (CacheCGAddStream || CacheIRAddStream) {
1690 LLVM_DEBUG(dbgs() << "[FirstRound] Cache Miss for "
1691 << BM.getModuleIdentifier() << "\n");
1692 return RunThinBackend(CacheCGAddStream ? CacheCGAddStream : CGAddStream,
1693 CacheIRAddStream ? CacheIRAddStream : IRAddStream);
1694 }
1695
1696 return Error::success();
1697 }
1698};
1699
1700/// This backend operates in the second round of a two-codegen round process.
1701/// It starts by reading the optimized bitcode files that were saved during the
1702/// first round. The backend then executes the codegen only to further optimize
1703/// the code, utilizing the codegen data merged from the first round. Finally,
1704/// it writes the resulting object files as usual.
1705class SecondRoundThinBackend : public InProcessThinBackend {
1706 std::unique_ptr<SmallVector<StringRef>> IRFiles;
1707 stable_hash CombinedCGDataHash;
1708
1709public:
1710 SecondRoundThinBackend(
1711 const Config &Conf, ModuleSummaryIndex &CombinedIndex,
1712 ThreadPoolStrategy ThinLTOParallelism,
1713 const DenseMap<StringRef, GVSummaryMapTy> &ModuleToDefinedGVSummaries,
1714 AddStreamFn AddStream, FileCache Cache,
1715 std::unique_ptr<SmallVector<StringRef>> IRFiles,
1716 stable_hash CombinedCGDataHash)
1717 : InProcessThinBackend(Conf, CombinedIndex, ThinLTOParallelism,
1718 ModuleToDefinedGVSummaries, std::move(AddStream),
1719 std::move(Cache),
1720 /*OnWrite=*/nullptr,
1721 /*ShouldEmitIndexFiles=*/false,
1722 /*ShouldEmitImportsFiles=*/false),
1723 IRFiles(std::move(IRFiles)), CombinedCGDataHash(CombinedCGDataHash) {}
1724
1725 Error runThinLTOBackendThread(
1726 AddStreamFn AddStream, FileCache Cache, unsigned Task, BitcodeModule BM,
1727 ModuleSummaryIndex &CombinedIndex,
1728 const FunctionImporter::ImportMapTy &ImportList,
1729 const FunctionImporter::ExportSetTy &ExportList,
1730 const std::map<GlobalValue::GUID, GlobalValue::LinkageTypes> &ResolvedODR,
1731 const GVSummaryMapTy &DefinedGlobals,
1732 MapVector<StringRef, BitcodeModule> &ModuleMap) override {
1733 auto ModuleID = BM.getModuleIdentifier();
1734 llvm::TimeTraceScope timeScope("Run ThinLTO backend thread (second round)",
1735 ModuleID);
1736 auto RunThinBackend = [&](AddStreamFn AddStream) {
1737 LTOLLVMContext BackendContext(Conf);
1738 std::unique_ptr<Module> LoadedModule =
1739 cgdata::loadModuleForTwoRounds(BM, Task, BackendContext, *IRFiles);
1740
1741 return thinBackend(Conf, Task, AddStream, *LoadedModule, CombinedIndex,
1742 ImportList, DefinedGlobals, &ModuleMap,
1743 /*CodeGenOnly=*/true);
1744 };
1745 if (!Cache.isValid() || !CombinedIndex.modulePaths().count(ModuleID) ||
1746 all_of(CombinedIndex.getModuleHash(ModuleID),
1747 [](uint32_t V) { return V == 0; }))
1748 // Cache disabled or no entry for this module in the combined index or
1749 // no module hash.
1750 return RunThinBackend(AddStream);
1751
1752 // Get Key for caching the final object file in Cache with the combined
1753 // CGData hash.
1754 std::string Key = computeLTOCacheKey(
1755 Conf, CombinedIndex, ModuleID, ImportList, ExportList, ResolvedODR,
1756 DefinedGlobals, CfiFunctionDefs, CfiFunctionDecls);
1758 /*ExtraID=*/std::to_string(CombinedCGDataHash));
1759 Expected<AddStreamFn> CacheAddStreamOrErr = Cache(Task, Key, ModuleID);
1760 if (Error Err = CacheAddStreamOrErr.takeError())
1761 return Err;
1762 AddStreamFn &CacheAddStream = *CacheAddStreamOrErr;
1763
1764 if (CacheAddStream) {
1765 LLVM_DEBUG(dbgs() << "[SecondRound] Cache Miss for "
1766 << BM.getModuleIdentifier() << "\n");
1767 return RunThinBackend(CacheAddStream);
1768 }
1769
1770 return Error::success();
1771 }
1772};
1773} // end anonymous namespace
1774
1777 bool ShouldEmitIndexFiles,
1778 bool ShouldEmitImportsFiles) {
1779 auto Func =
1780 [=](const Config &Conf, ModuleSummaryIndex &CombinedIndex,
1781 const DenseMap<StringRef, GVSummaryMapTy> &ModuleToDefinedGVSummaries,
1782 AddStreamFn AddStream, FileCache Cache) {
1783 return std::make_unique<InProcessThinBackend>(
1784 Conf, CombinedIndex, Parallelism, ModuleToDefinedGVSummaries,
1785 AddStream, Cache, OnWrite, ShouldEmitIndexFiles,
1786 ShouldEmitImportsFiles);
1787 };
1788 return ThinBackend(Func, Parallelism);
1789}
1790
1792 if (!TheTriple.isOSDarwin())
1793 return "";
1794 if (TheTriple.getArch() == Triple::x86_64)
1795 return "core2";
1796 if (TheTriple.getArch() == Triple::x86)
1797 return "yonah";
1798 if (TheTriple.isArm64e())
1799 return "apple-a12";
1800 if (TheTriple.getArch() == Triple::aarch64 ||
1801 TheTriple.getArch() == Triple::aarch64_32)
1802 return "cyclone";
1803 return "";
1804}
1805
1806// Given the original \p Path to an output file, replace any path
1807// prefix matching \p OldPrefix with \p NewPrefix. Also, create the
1808// resulting directory if it does not yet exist.
1810 StringRef NewPrefix) {
1811 if (OldPrefix.empty() && NewPrefix.empty())
1812 return std::string(Path);
1813 SmallString<128> NewPath(Path);
1814 llvm::sys::path::replace_path_prefix(NewPath, OldPrefix, NewPrefix);
1815 StringRef ParentPath = llvm::sys::path::parent_path(NewPath.str());
1816 if (!ParentPath.empty()) {
1817 // Make sure the new directory exists, creating it if necessary.
1818 if (std::error_code EC = llvm::sys::fs::create_directories(ParentPath))
1819 llvm::errs() << "warning: could not create directory '" << ParentPath
1820 << "': " << EC.message() << '\n';
1821 }
1822 return std::string(NewPath);
1823}
1824
1825namespace {
1826class WriteIndexesThinBackend : public ThinBackendProc {
1827 std::string OldPrefix, NewPrefix, NativeObjectPrefix;
1828 raw_fd_ostream *LinkedObjectsFile;
1829
1830public:
1831 WriteIndexesThinBackend(
1832 const Config &Conf, ModuleSummaryIndex &CombinedIndex,
1833 ThreadPoolStrategy ThinLTOParallelism,
1834 const DenseMap<StringRef, GVSummaryMapTy> &ModuleToDefinedGVSummaries,
1835 std::string OldPrefix, std::string NewPrefix,
1836 std::string NativeObjectPrefix, bool ShouldEmitImportsFiles,
1837 raw_fd_ostream *LinkedObjectsFile, lto::IndexWriteCallback OnWrite)
1838 : ThinBackendProc(Conf, CombinedIndex, ModuleToDefinedGVSummaries,
1839 OnWrite, ShouldEmitImportsFiles, ThinLTOParallelism),
1840 OldPrefix(OldPrefix), NewPrefix(NewPrefix),
1841 NativeObjectPrefix(NativeObjectPrefix),
1842 LinkedObjectsFile(LinkedObjectsFile) {}
1843
1844 Error start(
1845 unsigned Task, BitcodeModule BM,
1846 const FunctionImporter::ImportMapTy &ImportList,
1847 const FunctionImporter::ExportSetTy &ExportList,
1848 const std::map<GlobalValue::GUID, GlobalValue::LinkageTypes> &ResolvedODR,
1849 MapVector<StringRef, BitcodeModule> &ModuleMap) override {
1850 StringRef ModulePath = BM.getModuleIdentifier();
1851
1852 // The contents of this file may be used as input to a native link, and must
1853 // therefore contain the processed modules in a determinstic order that
1854 // match the order they are provided on the command line. For that reason,
1855 // we cannot include this in the asynchronously executed lambda below.
1856 if (LinkedObjectsFile) {
1857 std::string ObjectPrefix =
1858 NativeObjectPrefix.empty() ? NewPrefix : NativeObjectPrefix;
1859 std::string LinkedObjectsFilePath =
1860 getThinLTOOutputFile(ModulePath, OldPrefix, ObjectPrefix);
1861 *LinkedObjectsFile << LinkedObjectsFilePath << '\n';
1862 }
1863
1864 BackendThreadPool.async(
1865 [this](const StringRef ModulePath,
1866 const FunctionImporter::ImportMapTy &ImportList,
1867 const std::string &OldPrefix, const std::string &NewPrefix) {
1868 std::string NewModulePath =
1869 getThinLTOOutputFile(ModulePath, OldPrefix, NewPrefix);
1870 auto E = emitFiles(ImportList, ModulePath, NewModulePath);
1871 if (E) {
1872 std::unique_lock<std::mutex> L(ErrMu);
1873 if (Err)
1874 Err = joinErrors(std::move(*Err), std::move(E));
1875 else
1876 Err = std::move(E);
1877 return;
1878 }
1879 },
1880 ModulePath, ImportList, OldPrefix, NewPrefix);
1881
1882 if (OnWrite)
1883 OnWrite(std::string(ModulePath));
1884 return Error::success();
1885 }
1886
1887 bool isSensitiveToInputOrder() override {
1888 // The order which modules are written to LinkedObjectsFile should be
1889 // deterministic and match the order they are passed on the command line.
1890 return true;
1891 }
1892};
1893} // end anonymous namespace
1894
1896 ThreadPoolStrategy Parallelism, std::string OldPrefix,
1897 std::string NewPrefix, std::string NativeObjectPrefix,
1898 bool ShouldEmitImportsFiles, raw_fd_ostream *LinkedObjectsFile,
1899 IndexWriteCallback OnWrite) {
1900 auto Func =
1901 [=](const Config &Conf, ModuleSummaryIndex &CombinedIndex,
1902 const DenseMap<StringRef, GVSummaryMapTy> &ModuleToDefinedGVSummaries,
1903 AddStreamFn AddStream, FileCache Cache) {
1904 return std::make_unique<WriteIndexesThinBackend>(
1905 Conf, CombinedIndex, Parallelism, ModuleToDefinedGVSummaries,
1906 OldPrefix, NewPrefix, NativeObjectPrefix, ShouldEmitImportsFiles,
1907 LinkedObjectsFile, OnWrite);
1908 };
1909 return ThinBackend(Func, Parallelism);
1910}
1911
1912Error LTO::runThinLTO(AddStreamFn AddStream, FileCache Cache,
1913 const DenseSet<GlobalValue::GUID> &GUIDPreservedSymbols) {
1914 llvm::TimeTraceScope timeScope("Run ThinLTO");
1915 LLVM_DEBUG(dbgs() << "Running ThinLTO\n");
1916 ThinLTO.CombinedIndex.releaseTemporaryMemory();
1917 timeTraceProfilerBegin("ThinLink", StringRef(""));
1918 auto TimeTraceScopeExit = llvm::make_scope_exit([]() {
1921 });
1922 if (ThinLTO.ModuleMap.empty())
1923 return Error::success();
1924
1925 if (ThinLTO.ModulesToCompile && ThinLTO.ModulesToCompile->empty()) {
1926 llvm::errs() << "warning: [ThinLTO] No module compiled\n";
1927 return Error::success();
1928 }
1929
1930 if (Conf.CombinedIndexHook &&
1931 !Conf.CombinedIndexHook(ThinLTO.CombinedIndex, GUIDPreservedSymbols))
1932 return Error::success();
1933
1934 // Collect for each module the list of function it defines (GUID ->
1935 // Summary).
1936 DenseMap<StringRef, GVSummaryMapTy> ModuleToDefinedGVSummaries(
1937 ThinLTO.ModuleMap.size());
1938 ThinLTO.CombinedIndex.collectDefinedGVSummariesPerModule(
1939 ModuleToDefinedGVSummaries);
1940 // Create entries for any modules that didn't have any GV summaries
1941 // (either they didn't have any GVs to start with, or we suppressed
1942 // generation of the summaries because they e.g. had inline assembly
1943 // uses that couldn't be promoted/renamed on export). This is so
1944 // InProcessThinBackend::start can still launch a backend thread, which
1945 // is passed the map of summaries for the module, without any special
1946 // handling for this case.
1947 for (auto &Mod : ThinLTO.ModuleMap)
1948 if (!ModuleToDefinedGVSummaries.count(Mod.first))
1949 ModuleToDefinedGVSummaries.try_emplace(Mod.first);
1950
1951 FunctionImporter::ImportListsTy ImportLists(ThinLTO.ModuleMap.size());
1952 DenseMap<StringRef, FunctionImporter::ExportSetTy> ExportLists(
1953 ThinLTO.ModuleMap.size());
1954 StringMap<std::map<GlobalValue::GUID, GlobalValue::LinkageTypes>> ResolvedODR;
1955
1956 if (DumpThinCGSCCs)
1957 ThinLTO.CombinedIndex.dumpSCCs(outs());
1958
1959 std::set<GlobalValue::GUID> ExportedGUIDs;
1960
1961 bool WholeProgramVisibilityEnabledInLTO =
1962 Conf.HasWholeProgramVisibility &&
1963 // If validation is enabled, upgrade visibility only when all vtables
1964 // have typeinfos.
1965 (!Conf.ValidateAllVtablesHaveTypeInfos || Conf.AllVtablesHaveTypeInfos);
1966 if (hasWholeProgramVisibility(WholeProgramVisibilityEnabledInLTO))
1967 ThinLTO.CombinedIndex.setWithWholeProgramVisibility();
1968
1969 // If we're validating, get the vtable symbols that should not be
1970 // upgraded because they correspond to typeIDs outside of index-based
1971 // WPD info.
1972 DenseSet<GlobalValue::GUID> VisibleToRegularObjSymbols;
1973 if (WholeProgramVisibilityEnabledInLTO &&
1974 Conf.ValidateAllVtablesHaveTypeInfos) {
1975 // This returns true when the name is local or not defined. Locals are
1976 // expected to be handled separately.
1977 auto IsVisibleToRegularObj = [&](StringRef name) {
1978 auto It = GlobalResolutions->find(name);
1979 return (It == GlobalResolutions->end() ||
1980 It->second.VisibleOutsideSummary || !It->second.Prevailing);
1981 };
1982
1983 getVisibleToRegularObjVtableGUIDs(ThinLTO.CombinedIndex,
1984 VisibleToRegularObjSymbols,
1985 IsVisibleToRegularObj);
1986 }
1987
1988 // If allowed, upgrade public vcall visibility to linkage unit visibility in
1989 // the summaries before whole program devirtualization below.
1991 ThinLTO.CombinedIndex, WholeProgramVisibilityEnabledInLTO,
1992 DynamicExportSymbols, VisibleToRegularObjSymbols);
1993
1994 // Perform index-based WPD. This will return immediately if there are
1995 // no index entries in the typeIdMetadata map (e.g. if we are instead
1996 // performing IR-based WPD in hybrid regular/thin LTO mode).
1997 std::map<ValueInfo, std::vector<VTableSlotSummary>> LocalWPDTargetsMap;
1998 runWholeProgramDevirtOnIndex(ThinLTO.CombinedIndex, ExportedGUIDs,
1999 LocalWPDTargetsMap);
2000
2001 auto isPrevailing = [&](GlobalValue::GUID GUID, const GlobalValueSummary *S) {
2002 return ThinLTO.isPrevailingModuleForGUID(GUID, S->modulePath());
2003 };
2005 MemProfContextDisambiguation ContextDisambiguation;
2006 ContextDisambiguation.run(ThinLTO.CombinedIndex, isPrevailing);
2007 }
2008
2009 // Figure out which symbols need to be internalized. This also needs to happen
2010 // at -O0 because summary-based DCE is implemented using internalization, and
2011 // we must apply DCE consistently with the full LTO module in order to avoid
2012 // undefined references during the final link.
2013 for (auto &Res : *GlobalResolutions) {
2014 // If the symbol does not have external references or it is not prevailing,
2015 // then not need to mark it as exported from a ThinLTO partition.
2016 if (Res.second.Partition != GlobalResolution::External ||
2017 !Res.second.isPrevailingIRSymbol())
2018 continue;
2020 GlobalValue::dropLLVMManglingEscape(Res.second.IRName));
2021 // Mark exported unless index-based analysis determined it to be dead.
2022 if (ThinLTO.CombinedIndex.isGUIDLive(GUID))
2023 ExportedGUIDs.insert(GUID);
2024 }
2025
2026 // Reset the GlobalResolutions to deallocate the associated memory, as there
2027 // are no further accesses. We specifically want to do this before computing
2028 // cross module importing, which adds to peak memory via the computed import
2029 // and export lists.
2030 releaseGlobalResolutionsMemory();
2031
2032 if (Conf.OptLevel > 0)
2033 ComputeCrossModuleImport(ThinLTO.CombinedIndex, ModuleToDefinedGVSummaries,
2034 isPrevailing, ImportLists, ExportLists);
2035
2036 // Any functions referenced by the jump table in the regular LTO object must
2037 // be exported.
2038 auto &Defs = ThinLTO.CombinedIndex.cfiFunctionDefs();
2039 ExportedGUIDs.insert(Defs.guid_begin(), Defs.guid_end());
2040 auto &Decls = ThinLTO.CombinedIndex.cfiFunctionDecls();
2041 ExportedGUIDs.insert(Decls.guid_begin(), Decls.guid_end());
2042
2043 auto isExported = [&](StringRef ModuleIdentifier, ValueInfo VI) {
2044 const auto &ExportList = ExportLists.find(ModuleIdentifier);
2045 return (ExportList != ExportLists.end() && ExportList->second.count(VI)) ||
2046 ExportedGUIDs.count(VI.getGUID());
2047 };
2048
2049 // Update local devirtualized targets that were exported by cross-module
2050 // importing or by other devirtualizations marked in the ExportedGUIDs set.
2051 updateIndexWPDForExports(ThinLTO.CombinedIndex, isExported,
2052 LocalWPDTargetsMap);
2053
2054 thinLTOInternalizeAndPromoteInIndex(ThinLTO.CombinedIndex, isExported,
2055 isPrevailing);
2056
2057 auto recordNewLinkage = [&](StringRef ModuleIdentifier,
2059 GlobalValue::LinkageTypes NewLinkage) {
2060 ResolvedODR[ModuleIdentifier][GUID] = NewLinkage;
2061 };
2062 thinLTOResolvePrevailingInIndex(Conf, ThinLTO.CombinedIndex, isPrevailing,
2063 recordNewLinkage, GUIDPreservedSymbols);
2064
2065 thinLTOPropagateFunctionAttrs(ThinLTO.CombinedIndex, isPrevailing);
2066
2067 generateParamAccessSummary(ThinLTO.CombinedIndex);
2068
2071
2072 TimeTraceScopeExit.release();
2073
2074 auto &ModuleMap =
2075 ThinLTO.ModulesToCompile ? *ThinLTO.ModulesToCompile : ThinLTO.ModuleMap;
2076
2077 auto RunBackends = [&](ThinBackendProc *BackendProcess) -> Error {
2078 auto ProcessOneModule = [&](int I) -> Error {
2079 auto &Mod = *(ModuleMap.begin() + I);
2080 // Tasks 0 through ParallelCodeGenParallelismLevel-1 are reserved for
2081 // combined module and parallel code generation partitions.
2082 return BackendProcess->start(
2083 RegularLTO.ParallelCodeGenParallelismLevel + I, Mod.second,
2084 ImportLists[Mod.first], ExportLists[Mod.first],
2085 ResolvedODR[Mod.first], ThinLTO.ModuleMap);
2086 };
2087
2088 BackendProcess->setup(ModuleMap.size(),
2089 RegularLTO.ParallelCodeGenParallelismLevel,
2090 RegularLTO.CombinedModule->getTargetTriple());
2091
2092 if (BackendProcess->getThreadCount() == 1 ||
2093 BackendProcess->isSensitiveToInputOrder()) {
2094 // Process the modules in the order they were provided on the
2095 // command-line. It is important for this codepath to be used for
2096 // WriteIndexesThinBackend, to ensure the emitted LinkedObjectsFile lists
2097 // ThinLTO objects in the same order as the inputs, which otherwise would
2098 // affect the final link order.
2099 for (int I = 0, E = ModuleMap.size(); I != E; ++I)
2100 if (Error E = ProcessOneModule(I))
2101 return E;
2102 } else {
2103 // When executing in parallel, process largest bitsize modules first to
2104 // improve parallelism, and avoid starving the thread pool near the end.
2105 // This saves about 15 sec on a 36-core machine while link `clang.exe`
2106 // (out of 100 sec).
2107 std::vector<BitcodeModule *> ModulesVec;
2108 ModulesVec.reserve(ModuleMap.size());
2109 for (auto &Mod : ModuleMap)
2110 ModulesVec.push_back(&Mod.second);
2111 for (int I : generateModulesOrdering(ModulesVec))
2112 if (Error E = ProcessOneModule(I))
2113 return E;
2114 }
2115 return BackendProcess->wait();
2116 };
2117
2119 std::unique_ptr<ThinBackendProc> BackendProc =
2120 ThinLTO.Backend(Conf, ThinLTO.CombinedIndex, ModuleToDefinedGVSummaries,
2121 AddStream, Cache);
2122 return RunBackends(BackendProc.get());
2123 }
2124
2125 // Perform two rounds of code generation for ThinLTO:
2126 // 1. First round: Perform optimization and code generation, outputting to
2127 // temporary scratch objects.
2128 // 2. Merge code generation data extracted from the temporary scratch objects.
2129 // 3. Second round: Execute code generation again using the merged data.
2130 LLVM_DEBUG(dbgs() << "[TwoRounds] Initializing ThinLTO two-codegen rounds\n");
2131
2132 unsigned MaxTasks = getMaxTasks();
2133 auto Parallelism = ThinLTO.Backend.getParallelism();
2134 // Set up two additional streams and caches for storing temporary scratch
2135 // objects and optimized IRs, using the same cache directory as the original.
2136 cgdata::StreamCacheData CG(MaxTasks, Cache, "CG"), IR(MaxTasks, Cache, "IR");
2137
2138 // First round: Execute optimization and code generation, outputting to
2139 // temporary scratch objects. Serialize the optimized IRs before initiating
2140 // code generation.
2141 LLVM_DEBUG(dbgs() << "[TwoRounds] Running the first round of codegen\n");
2142 auto FirstRoundLTO = std::make_unique<FirstRoundThinBackend>(
2143 Conf, ThinLTO.CombinedIndex, Parallelism, ModuleToDefinedGVSummaries,
2144 CG.AddStream, CG.Cache, IR.AddStream, IR.Cache);
2145 if (Error E = RunBackends(FirstRoundLTO.get()))
2146 return E;
2147
2148 LLVM_DEBUG(dbgs() << "[TwoRounds] Merging codegen data\n");
2149 auto CombinedHashOrErr = cgdata::mergeCodeGenData(*CG.getResult());
2150 if (Error E = CombinedHashOrErr.takeError())
2151 return E;
2152 auto CombinedHash = *CombinedHashOrErr;
2153 LLVM_DEBUG(dbgs() << "[TwoRounds] CGData hash: " << CombinedHash << "\n");
2154
2155 // Second round: Read the optimized IRs and execute code generation using the
2156 // merged data.
2157 LLVM_DEBUG(dbgs() << "[TwoRounds] Running the second round of codegen\n");
2158 auto SecondRoundLTO = std::make_unique<SecondRoundThinBackend>(
2159 Conf, ThinLTO.CombinedIndex, Parallelism, ModuleToDefinedGVSummaries,
2160 AddStream, Cache, IR.getResult(), CombinedHash);
2161 return RunBackends(SecondRoundLTO.get());
2162}
2163
2167 std::optional<uint64_t> RemarksHotnessThreshold, int Count) {
2168 std::string Filename = std::string(RemarksFilename);
2169 // For ThinLTO, file.opt.<format> becomes
2170 // file.opt.<format>.thin.<num>.<format>.
2171 if (!Filename.empty() && Count != -1)
2172 Filename =
2173 (Twine(Filename) + ".thin." + llvm::utostr(Count) + "." + RemarksFormat)
2174 .str();
2175
2176 auto ResultOrErr = llvm::setupLLVMOptimizationRemarks(
2177 Context, Filename, RemarksPasses, RemarksFormat, RemarksWithHotness,
2179 if (Error E = ResultOrErr.takeError())
2180 return std::move(E);
2181
2182 if (*ResultOrErr)
2183 (*ResultOrErr)->keep();
2184
2185 return ResultOrErr;
2186}
2187
2190 // Setup output file to emit statistics.
2191 if (StatsFilename.empty())
2192 return nullptr;
2193
2195 std::error_code EC;
2196 auto StatsFile =
2197 std::make_unique<ToolOutputFile>(StatsFilename, EC, sys::fs::OF_None);
2198 if (EC)
2199 return errorCodeToError(EC);
2200
2201 StatsFile->keep();
2202 return std::move(StatsFile);
2203}
2204
2205// Compute the ordering we will process the inputs: the rough heuristic here
2206// is to sort them per size so that the largest module get schedule as soon as
2207// possible. This is purely a compile-time optimization.
2209 auto Seq = llvm::seq<int>(0, R.size());
2210 std::vector<int> ModulesOrdering(Seq.begin(), Seq.end());
2211 llvm::sort(ModulesOrdering, [&](int LeftIndex, int RightIndex) {
2212 auto LSize = R[LeftIndex]->getBuffer().size();
2213 auto RSize = R[RightIndex]->getBuffer().size();
2214 return LSize > RSize;
2215 });
2216 return ModulesOrdering;
2217}
2218
2219namespace {
2220/// This out-of-process backend does not perform code generation when invoked
2221/// for each task. Instead, it generates the necessary information (e.g., the
2222/// summary index shard, import list, etc.) to enable code generation to be
2223/// performed externally, similar to WriteIndexesThinBackend. The backend's
2224/// `wait` function then invokes an external distributor process to carry out
2225/// the backend compilations.
2226class OutOfProcessThinBackend : public CGThinBackend {
2227 using SString = SmallString<128>;
2228
2230 StringSaver Saver{Alloc};
2231
2232 SString LinkerOutputFile;
2233
2234 SString DistributorPath;
2235 ArrayRef<StringRef> DistributorArgs;
2236
2237 SString RemoteCompiler;
2238 ArrayRef<StringRef> RemoteCompilerPrependArgs;
2239 ArrayRef<StringRef> RemoteCompilerArgs;
2240
2241 bool SaveTemps;
2242
2243 SmallVector<StringRef, 0> CodegenOptions;
2244 DenseSet<StringRef> CommonInputs;
2245 // Number of the object files that have been already cached.
2246 std::atomic<size_t> CachedJobs{0};
2247 // Information specific to individual backend compilation job.
2248 struct Job {
2249 unsigned Task;
2250 StringRef ModuleID;
2251 StringRef NativeObjectPath;
2252 StringRef SummaryIndexPath;
2253 ImportsFilesContainer ImportsFiles;
2254 std::string CacheKey;
2255 AddStreamFn CacheAddStream;
2256 bool Cached = false;
2257 };
2258 // The set of backend compilations jobs.
2259 SmallVector<Job> Jobs;
2260
2261 // A unique string to identify the current link.
2262 SmallString<8> UID;
2263
2264 // The offset to the first ThinLTO task.
2265 unsigned ThinLTOTaskOffset;
2266
2267 // The target triple to supply for backend compilations.
2268 llvm::Triple Triple;
2269
2270 // Cache
2271 FileCache Cache;
2272
2273public:
2274 OutOfProcessThinBackend(
2275 const Config &Conf, ModuleSummaryIndex &CombinedIndex,
2276 ThreadPoolStrategy ThinLTOParallelism,
2277 const DenseMap<StringRef, GVSummaryMapTy> &ModuleToDefinedGVSummaries,
2278 AddStreamFn AddStream, FileCache CacheFn, lto::IndexWriteCallback OnWrite,
2279 bool ShouldEmitIndexFiles, bool ShouldEmitImportsFiles,
2280 StringRef LinkerOutputFile, StringRef Distributor,
2281 ArrayRef<StringRef> DistributorArgs, StringRef RemoteCompiler,
2282 ArrayRef<StringRef> RemoteCompilerPrependArgs,
2283 ArrayRef<StringRef> RemoteCompilerArgs, bool SaveTemps)
2284 : CGThinBackend(Conf, CombinedIndex, ModuleToDefinedGVSummaries,
2285 AddStream, OnWrite, ShouldEmitIndexFiles,
2286 ShouldEmitImportsFiles, ThinLTOParallelism),
2287 LinkerOutputFile(LinkerOutputFile), DistributorPath(Distributor),
2288 DistributorArgs(DistributorArgs), RemoteCompiler(RemoteCompiler),
2289 RemoteCompilerPrependArgs(RemoteCompilerPrependArgs),
2290 RemoteCompilerArgs(RemoteCompilerArgs), SaveTemps(SaveTemps),
2291 Cache(std::move(CacheFn)) {}
2292
2293 void setup(unsigned ThinLTONumTasks, unsigned ThinLTOTaskOffset,
2294 llvm::Triple Triple) override {
2296 Jobs.resize((size_t)ThinLTONumTasks);
2297 this->ThinLTOTaskOffset = ThinLTOTaskOffset;
2298 this->Triple = Triple;
2299 this->Conf.Dtlto = 1;
2300 }
2301
2302 virtual Error runThinLTOBackendThread(
2303 Job &J, const FunctionImporter::ImportMapTy &ImportList,
2304 const FunctionImporter::ExportSetTy &ExportList,
2305 const std::map<GlobalValue::GUID, GlobalValue::LinkageTypes>
2306 &ResolvedODR) {
2307 {
2308 TimeTraceScope TimeScope("Emit individual index for DTLTO",
2309 J.SummaryIndexPath);
2310 if (auto E = emitFiles(ImportList, J.ModuleID, J.ModuleID.str(),
2311 J.SummaryIndexPath, J.ImportsFiles))
2312 return E;
2313 }
2314
2315 if (!Cache.isValid() || !CombinedIndex.modulePaths().count(J.ModuleID) ||
2316 all_of(CombinedIndex.getModuleHash(J.ModuleID),
2317 [](uint32_t V) { return V == 0; }))
2318 // Cache disabled or no entry for this module in the combined index or
2319 // no module hash.
2320 return Error::success();
2321
2322 TimeTraceScope TimeScope("Check cache for DTLTO", J.SummaryIndexPath);
2323 const GVSummaryMapTy &DefinedGlobals =
2324 ModuleToDefinedGVSummaries.find(J.ModuleID)->second;
2325
2326 // The module may be cached, this helps handling it.
2327 J.CacheKey = computeLTOCacheKey(Conf, CombinedIndex, J.ModuleID, ImportList,
2328 ExportList, ResolvedODR, DefinedGlobals,
2329 CfiFunctionDefs, CfiFunctionDecls);
2330
2331 // The module may be cached, this helps handling it.
2332 auto CacheAddStreamExp = Cache(J.Task, J.CacheKey, J.ModuleID);
2333 if (Error Err = CacheAddStreamExp.takeError())
2334 return Err;
2335 AddStreamFn &CacheAddStream = *CacheAddStreamExp;
2336 // If CacheAddStream is null, we have a cache hit and at this point
2337 // object file is already passed back to the linker.
2338 if (!CacheAddStream) {
2339 J.Cached = true; // Cache hit, mark the job as cached.
2340 CachedJobs.fetch_add(1);
2341 } else {
2342 // If CacheAddStream is not null, we have a cache miss and we need to
2343 // run the backend for codegen. Save cache 'add stream'
2344 // function for a later use.
2345 J.CacheAddStream = std::move(CacheAddStream);
2346 }
2347 return Error::success();
2348 }
2349
2350 Error start(
2351 unsigned Task, BitcodeModule BM,
2352 const FunctionImporter::ImportMapTy &ImportList,
2353 const FunctionImporter::ExportSetTy &ExportList,
2354 const std::map<GlobalValue::GUID, GlobalValue::LinkageTypes> &ResolvedODR,
2355 MapVector<StringRef, BitcodeModule> &ModuleMap) override {
2356
2357 StringRef ModulePath = BM.getModuleIdentifier();
2358
2359 SString ObjFilePath = sys::path::parent_path(LinkerOutputFile);
2360 sys::path::append(ObjFilePath, sys::path::stem(ModulePath) + "." +
2361 itostr(Task) + "." + UID + ".native.o");
2362
2363 Job &J = Jobs[Task - ThinLTOTaskOffset];
2364 J = {Task,
2365 ModulePath,
2366 Saver.save(ObjFilePath.str()),
2367 Saver.save(ObjFilePath.str() + ".thinlto.bc"),
2368 {}, // Filled in by emitFiles below.
2369 "", /*CacheKey=*/
2370 nullptr,
2371 false};
2372
2373 // Cleanup per-job temporary files on abnormal process exit.
2374 if (!SaveTemps) {
2375 llvm::sys::RemoveFileOnSignal(J.NativeObjectPath);
2376 if (!ShouldEmitIndexFiles)
2377 llvm::sys::RemoveFileOnSignal(J.SummaryIndexPath);
2378 }
2379
2380 assert(ModuleToDefinedGVSummaries.count(ModulePath));
2381
2382 // The BackendThreadPool is only used here to write the sharded index files
2383 // (similar to WriteIndexesThinBackend).
2384 BackendThreadPool.async(
2385 [=](Job &J, const FunctionImporter::ImportMapTy &ImportList,
2386 const FunctionImporter::ExportSetTy &ExportList,
2387 const std::map<GlobalValue::GUID, GlobalValue::LinkageTypes>
2388 &ResolvedODR) {
2389 if (LLVM_ENABLE_THREADS && Conf.TimeTraceEnabled)
2392 "Emit individual index and check cache for DTLTO");
2393 Error E =
2394 runThinLTOBackendThread(J, ImportList, ExportList, ResolvedODR);
2395 if (E) {
2396 std::unique_lock<std::mutex> L(ErrMu);
2397 if (Err)
2398 Err = joinErrors(std::move(*Err), std::move(E));
2399 else
2400 Err = std::move(E);
2401 }
2402 if (LLVM_ENABLE_THREADS && Conf.TimeTraceEnabled)
2404 },
2405 std::ref(J), std::ref(ImportList), std::ref(ExportList),
2406 std::ref(ResolvedODR));
2407
2408 return Error::success();
2409 }
2410
2411 // Derive a set of Clang options that will be shared/common for all DTLTO
2412 // backend compilations. We are intentionally minimal here as these options
2413 // must remain synchronized with the behavior of Clang. DTLTO does not support
2414 // all the features available with in-process LTO. More features are expected
2415 // to be added over time. Users can specify Clang options directly if a
2416 // feature is not supported. Note that explicitly specified options that imply
2417 // additional input or output file dependencies must be communicated to the
2418 // distribution system, potentially by setting extra options on the
2419 // distributor program.
2420 void buildCommonRemoteCompilerOptions() {
2421 const lto::Config &C = Conf;
2422 auto &Ops = CodegenOptions;
2423
2424 Ops.push_back(Saver.save("-O" + Twine(C.OptLevel)));
2425
2426 if (C.Options.EmitAddrsig)
2427 Ops.push_back("-faddrsig");
2428 if (C.Options.FunctionSections)
2429 Ops.push_back("-ffunction-sections");
2430 if (C.Options.DataSections)
2431 Ops.push_back("-fdata-sections");
2432
2433 if (C.RelocModel == Reloc::PIC_)
2434 // Clang doesn't have -fpic for all triples.
2435 if (!Triple.isOSBinFormatCOFF())
2436 Ops.push_back("-fpic");
2437
2438 // Turn on/off warnings about profile cfg mismatch (default on)
2439 // --lto-pgo-warn-mismatch.
2440 if (!C.PGOWarnMismatch) {
2441 Ops.push_back("-mllvm");
2442 Ops.push_back("-no-pgo-warn-mismatch");
2443 }
2444
2445 // Enable sample-based profile guided optimizations.
2446 // Sample profile file path --lto-sample-profile=<value>.
2447 if (!C.SampleProfile.empty()) {
2448 Ops.push_back(
2449 Saver.save("-fprofile-sample-use=" + Twine(C.SampleProfile)));
2450 CommonInputs.insert(C.SampleProfile);
2451 }
2452
2453 // We don't know which of options will be used by Clang.
2454 Ops.push_back("-Wno-unused-command-line-argument");
2455
2456 // Forward any supplied options.
2457 if (!RemoteCompilerArgs.empty())
2458 for (auto &a : RemoteCompilerArgs)
2459 Ops.push_back(a);
2460 }
2461
2462 // Generates a JSON file describing the backend compilations, for the
2463 // distributor.
2464 bool emitDistributorJson(StringRef DistributorJson) {
2465 using json::Array;
2466 std::error_code EC;
2467 raw_fd_ostream OS(DistributorJson, EC);
2468 if (EC)
2469 return false;
2470
2471 json::OStream JOS(OS);
2472 JOS.object([&]() {
2473 // Information common to all jobs.
2474 JOS.attributeObject("common", [&]() {
2475 JOS.attribute("linker_output", LinkerOutputFile);
2476
2477 JOS.attributeArray("args", [&]() {
2478 JOS.value(RemoteCompiler);
2479
2480 // Forward any supplied prepend options.
2481 if (!RemoteCompilerPrependArgs.empty())
2482 for (auto &A : RemoteCompilerPrependArgs)
2483 JOS.value(A);
2484
2485 JOS.value("-c");
2486
2487 JOS.value(Saver.save("--target=" + Triple.str()));
2488
2489 for (const auto &A : CodegenOptions)
2490 JOS.value(A);
2491 });
2492
2493 JOS.attribute("inputs", Array(CommonInputs));
2494 });
2495
2496 // Per-compilation-job information.
2497 JOS.attributeArray("jobs", [&]() {
2498 for (const auto &J : Jobs) {
2499 assert(J.Task != 0);
2500 if (J.Cached) {
2501 assert(!Cache.getCacheDirectoryPath().empty());
2502 continue;
2503 }
2504
2506 SmallVector<StringRef, 1> Outputs;
2507
2508 JOS.object([&]() {
2509 JOS.attributeArray("args", [&]() {
2510 JOS.value(J.ModuleID);
2511 Inputs.push_back(J.ModuleID);
2512
2513 JOS.value(
2514 Saver.save("-fthinlto-index=" + Twine(J.SummaryIndexPath)));
2515 Inputs.push_back(J.SummaryIndexPath);
2516
2517 JOS.value("-o");
2518 JOS.value(J.NativeObjectPath);
2519 Outputs.push_back(J.NativeObjectPath);
2520 });
2521
2522 // Add the bitcode files from which imports will be made. These do
2523 // not explicitly appear on the backend compilation command lines
2524 // but are recorded in the summary index shards.
2525 llvm::append_range(Inputs, J.ImportsFiles);
2526 JOS.attribute("inputs", Array(Inputs));
2527
2528 JOS.attribute("outputs", Array(Outputs));
2529 });
2530 }
2531 });
2532 });
2533
2534 return true;
2535 }
2536
2537 void removeFile(StringRef FileName) {
2538 std::error_code EC = sys::fs::remove(FileName, true);
2539 if (EC && EC != std::make_error_code(std::errc::no_such_file_or_directory))
2540 errs() << "warning: could not remove the file '" << FileName
2541 << "': " << EC.message() << "\n";
2542 }
2543
2544 Error wait() override {
2545 // Wait for the information on the required backend compilations to be
2546 // gathered.
2547 BackendThreadPool.wait();
2548 if (Err)
2549 return std::move(*Err);
2550
2551 auto CleanPerJobFiles = llvm::make_scope_exit([&] {
2552 llvm::TimeTraceScope TimeScope("Remove DTLTO temporary files");
2553 if (!SaveTemps)
2554 for (auto &Job : Jobs) {
2555 removeFile(Job.NativeObjectPath);
2556 if (!ShouldEmitIndexFiles)
2557 removeFile(Job.SummaryIndexPath);
2558 }
2559 });
2560
2561 const StringRef BCError = "DTLTO backend compilation: ";
2562
2563 buildCommonRemoteCompilerOptions();
2564
2565 SString JsonFile = sys::path::parent_path(LinkerOutputFile);
2566 {
2567 llvm::TimeTraceScope TimeScope("Emit DTLTO JSON");
2568 sys::path::append(JsonFile, sys::path::stem(LinkerOutputFile) + "." +
2569 UID + ".dist-file.json");
2570 // Cleanup DTLTO JSON file on abnormal process exit.
2571 if (!SaveTemps)
2573 if (!emitDistributorJson(JsonFile))
2575 BCError + "failed to generate distributor JSON script: " + JsonFile,
2577 }
2578 auto CleanJson = llvm::make_scope_exit([&] {
2579 if (!SaveTemps)
2580 removeFile(JsonFile);
2581 });
2582
2583 {
2584 llvm::TimeTraceScope TimeScope("Execute DTLTO distributor",
2585 DistributorPath);
2586 // Checks if we have any jobs that don't have corresponding cache entries.
2587 if (CachedJobs.load() < Jobs.size()) {
2588 SmallVector<StringRef, 3> Args = {DistributorPath};
2589 llvm::append_range(Args, DistributorArgs);
2590 Args.push_back(JsonFile);
2591 std::string ErrMsg;
2592 if (sys::ExecuteAndWait(Args[0], Args,
2593 /*Env=*/std::nullopt, /*Redirects=*/{},
2594 /*SecondsToWait=*/0, /*MemoryLimit=*/0,
2595 &ErrMsg)) {
2597 BCError + "distributor execution failed" +
2598 (!ErrMsg.empty() ? ": " + ErrMsg + Twine(".") : Twine(".")),
2600 }
2601 }
2602 }
2603
2604 {
2605 llvm::TimeTraceScope FilesScope("Add DTLTO files to the link");
2606 for (auto &Job : Jobs) {
2607 if (!Job.CacheKey.empty() && Job.Cached) {
2608 assert(Cache.isValid());
2609 continue;
2610 }
2611 // Load the native object from a file into a memory buffer
2612 // and store its contents in the output buffer.
2613 auto ObjFileMbOrErr =
2614 MemoryBuffer::getFile(Job.NativeObjectPath, /*IsText=*/false,
2615 /*RequiresNullTerminator=*/false);
2616 if (std::error_code EC = ObjFileMbOrErr.getError())
2618 BCError + "cannot open native object file: " +
2619 Job.NativeObjectPath + ": " + EC.message(),
2621
2622 MemoryBufferRef ObjFileMbRef = ObjFileMbOrErr->get()->getMemBufferRef();
2623 if (Cache.isValid()) {
2624 // Cache hits are taken care of earlier. At this point, we could only
2625 // have cache misses.
2626 assert(Job.CacheAddStream);
2627 // Obtain a file stream for a storing a cache entry.
2628 auto CachedFileStreamOrErr =
2629 Job.CacheAddStream(Job.Task, Job.ModuleID);
2630 if (!CachedFileStreamOrErr)
2631 return joinErrors(
2632 CachedFileStreamOrErr.takeError(),
2634 "Cannot get a cache file stream: %s",
2635 Job.NativeObjectPath.data()));
2636 // Store a file buffer into the cache stream.
2637 auto &CacheStream = *(CachedFileStreamOrErr->get());
2638 *(CacheStream.OS) << ObjFileMbRef.getBuffer();
2639 if (Error Err = CacheStream.commit())
2640 return Err;
2641 } else {
2642 auto StreamOrErr = AddStream(Job.Task, Job.ModuleID);
2643 if (Error Err = StreamOrErr.takeError())
2644 report_fatal_error(std::move(Err));
2645 auto &Stream = *StreamOrErr->get();
2646 *Stream.OS << ObjFileMbRef.getBuffer();
2647 if (Error Err = Stream.commit())
2648 report_fatal_error(std::move(Err));
2649 }
2650 }
2651 }
2652 return Error::success();
2653 }
2654};
2655} // end anonymous namespace
2656
2658 ThreadPoolStrategy Parallelism, lto::IndexWriteCallback OnWrite,
2659 bool ShouldEmitIndexFiles, bool ShouldEmitImportsFiles,
2660 StringRef LinkerOutputFile, StringRef Distributor,
2661 ArrayRef<StringRef> DistributorArgs, StringRef RemoteCompiler,
2662 ArrayRef<StringRef> RemoteCompilerPrependArgs,
2663 ArrayRef<StringRef> RemoteCompilerArgs, bool SaveTemps) {
2664 auto Func =
2665 [=](const Config &Conf, ModuleSummaryIndex &CombinedIndex,
2666 const DenseMap<StringRef, GVSummaryMapTy> &ModuleToDefinedGVSummaries,
2667 AddStreamFn AddStream, FileCache Cache) {
2668 return std::make_unique<OutOfProcessThinBackend>(
2669 Conf, CombinedIndex, Parallelism, ModuleToDefinedGVSummaries,
2670 AddStream, Cache, OnWrite, ShouldEmitIndexFiles,
2671 ShouldEmitImportsFiles, LinkerOutputFile, Distributor,
2672 DistributorArgs, RemoteCompiler, RemoteCompilerPrependArgs,
2673 RemoteCompilerArgs, SaveTemps);
2674 };
2675 return ThinBackend(Func, Parallelism);
2676}
assert(UImm &&(UImm !=~static_cast< T >(0)) &&"Invalid immediate!")
MachineBasicBlock MachineBasicBlock::iterator DebugLoc DL
Function Alias Analysis false
static GCRegistry::Add< ErlangGC > A("erlang", "erlang-compatible garbage collector")
static GCRegistry::Add< CoreCLRGC > E("coreclr", "CoreCLR-compatible GC")
dxil translate DXIL Translate Metadata
#define DEBUG_TYPE
const AbstractManglingParser< Derived, Alloc >::OperatorInfo AbstractManglingParser< Derived, Alloc >::Ops[]
This file supports working with JSON data.
static void writeToResolutionFile(raw_ostream &OS, InputFile *Input, ArrayRef< SymbolResolution > Res)
Definition LTO.cpp:719
static void thinLTOResolvePrevailingGUID(const Config &C, ValueInfo VI, DenseSet< GlobalValueSummary * > &GlobalInvolvedWithAlias, function_ref< bool(GlobalValue::GUID, const GlobalValueSummary *)> isPrevailing, function_ref< void(StringRef, GlobalValue::GUID, GlobalValue::LinkageTypes)> recordNewLinkage, const DenseSet< GlobalValue::GUID > &GUIDPreservedSymbols)
Definition LTO.cpp:369
static void handleNonPrevailingComdat(GlobalValue &GV, std::set< const Comdat * > &NonPrevailingComdats)
Definition LTO.cpp:849
static cl::opt< bool > DumpThinCGSCCs("dump-thin-cg-sccs", cl::init(false), cl::Hidden, cl::desc("Dump the SCCs in the ThinLTO index's callgraph"))
static void thinLTOInternalizeAndPromoteGUID(ValueInfo VI, function_ref< bool(StringRef, ValueInfo)> isExported, function_ref< bool(GlobalValue::GUID, const GlobalValueSummary *)> isPrevailing)
Definition LTO.cpp:471
Legalize the Machine IR a function s Machine IR
Definition Legalizer.cpp:80
#define F(x, y, z)
Definition MD5.cpp:54
#define I(x, y, z)
Definition MD5.cpp:57
#define G(x, y, z)
Definition MD5.cpp:55
Machine Check Debug Module
This file contains the declarations for metadata subclasses.
#define P(N)
Provides a library for accessing information about this process and other processes on the operating ...
static const char * name
This file defines the make_scope_exit function, which executes user-defined cleanup logic at scope ex...
This file defines the SmallSet class.
This file defines the 'Statistic' class, which is designed to be an easy way to expose various metric...
This file contains some functions that are useful when dealing with strings.
#define LLVM_DEBUG(...)
Definition Debug.h:114
This pass exposes codegen information to IR-level passes.
The Input class is used to parse a yaml document into in-memory structs and vectors.
ArrayRef - Represent a constant reference to an array (0 or more elements consecutively in memory),...
Definition ArrayRef.h:40
iterator end() const
Definition ArrayRef.h:131
iterator begin() const
Definition ArrayRef.h:130
bool empty() const
empty - Check if the array is empty.
Definition ArrayRef.h:137
const T & consume_front()
consume_front() - Returns the first element and drops it from ArrayRef.
Definition ArrayRef.h:157
static LLVM_ABI ArrayType * get(Type *ElementType, uint64_t NumElements)
This static method is the primary way to construct an ArrayType.
Represents a module in a bitcode file.
StringRef getModuleIdentifier() const
LLVM_ABI Error readSummary(ModuleSummaryIndex &CombinedIndex, StringRef ModulePath, std::function< bool(GlobalValue::GUID)> IsPrevailing=nullptr)
Parse the specified bitcode buffer and merge its module summary index into CombinedIndex.
LLVM_ABI Expected< std::unique_ptr< Module > > parseModule(LLVMContext &Context, ParserCallbacks Callbacks={})
Read the entire bitcode module and return it.
LLVM_ABI Expected< std::unique_ptr< Module > > getLazyModule(LLVMContext &Context, bool ShouldLazyLoadMetadata, bool IsImporting, ParserCallbacks Callbacks={})
Read the bitcode module and prepare for lazy deserialization of function bodies.
static LLVM_ABI ConstantAggregateZero * get(Type *Ty)
A parsed version of the target data layout string in and methods for querying it.
Definition DataLayout.h:64
iterator find(const_arg_type_t< KeyT > Val)
Definition DenseMap.h:178
std::pair< iterator, bool > try_emplace(KeyT &&Key, Ts &&...Args)
Definition DenseMap.h:256
size_type count(const_arg_type_t< KeyT > Val) const
Return 1 if the specified key is in the map, 0 otherwise.
Definition DenseMap.h:174
iterator end()
Definition DenseMap.h:81
Implements a dense probed hash-table based set.
Definition DenseSet.h:279
Lightweight error class with error context and mandatory checking.
Definition Error.h:159
static ErrorSuccess success()
Create a success value.
Definition Error.h:336
Tagged union holding either a T or a Error.
Definition Error.h:485
Error takeError()
Take ownership of the stored error.
Definition Error.h:612
The map maintains the list of imports.
DenseSet< ValueInfo > ExportSetTy
The set contains an entry for every global value that the module exports.
Function and variable summary information to aid decisions and implementation of importing.
static bool isAppendingLinkage(LinkageTypes Linkage)
static LLVM_ABI GUID getGUIDAssumingExternalLinkage(StringRef GlobalName)
Return a 64-bit global unique ID constructed from the name of a global symbol.
Definition Globals.cpp:77
static bool isExternalWeakLinkage(LinkageTypes Linkage)
static bool isLocalLinkage(LinkageTypes Linkage)
LLVM_ABI bool isDeclaration() const
Return true if the primary definition of this global value is outside of the current translation unit...
Definition Globals.cpp:328
void setUnnamedAddr(UnnamedAddr Val)
uint64_t GUID
Declare a type to represent a global unique identifier for a global value.
bool hasLocalLinkage() const
static StringRef dropLLVMManglingEscape(StringRef Name)
If the given string begins with the GlobalValue name mangling escape character '\1',...
LLVM_ABI const Comdat * getComdat() const
Definition Globals.cpp:201
static bool isLinkOnceLinkage(LinkageTypes Linkage)
void setLinkage(LinkageTypes LT)
DLLStorageClassTypes
Storage classes of global values for PE targets.
Definition GlobalValue.h:74
GUID getGUID() const
Return a 64-bit global unique ID constructed from global value name (i.e.
static bool isExternalLinkage(LinkageTypes Linkage)
VisibilityTypes
An enumeration for the kinds of visibility of global values.
Definition GlobalValue.h:67
@ DefaultVisibility
The GV is visible.
Definition GlobalValue.h:68
static LLVM_ABI std::string getGlobalIdentifier(StringRef Name, GlobalValue::LinkageTypes Linkage, StringRef FileName)
Return the modified name for a global value suitable to be used as the key for a global lookup (e....
Definition Globals.cpp:161
static LinkageTypes getWeakLinkage(bool ODR)
static bool isWeakForLinker(LinkageTypes Linkage)
Whether the definition of this global may be replaced at link time.
bool hasAppendingLinkage() const
bool hasAvailableExternallyLinkage() const
LinkageTypes
An enumeration for the kinds of linkage for global values.
Definition GlobalValue.h:52
@ CommonLinkage
Tentative definitions.
Definition GlobalValue.h:63
@ InternalLinkage
Rename collisions when linking (static functions).
Definition GlobalValue.h:60
@ ExternalLinkage
Externally visible function.
Definition GlobalValue.h:53
@ WeakAnyLinkage
Keep one copy of named function when linking (weak)
Definition GlobalValue.h:57
@ AvailableExternallyLinkage
Available for inspection, not emission.
Definition GlobalValue.h:54
DLLStorageClassTypes getDLLStorageClass() const
Type * getValueType() const
static bool isLinkOnceODRLinkage(LinkageTypes Linkage)
LLVM_ABI void eraseFromParent()
eraseFromParent - This method unlinks 'this' from the containing module and deletes it.
Definition Globals.cpp:520
void setAlignment(Align Align)
Sets the alignment attribute of the GlobalVariable.
This is an important class for using LLVM in a threaded context.
Definition LLVMContext.h:68
static MDTuple * get(LLVMContext &Context, ArrayRef< Metadata * > MDs)
Definition Metadata.h:1526
This class implements a map that also provides access to all stored values in a deterministic order.
Definition MapVector.h:36
bool empty() const
Definition MapVector.h:77
iterator begin()
Definition MapVector.h:65
size_type size() const
Definition MapVector.h:56
PreservedAnalyses run(Module &M, ModuleAnalysisManager &AM)
StringRef getBuffer() const
static ErrorOr< std::unique_ptr< MemoryBuffer > > getFile(const Twine &Filename, bool IsText=false, bool RequiresNullTerminator=true, bool IsVolatile=false, std::optional< Align > Alignment=std::nullopt)
Open the specified file as a MemoryBuffer, returning a new MemoryBuffer if successful,...
Class to hold module path string table and global value map, and encapsulate methods for operating on...
CfiFunctionIndex & cfiFunctionDecls()
const ModuleHash & getModuleHash(const StringRef ModPath) const
Get the module SHA1 hash recorded for the given module path.
const StringMap< ModuleHash > & modulePaths() const
Table of modules, containing module hash and id.
CfiFunctionIndex & cfiFunctionDefs()
LLVM_ABI void addModule(Module *M)
static LLVM_ABI void CollectAsmSymvers(const Module &M, function_ref< void(StringRef, StringRef)> AsmSymver)
Parse inline ASM and collect the symvers directives that are defined in the current module.
PointerUnion< GlobalValue *, AsmSymbol * > Symbol
LLVM_ABI uint32_t getSymbolFlags(Symbol S) const
ArrayRef< Symbol > symbols() const
A Module instance is used to store all the information related to an LLVM module.
Definition Module.h:67
A class that wrap the SHA1 algorithm.
Definition SHA1.h:27
LLVM_ABI void update(ArrayRef< uint8_t > Data)
Digest more data.
Definition SHA1.cpp:208
LLVM_ABI std::array< uint8_t, 20 > result()
Return the current raw 160-bits SHA1 for the digested data since the last call to init().
Definition SHA1.cpp:288
size_type count(const T &V) const
count - Return 1 if the element is in the set, 0 otherwise.
Definition SmallSet.h:175
bool empty() const
Definition SmallSet.h:168
bool erase(const T &V)
Definition SmallSet.h:199
std::pair< const_iterator, bool > insert(const T &V)
insert - Insert an element into the set if it isn't already there.
Definition SmallSet.h:183
SmallString - A SmallString is just a SmallVector with methods and accessors that make it work better...
Definition SmallString.h:26
StringRef str() const
Explicit conversion to StringRef.
void reserve(size_type N)
void resize(size_type N)
void push_back(const T &Elt)
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
A wrapper around a string literal that serves as a proxy for constructing global tables of StringRefs...
Definition StringRef.h:864
size_type count(StringRef Key) const
count - Return 1 if the element is in the map, 0 otherwise.
Definition StringMap.h:285
StringRef - Represent a constant reference to a string, i.e.
Definition StringRef.h:55
constexpr bool empty() const
empty - Check if the string is empty.
Definition StringRef.h:143
constexpr const char * data() const
data - Get a pointer to the start of the string (which may not be null terminated).
Definition StringRef.h:140
Saves strings in the provided stable storage and returns a StringRef with a stable character pointer.
Definition StringSaver.h:22
StringRef save(const char *S)
Definition StringSaver.h:31
MCTargetOptions MCOptions
Machine level options.
DebuggerKind DebuggerTuning
Which debugger to tune for.
unsigned FunctionSections
Emit functions into separate sections.
unsigned DataSections
Emit data into separate sections.
This tells how a thread pool will be used.
Definition Threading.h:115
The TimeTraceScope is a helper class to call the begin and end functions of the time trace profiler.
Triple - Helper class for working with autoconf configuration names.
Definition Triple.h:47
bool isArm64e() const
Tests whether the target is the Apple "arm64e" AArch64 subarch.
Definition Triple.h:1159
ArchType getArch() const
Get the parsed architecture type of this triple.
Definition Triple.h:414
bool isOSBinFormatCOFF() const
Tests whether the OS uses the COFF binary format.
Definition Triple.h:791
const std::string & str() const
Definition Triple.h:481
bool isOSDarwin() const
Is this a "Darwin" OS (macOS, iOS, tvOS, watchOS, DriverKit, XROS, or bridgeOS).
Definition Triple.h:628
bool isOSBinFormatELF() const
Tests whether the OS uses the ELF binary format.
Definition Triple.h:786
Twine - A lightweight data structure for efficiently representing the concatenation of temporary valu...
Definition Twine.h:82
The instances of the Type class are immutable: once they are created, they are never changed.
Definition Type.h:45
static LLVM_ABI IntegerType * getInt8Ty(LLVMContext &C)
Definition Type.cpp:294
LLVM_ABI void setName(const Twine &Name)
Change the name of the value.
Definition Value.cpp:397
LLVM_ABI void replaceAllUsesWith(Value *V)
Change all uses of this to point to a new Value.
Definition Value.cpp:553
bool use_empty() const
Definition Value.h:346
LLVM_ABI StringRef getName() const
Return a constant reference to the value's name.
Definition Value.cpp:322
LLVM_ABI void takeName(Value *V)
Transfer the name from V to this value.
Definition Value.cpp:403
std::pair< iterator, bool > insert(const ValueT &V)
Definition DenseSet.h:202
iterator find(const_arg_type_t< ValueT > V)
Definition DenseSet.h:167
void insert_range(Range &&R)
Definition DenseSet.h:228
size_type size() const
Definition DenseSet.h:87
bool contains(const_arg_type_t< ValueT > V) const
Check if the set contains the given element.
Definition DenseSet.h:175
size_type count(const_arg_type_t< ValueT > V) const
Return 1 if the specified key is in the set, 0 otherwise.
Definition DenseSet.h:180
An efficient, type-erasing, non-owning reference to a callable.
Ephemeral symbols produced by Reader::symbols() and Reader::module_symbols().
Definition IRSymtab.h:316
An input file.
Definition LTO.h:113
static LLVM_ABI Expected< std::unique_ptr< InputFile > > create(MemoryBufferRef Object)
Create an InputFile.
Definition LTO.cpp:569
ArrayRef< Symbol > symbols() const
A range over the symbols in this InputFile.
Definition LTO.h:173
LLVM_ABI StringRef getName() const
Returns the path to the InputFile.
Definition LTO.cpp:600
LLVM_ABI BitcodeModule & getSingleBitcodeModule()
Definition LTO.cpp:604
LLVM_ABI LTO(Config Conf, ThinBackend Backend={}, unsigned ParallelCodeGenParallelismLevel=1, LTOKind LTOMode=LTOK_Default)
Create an LTO object.
Definition LTO.cpp:622
LLVM_ABI Error add(std::unique_ptr< InputFile > Obj, ArrayRef< SymbolResolution > Res)
Add an input file to the LTO link, using the provided symbol resolutions.
Definition LTO.cpp:743
static LLVM_ABI SmallVector< const char * > getRuntimeLibcallSymbols(const Triple &TT)
Static method that returns a list of libcall symbols that can be generated by LTO but might not be vi...
Definition LTO.cpp:1412
virtual Expected< std::shared_ptr< lto::InputFile > > addInput(std::unique_ptr< lto::InputFile > InputPtr)
Definition LTO.h:620
virtual llvm::Error handleArchiveInputs()
Definition LTO.h:624
LTOKind
Unified LTO modes.
Definition LTO.h:399
@ LTOK_UnifiedRegular
Regular LTO, with Unified LTO enabled.
Definition LTO.h:404
@ LTOK_Default
Any LTO mode without Unified LTO. The default mode.
Definition LTO.h:401
@ LTOK_UnifiedThin
ThinLTO, with Unified LTO enabled.
Definition LTO.h:407
virtual LLVM_ABI ~LTO()
LLVM_ABI unsigned getMaxTasks() const
Returns an upper bound on the number of tasks that the client may expect.
Definition LTO.cpp:1166
LLVM_ABI Error run(AddStreamFn AddStream, FileCache Cache={})
Runs the LTO pipeline.
Definition LTO.cpp:1217
This class defines the interface to the ThinLTO backend.
Definition LTO.h:227
const DenseMap< StringRef, GVSummaryMapTy > & ModuleToDefinedGVSummaries
Definition LTO.h:231
LLVM_ABI Error emitFiles(const FunctionImporter::ImportMapTy &ImportList, StringRef ModulePath, const std::string &NewModulePath) const
Definition LTO.cpp:1425
ModuleSummaryIndex & CombinedIndex
Definition LTO.h:230
A raw_ostream that writes to a file descriptor.
This class implements an extremely fast bulk output stream that can only output to a stream.
Definition raw_ostream.h:53
static LLVM_ABI Pid getProcessId()
Get the process's identifier.
#define llvm_unreachable(msg)
Marks that the current location is not supposed to be reachable.
constexpr char Align[]
Key for Kernel::Arg::Metadata::mAlign.
constexpr char Args[]
Key for Kernel::Metadata::mArgs.
@ C
The default llvm calling convention, compatible with C.
Definition CallingConv.h:34
LLVM_ABI Function * getDeclarationIfExists(const Module *M, ID id)
Look up the Function declaration of the intrinsic id in the Module M and return it if it exists.
static auto libcall_impls()
LLVM_ABI Expected< stable_hash > mergeCodeGenData(ArrayRef< StringRef > ObjectFiles)
Merge the codegen data from the scratch objects ObjectFiles from the first codegen round.
LLVM_ABI std::unique_ptr< Module > loadModuleForTwoRounds(BitcodeModule &OrigModule, unsigned Task, LLVMContext &Context, ArrayRef< StringRef > IRFiles)
Load the optimized bitcode module for the second codegen round.
initializer< Ty > init(const Ty &Val)
LLVM_ABI ThinBackend createInProcessThinBackend(ThreadPoolStrategy Parallelism, IndexWriteCallback OnWrite=nullptr, bool ShouldEmitIndexFiles=false, bool ShouldEmitImportsFiles=false)
This ThinBackend runs the individual backend jobs in-process.
Definition LTO.cpp:1775
LLVM_ABI std::string getThinLTOOutputFile(StringRef Path, StringRef OldPrefix, StringRef NewPrefix)
Given the original Path to an output file, replace any path prefix matching OldPrefix with NewPrefix.
Definition LTO.cpp:1809
LLVM_ABI StringLiteral getThinLTODefaultCPU(const Triple &TheTriple)
Definition LTO.cpp:1791
LLVM_ABI Expected< std::unique_ptr< ToolOutputFile > > setupStatsFile(StringRef StatsFilename)
Setups the output file for saving statistics.
Definition LTO.cpp:2189
LLVM_ABI ThinBackend createOutOfProcessThinBackend(ThreadPoolStrategy Parallelism, IndexWriteCallback OnWrite, bool ShouldEmitIndexFiles, bool ShouldEmitImportsFiles, StringRef LinkerOutputFile, StringRef Distributor, ArrayRef< StringRef > DistributorArgs, StringRef RemoteCompiler, ArrayRef< StringRef > RemoteCompilerPrependArgs, ArrayRef< StringRef > RemoteCompilerArgs, bool SaveTemps)
This ThinBackend generates the index shards and then runs the individual backend jobs via an external...
Definition LTO.cpp:2657
LLVM_ABI Error backend(const Config &C, AddStreamFn AddStream, unsigned ParallelCodeGenParallelismLevel, Module &M, ModuleSummaryIndex &CombinedIndex)
Runs a regular LTO backend.
std::function< void(const std::string &)> IndexWriteCallback
Definition LTO.h:222
LLVM_ABI Error finalizeOptimizationRemarks(LLVMRemarkFileHandle DiagOutputFile)
LLVM_ABI ThinBackend createWriteIndexesThinBackend(ThreadPoolStrategy Parallelism, std::string OldPrefix, std::string NewPrefix, std::string NativeObjectPrefix, bool ShouldEmitImportsFiles, raw_fd_ostream *LinkedObjectsFile, IndexWriteCallback OnWrite)
This ThinBackend writes individual module indexes to files, instead of running the individual backend...
Definition LTO.cpp:1895
LLVM_ABI Expected< LLVMRemarkFileHandle > setupLLVMOptimizationRemarks(LLVMContext &Context, StringRef RemarksFilename, StringRef RemarksPasses, StringRef RemarksFormat, bool RemarksWithHotness, std::optional< uint64_t > RemarksHotnessThreshold=0, int Count=-1)
Setup optimization remarks.
Definition LTO.cpp:2164
LLVM_ABI std::vector< int > generateModulesOrdering(ArrayRef< BitcodeModule * > R)
Produces a container ordering for optimal multi-threaded processing.
Definition LTO.cpp:2208
LLVM_ABI Error thinBackend(const Config &C, unsigned Task, AddStreamFn AddStream, Module &M, const ModuleSummaryIndex &CombinedIndex, const FunctionImporter::ImportMapTy &ImportList, const GVSummaryMapTy &DefinedGlobals, MapVector< StringRef, BitcodeModule > *ModuleMap, bool CodeGenOnly, AddStreamFn IRAddStream=nullptr, const std::vector< uint8_t > &CmdArgs=std::vector< uint8_t >())
Runs a ThinLTO backend.
llvm::SmallVector< std::string > ImportsFilesContainer
Definition LTO.h:224
LLVM_ABI Expected< IRSymtabFile > readIRSymtab(MemoryBufferRef MBRef)
Reads a bitcode file, creating its irsymtab if necessary.
DiagnosticInfoOptimizationBase::Argument NV
void write64le(void *P, uint64_t V)
Definition Endian.h:478
void write32le(void *P, uint32_t V)
Definition Endian.h:475
LLVM_ABI std::error_code remove(const Twine &path, bool IgnoreNonExisting=true)
Remove path.
LLVM_ABI std::error_code create_directories(const Twine &path, bool IgnoreExisting=true, perms Perms=owner_all|group_all)
Create all the non-existent directories in path.
Definition Path.cpp:972
LLVM_ABI StringRef stem(StringRef path LLVM_LIFETIME_BOUND, Style style=Style::native)
Get stem.
Definition Path.cpp:580
LLVM_ABI StringRef parent_path(StringRef path LLVM_LIFETIME_BOUND, Style style=Style::native)
Get parent path.
Definition Path.cpp:468
LLVM_ABI bool replace_path_prefix(SmallVectorImpl< char > &Path, StringRef OldPrefix, StringRef NewPrefix, Style style=Style::native)
Replace matching path prefix with another path.
Definition Path.cpp:519
LLVM_ABI void append(SmallVectorImpl< char > &path, const Twine &a, const Twine &b="", const Twine &c="", const Twine &d="")
Append to path.
Definition Path.cpp:457
LLVM_ABI bool RemoveFileOnSignal(StringRef Filename, std::string *ErrMsg=nullptr)
This function registers signal handlers to ensure that if a signal gets delivered that the named file...
LLVM_ABI int ExecuteAndWait(StringRef Program, ArrayRef< StringRef > Args, std::optional< ArrayRef< StringRef > > Env=std::nullopt, ArrayRef< std::optional< StringRef > > Redirects={}, unsigned SecondsToWait=0, unsigned MemoryLimit=0, std::string *ErrMsg=nullptr, bool *ExecutionFailed=nullptr, std::optional< ProcessStatistics > *ProcStat=nullptr, BitVector *AffinityMask=nullptr)
This function executes the program using the arguments provided.
Definition Program.cpp:32
This is an optimization pass for GlobalISel generic memory operations.
Definition Types.h:26
ThreadPoolStrategy heavyweight_hardware_concurrency(unsigned ThreadCount=0)
Returns a thread strategy for tasks requiring significant memory or other resources.
Definition Threading.h:167
detail::zippy< detail::zip_shortest, T, U, Args... > zip(T &&t, U &&u, Args &&...args)
zip iterator for two or more iteratable types.
Definition STLExtras.h:829
cl::opt< std::string > RemarksFormat("lto-pass-remarks-format", cl::desc("The format used for serializing remarks (default: YAML)"), cl::value_desc("format"), cl::init("yaml"))
bool all_of(R &&range, UnaryPredicate P)
Provide wrappers to std::all_of which take ranges instead of having to pass begin/end explicitly.
Definition STLExtras.h:1737
Error createFileError(const Twine &F, Error E)
Concatenate a source file path and/or name with an Error.
Definition Error.h:1399
std::unordered_set< GlobalValueSummary * > GVSummaryPtrSet
A set of global value summary pointers.
decltype(auto) dyn_cast(const From &Val)
dyn_cast<X> - Return the argument parameter cast to the specified type.
Definition Casting.h:643
void generateParamAccessSummary(ModuleSummaryIndex &Index)
cl::opt< bool > CodeGenDataThinLTOTwoRounds("codegen-data-thinlto-two-rounds", cl::init(false), cl::Hidden, cl::desc("Enable two-round ThinLTO code generation. The first round " "emits codegen data, while the second round uses the emitted " "codegen data for further optimizations."))
Definition LTO.cpp:79
LLVM_ABI Expected< LLVMRemarkFileHandle > setupLLVMOptimizationRemarks(LLVMContext &Context, StringRef RemarksFilename, StringRef RemarksPasses, StringRef RemarksFormat, bool RemarksWithHotness, std::optional< uint64_t > RemarksHotnessThreshold=0)
Set up optimization remarks that output to a file.
cl::opt< std::string > RemarksPasses("lto-pass-remarks-filter", cl::desc("Only record optimization remarks from passes whose " "names match the given regular expression"), cl::value_desc("regex"))
LLVM_ABI std::error_code inconvertibleErrorCode()
The value returned by this function can be returned from convertToErrorCode for Error values where no...
Definition Error.cpp:98
LLVM_ABI raw_fd_ostream & outs()
This returns a reference to a raw_fd_ostream for standard output.
DenseMap< GlobalValue::GUID, GlobalValueSummary * > GVSummaryMapTy
Map of global value GUID to its summary, used to identify values defined in a particular module,...
auto dyn_cast_if_present(const Y &Val)
dyn_cast_if_present<X> - Functionally identical to dyn_cast, except that a null (or none in the case ...
Definition Casting.h:732
iterator_range< T > make_range(T x, T y)
Convenience function for iterating over sub-ranges.
void append_range(Container &C, Range &&R)
Wrapper function to append range R to container C.
Definition STLExtras.h:2184
uint64_t stable_hash
An opaque object representing a stable hash code.
std::string utostr(uint64_t X, bool isNeg=false)
LLVM_ABI bool thinLTOPropagateFunctionAttrs(ModuleSummaryIndex &Index, function_ref< bool(GlobalValue::GUID, const GlobalValueSummary *)> isPrevailing)
Propagate function attributes for function summaries along the index's callgraph during thinlink.
Error createStringError(std::error_code EC, char const *Fmt, const Ts &... Vals)
Create formatted StringError object.
Definition Error.h:1305
LLVM_ABI bool hasWholeProgramVisibility(bool WholeProgramVisibilityEnabledInLTO)
LLVM_ABI void writeIndexToFile(const ModuleSummaryIndex &Index, raw_ostream &Out, const ModuleToSummariesForIndexTy *ModuleToSummariesForIndex=nullptr, const GVSummaryPtrSet *DecSummaries=nullptr)
Write the specified module summary index to the given raw output stream, where it will be written in ...
LLVM_ABI void ComputeCrossModuleImport(const ModuleSummaryIndex &Index, const DenseMap< StringRef, GVSummaryMapTy > &ModuleToDefinedGVSummaries, function_ref< bool(GlobalValue::GUID, const GlobalValueSummary *)> isPrevailing, FunctionImporter::ImportListsTy &ImportLists, DenseMap< StringRef, FunctionImporter::ExportSetTy > &ExportLists)
Compute all the imports and exports for every module in the Index.
auto dyn_cast_or_null(const Y &Val)
Definition Casting.h:753
LLVM_ABI void EnableStatistics(bool DoPrintOnExit=true)
Enable the collection and printing of statistics.
LLVM_ABI void thinLTOInternalizeAndPromoteInIndex(ModuleSummaryIndex &Index, function_ref< bool(StringRef, ValueInfo)> isExported, function_ref< bool(GlobalValue::GUID, const GlobalValueSummary *)> isPrevailing)
Update the linkages in the given Index to mark exported values as external and non-exported values as...
Definition LTO.cpp:554
LLVM_ABI void timeTraceProfilerInitialize(unsigned TimeTraceGranularity, StringRef ProcName, bool TimeTraceVerbose=false)
Initialize the time trace profiler.
LLVM_ABI void timeTraceProfilerFinishThread()
Finish a time trace profiler running on a worker thread.
LLVM_ABI std::string recomputeLTOCacheKey(const std::string &Key, StringRef ExtraID)
Recomputes the LTO cache key for a given key with an extra identifier.
Definition LTO.cpp:355
Error joinErrors(Error E1, Error E2)
Concatenate errors.
Definition Error.h:442
LLVM_ABI void updatePublicTypeTestCalls(Module &M, bool WholeProgramVisibilityEnabledInLTO)
LLVM_ABI void getVisibleToRegularObjVtableGUIDs(ModuleSummaryIndex &Index, DenseSet< GlobalValue::GUID > &VisibleToRegularObjSymbols, function_ref< bool(StringRef)> IsVisibleToRegularObj)
Based on typeID string, get all associated vtable GUIDS that are visible to regular objects.
void sort(IteratorTy Start, IteratorTy End)
Definition STLExtras.h:1634
bool timeTraceProfilerEnabled()
Is the time trace profiler enabled, i.e. initialized?
LLVM_ABI raw_ostream & dbgs()
dbgs() - This returns a reference to a raw_ostream for debugging messages.
Definition Debug.cpp:207
LLVM_ABI void report_fatal_error(Error Err, bool gen_crash_diag=true)
Definition Error.cpp:167
FunctionAddr VTableAddr Count
Definition InstrProf.h:139
std::map< std::string, GVSummaryMapTy, std::less<> > ModuleToSummariesForIndexTy
Map of a module name to the GUIDs and summaries we will import from that module.
LLVM_ABI cl::opt< bool > EnableLTOInternalization
Enable global value internalization in LTO.
cl::opt< bool > RemarksWithHotness("lto-pass-remarks-with-hotness", cl::desc("With PGO, include profile count in optimization remarks"), cl::Hidden)
LLVM_ABI void timeTraceProfilerEnd()
Manually end the last time section.
cl::opt< std::string > RemarksFilename("lto-pass-remarks-output", cl::desc("Output filename for pass remarks"), cl::value_desc("filename"))
cl::opt< bool > SupportsHotColdNew
Indicate we are linking with an allocator that supports hot/cold operator new interfaces.
LLVM_ABI void updateIndexWPDForExports(ModuleSummaryIndex &Summary, function_ref< bool(StringRef, ValueInfo)> isExported, std::map< ValueInfo, std::vector< VTableSlotSummary > > &LocalWPDTargetsMap)
Call after cross-module importing to update the recorded single impl devirt target names for any loca...
class LLVM_GSL_OWNER SmallVector
Forward declaration of SmallVector so that calculateSmallVectorDefaultInlinedElements can reference s...
LLVM_ABI void thinLTOResolvePrevailingInIndex(const lto::Config &C, ModuleSummaryIndex &Index, function_ref< bool(GlobalValue::GUID, const GlobalValueSummary *)> isPrevailing, function_ref< void(StringRef, GlobalValue::GUID, GlobalValue::LinkageTypes)> recordNewLinkage, const DenseSet< GlobalValue::GUID > &GUIDPreservedSymbols)
Resolve linkage for prevailing symbols in the Index.
Definition LTO.cpp:449
bool isa(const From &Val)
isa<X> - Return true if the parameter to the template is an instance of one of the template type argu...
Definition Casting.h:547
LLVM_ATTRIBUTE_VISIBILITY_DEFAULT AnalysisKey InnerAnalysisManagerProxy< AnalysisManagerT, IRUnitT, ExtraArgTs... >::Key
Error make_error(ArgTs &&... Args)
Make a Error instance representing failure using the given error info type.
Definition Error.h:340
LLVM_ABI raw_fd_ostream & errs()
This returns a reference to a raw_ostream for standard error.
@ Mod
The access may modify the value stored in memory.
Definition ModRef.h:34
std::string join(IteratorT Begin, IteratorT End, StringRef Separator)
Joins the strings in the range [Begin, End), adding Separator between the elements.
FunctionAddr VTableAddr uintptr_t uintptr_t Data
Definition InstrProf.h:189
auto make_scope_exit(Callable &&F)
Definition ScopeExit.h:53
cl::opt< bool > EnableMemProfContextDisambiguation
Enable MemProf context disambiguation for thin link.
LLVM_ABI void runWholeProgramDevirtOnIndex(ModuleSummaryIndex &Summary, std::set< GlobalValue::GUID > &ExportedGUIDs, std::map< ValueInfo, std::vector< VTableSlotSummary > > &LocalWPDTargetsMap)
Perform index-based whole program devirtualization on the Summary index.
cl::opt< bool > ForceImportAll
LLVM_ABI void gatherImportedSummariesForModule(StringRef ModulePath, const DenseMap< StringRef, GVSummaryMapTy > &ModuleToDefinedGVSummaries, const FunctionImporter::ImportMapTy &ImportList, ModuleToSummariesForIndexTy &ModuleToSummariesForIndex, GVSummaryPtrSet &DecSummaries)
Compute the set of summaries needed for a ThinLTO backend compilation of ModulePath.
ArrayRef(const T &OneElt) -> ArrayRef< T >
void toHex(ArrayRef< uint8_t > Input, bool LowerCase, SmallVectorImpl< char > &Output)
Convert buffer Input to its hexadecimal representation. The returned string is double the size of Inp...
OutputIt move(R &&Range, OutputIt Out)
Provide wrappers to std::move which take ranges instead of having to pass begin/end explicitly.
Definition STLExtras.h:1915
LLVM_ABI void processImportsFiles(StringRef ModulePath, const ModuleToSummariesForIndexTy &ModuleToSummariesForIndex, function_ref< void(const std::string &)> F)
Call F passing each of the files module ModulePath will import from.
cl::opt< std::optional< uint64_t >, false, remarks::HotnessThresholdParser > RemarksHotnessThreshold("lto-pass-remarks-hotness-threshold", cl::desc("Minimum profile count required for an " "optimization remark to be output." " Use 'auto' to apply the threshold from profile summary."), cl::value_desc("uint or 'auto'"), cl::init(0), cl::Hidden)
decltype(auto) cast(const From &Val)
cast<X> - Return the argument parameter cast to the specified type.
Definition Casting.h:559
LLVM_ABI std::string computeLTOCacheKey(const lto::Config &Conf, const ModuleSummaryIndex &Index, StringRef ModuleID, const FunctionImporter::ImportMapTy &ImportList, const FunctionImporter::ExportSetTy &ExportList, const std::map< GlobalValue::GUID, GlobalValue::LinkageTypes > &ResolvedODR, const GVSummaryMapTy &DefinedGlobals, const DenseSet< GlobalValue::GUID > &CfiFunctionDefs={}, const DenseSet< GlobalValue::GUID > &CfiFunctionDecls={})
Computes a unique hash for the Module considering the current list of export/import and other global ...
Definition LTO.cpp:104
LLVM_ABI Error errorCodeToError(std::error_code EC)
Helper for converting an std::error_code to a Error.
Definition Error.cpp:111
static cl::opt< bool > LTOKeepSymbolCopies("lto-keep-symbol-copies", cl::init(false), cl::Hidden, cl::desc("Keep copies of symbols in LTO indexing"))
LLVM_ABI bool UpgradeDebugInfo(Module &M)
Check the debug info version number, if it is out-dated, drop the debug info.
auto seq(T Begin, T End)
Iterate over an integral type from Begin up to - but not including - End.
Definition Sequence.h:305
BumpPtrAllocatorImpl<> BumpPtrAllocator
The standard BumpPtrAllocator which just uses the default template parameters.
Definition Allocator.h:383
std::function< Expected< std::unique_ptr< CachedFileStream > >( unsigned Task, const Twine &ModuleName)> AddStreamFn
This type defines the callback to add a file that is generated on the fly.
Definition Caching.h:58
LLVM_ABI void PrintStatisticsJSON(raw_ostream &OS)
Print statistics in JSON format.
LLVM_ABI void computeDeadSymbolsWithConstProp(ModuleSummaryIndex &Index, const DenseSet< GlobalValue::GUID > &GUIDPreservedSymbols, function_ref< PrevailingType(GlobalValue::GUID)> isPrevailing, bool ImportEnabled)
Compute dead symbols and run constant propagation in combined index after that.
LLVM_ABI Error EmitImportsFiles(StringRef ModulePath, StringRef OutputFilename, const ModuleToSummariesForIndexTy &ModuleToSummariesForIndex)
Emit into OutputFilename the files module ModulePath will import from.
@ Keep
No function return thunk.
Definition CodeGen.h:162
std::string itostr(int64_t X)
LLVM_ABI void updateVCallVisibilityInModule(Module &M, bool WholeProgramVisibilityEnabledInLTO, const DenseSet< GlobalValue::GUID > &DynamicExportSymbols, bool ValidateAllVtablesHaveTypeInfos, function_ref< bool(StringRef)> IsVisibleToRegularObj)
If whole program visibility asserted, then upgrade all public vcall visibility metadata on vtable def...
LLVM_ABI TimeTraceProfilerEntry * timeTraceProfilerBegin(StringRef Name, StringRef Detail)
Manually begin a time section, with the given Name and Detail.
LLVM_ABI void updateVCallVisibilityInIndex(ModuleSummaryIndex &Index, bool WholeProgramVisibilityEnabledInLTO, const DenseSet< GlobalValue::GUID > &DynamicExportSymbols, const DenseSet< GlobalValue::GUID > &VisibleToRegularObjSymbols)
If whole program visibility asserted, then upgrade all public vcall visibility metadata on vtable def...
Implement std::hash so that hash_code can be used in STL containers.
Definition BitVector.h:870
This type represents a file cache system that manages caching of files.
Definition Caching.h:84
const std::string & getCacheDirectoryPath() const
Definition Caching.h:94
bool isValid() const
Definition Caching.h:97
A simple container for information about the supported runtime calls.
unsigned getNumAvailableLibcallImpls() const
bool isAvailable(RTLIB::LibcallImpl Impl) const
static StringRef getLibcallImplName(RTLIB::LibcallImpl CallImpl)
Get the libcall routine name for the specified libcall implementation.
Struct that holds a reference to a particular GUID in a global value summary.
LTO configuration.
Definition Config.h:42
std::optional< uint64_t > RemarksHotnessThreshold
The minimum hotness value a diagnostic needs in order to be included in optimization diagnostics.
Definition Config.h:171
std::optional< CodeModel::Model > CodeModel
Definition Config.h:57
std::string AAPipeline
Definition Config.h:116
bool CodeGenOnly
Disable entirely the optimizer, including importing for ThinLTO.
Definition Config.h:69
std::vector< std::string > MAttrs
Definition Config.h:51
std::vector< std::string > MllvmArgs
Definition Config.h:52
CodeGenOptLevel CGOptLevel
Definition Config.h:58
bool Dtlto
This flag is used as one of parameters to calculate cache entries and to ensure that in-process cache...
Definition Config.h:100
std::string DefaultTriple
Setting this field will replace unspecified target triples in input files with this triple.
Definition Config.h:124
std::string CPU
Definition Config.h:49
std::string DwoDir
The directory to store .dwo files.
Definition Config.h:136
std::string RemarksFilename
Optimization remarks file path.
Definition Config.h:150
std::string OverrideTriple
Setting this field will replace target triples in input files with this triple.
Definition Config.h:120
std::string ProfileRemapping
Name remapping file for profile data.
Definition Config.h:133
TargetOptions Options
Definition Config.h:50
bool TimeTraceEnabled
Time trace enabled.
Definition Config.h:186
std::string RemarksPasses
Optimization remarks pass filter.
Definition Config.h:153
std::string OptPipeline
If this field is set, the set of passes run in the middle-end optimizer will be the one specified by ...
Definition Config.h:111
unsigned TimeTraceGranularity
Time trace granularity.
Definition Config.h:189
unsigned OptLevel
Definition Config.h:60
bool RemarksWithHotness
Whether to emit optimization remarks with hotness informations.
Definition Config.h:156
std::optional< Reloc::Model > RelocModel
Definition Config.h:56
CodeGenFileType CGFileType
Definition Config.h:59
bool Freestanding
Flag to indicate that the optimizer should not assume builtins are present on the target.
Definition Config.h:66
std::string SampleProfile
Sample PGO profile path.
Definition Config.h:130
std::string RemarksFormat
The format used for serializing remarks (default: YAML).
Definition Config.h:174
The purpose of this struct is to only expose the symbol information that an LTO client should need in...
Definition LTO.h:148
The resolution for a symbol.
Definition LTO.h:629
unsigned FinalDefinitionInLinkageUnit
The definition of this symbol is unpreemptable at runtime and is known to be in this linkage unit.
Definition LTO.h:639
unsigned ExportDynamic
The symbol was exported dynamically, and therefore could be referenced by a shared library not visibl...
Definition LTO.h:646
unsigned Prevailing
The linker has chosen this definition of the symbol.
Definition LTO.h:635
unsigned LinkerRedefined
Linker redefined version of the symbol which appeared in -wrap or -defsym linker option.
Definition LTO.h:650
unsigned VisibleToRegularObj
The definition of this symbol is visible outside of the LTO unit.
Definition LTO.h:642
This type defines the behavior following the thin-link phase during ThinLTO.
Definition LTO.h:297