1 //===-LTOBackend.cpp - LLVM Link Time Optimizer Backend -------------------===//
2 //
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6 //
7 //===----------------------------------------------------------------------===//
8 //
9 // This file implements the "backend" phase of LTO, i.e. it performs
10 // optimization and code generation on a loaded module. It is generally used
11 // internally by the LTO class but can also be used independently, for example
12 // to implement a standalone ThinLTO backend.
13 //
14 //===----------------------------------------------------------------------===//
15
16 #include "llvm/LTO/LTOBackend.h"
17 #include "llvm/Analysis/AliasAnalysis.h"
18 #include "llvm/Analysis/CGSCCPassManager.h"
19 #include "llvm/Analysis/TargetLibraryInfo.h"
20 #include "llvm/Analysis/TargetTransformInfo.h"
21 #include "llvm/Bitcode/BitcodeReader.h"
22 #include "llvm/Bitcode/BitcodeWriter.h"
23 #include "llvm/IR/LegacyPassManager.h"
24 #include "llvm/IR/PassManager.h"
25 #include "llvm/IR/RemarkStreamer.h"
26 #include "llvm/IR/Verifier.h"
27 #include "llvm/LTO/LTO.h"
28 #include "llvm/MC/SubtargetFeature.h"
29 #include "llvm/Object/ModuleSymbolTable.h"
30 #include "llvm/Passes/PassBuilder.h"
31 #include "llvm/Passes/StandardInstrumentations.h"
32 #include "llvm/Support/Error.h"
33 #include "llvm/Support/FileSystem.h"
34 #include "llvm/Support/MemoryBuffer.h"
35 #include "llvm/Support/Path.h"
36 #include "llvm/Support/Program.h"
37 #include "llvm/Support/SmallVectorMemoryBuffer.h"
38 #include "llvm/Support/TargetRegistry.h"
39 #include "llvm/Support/ThreadPool.h"
40 #include "llvm/Support/raw_ostream.h"
41 #include "llvm/Target/TargetMachine.h"
42 #include "llvm/Transforms/IPO.h"
43 #include "llvm/Transforms/IPO/PassManagerBuilder.h"
44 #include "llvm/Transforms/Scalar/LoopPassManager.h"
45 #include "llvm/Transforms/Utils/FunctionImportUtils.h"
46 #include "llvm/Transforms/Utils/SplitModule.h"
47
48 using namespace llvm;
49 using namespace lto;
50
reportOpenError(StringRef Path,Twine Msg)51 LLVM_ATTRIBUTE_NORETURN static void reportOpenError(StringRef Path, Twine Msg) {
52 errs() << "failed to open " << Path << ": " << Msg << '\n';
53 errs().flush();
54 exit(1);
55 }
56
addSaveTemps(std::string OutputFileName,bool UseInputModulePath)57 Error Config::addSaveTemps(std::string OutputFileName,
58 bool UseInputModulePath) {
59 ShouldDiscardValueNames = false;
60
61 std::error_code EC;
62 ResolutionFile = std::make_unique<raw_fd_ostream>(
63 OutputFileName + "resolution.txt", EC, sys::fs::OpenFlags::OF_Text);
64 if (EC)
65 return errorCodeToError(EC);
66
67 auto setHook = [&](std::string PathSuffix, ModuleHookFn &Hook) {
68 // Keep track of the hook provided by the linker, which also needs to run.
69 ModuleHookFn LinkerHook = Hook;
70 Hook = [=](unsigned Task, const Module &M) {
71 // If the linker's hook returned false, we need to pass that result
72 // through.
73 if (LinkerHook && !LinkerHook(Task, M))
74 return false;
75
76 std::string PathPrefix;
77 // If this is the combined module (not a ThinLTO backend compile) or the
78 // user hasn't requested using the input module's path, emit to a file
79 // named from the provided OutputFileName with the Task ID appended.
80 if (M.getModuleIdentifier() == "ld-temp.o" || !UseInputModulePath) {
81 PathPrefix = OutputFileName;
82 if (Task != (unsigned)-1)
83 PathPrefix += utostr(Task) + ".";
84 } else
85 PathPrefix = M.getModuleIdentifier() + ".";
86 std::string Path = PathPrefix + PathSuffix + ".bc";
87 std::error_code EC;
88 raw_fd_ostream OS(Path, EC, sys::fs::OpenFlags::OF_None);
89 // Because -save-temps is a debugging feature, we report the error
90 // directly and exit.
91 if (EC)
92 reportOpenError(Path, EC.message());
93 WriteBitcodeToFile(M, OS, /*ShouldPreserveUseListOrder=*/false);
94 return true;
95 };
96 };
97
98 setHook("0.preopt", PreOptModuleHook);
99 setHook("1.promote", PostPromoteModuleHook);
100 setHook("2.internalize", PostInternalizeModuleHook);
101 setHook("3.import", PostImportModuleHook);
102 setHook("4.opt", PostOptModuleHook);
103 setHook("5.precodegen", PreCodeGenModuleHook);
104
105 CombinedIndexHook =
106 [=](const ModuleSummaryIndex &Index,
107 const DenseSet<GlobalValue::GUID> &GUIDPreservedSymbols) {
108 std::string Path = OutputFileName + "index.bc";
109 std::error_code EC;
110 raw_fd_ostream OS(Path, EC, sys::fs::OpenFlags::OF_None);
111 // Because -save-temps is a debugging feature, we report the error
112 // directly and exit.
113 if (EC)
114 reportOpenError(Path, EC.message());
115 WriteIndexToFile(Index, OS);
116
117 Path = OutputFileName + "index.dot";
118 raw_fd_ostream OSDot(Path, EC, sys::fs::OpenFlags::OF_None);
119 if (EC)
120 reportOpenError(Path, EC.message());
121 Index.exportToDot(OSDot, GUIDPreservedSymbols);
122 return true;
123 };
124
125 return Error::success();
126 }
127
128 namespace {
129
130 std::unique_ptr<TargetMachine>
createTargetMachine(const Config & Conf,const Target * TheTarget,Module & M)131 createTargetMachine(const Config &Conf, const Target *TheTarget, Module &M) {
132 StringRef TheTriple = M.getTargetTriple();
133 SubtargetFeatures Features;
134 Features.getDefaultSubtargetFeatures(Triple(TheTriple));
135 for (const std::string &A : Conf.MAttrs)
136 Features.AddFeature(A);
137
138 Reloc::Model RelocModel;
139 if (Conf.RelocModel)
140 RelocModel = *Conf.RelocModel;
141 else
142 RelocModel =
143 M.getPICLevel() == PICLevel::NotPIC ? Reloc::Static : Reloc::PIC_;
144
145 Optional<CodeModel::Model> CodeModel;
146 if (Conf.CodeModel)
147 CodeModel = *Conf.CodeModel;
148 else
149 CodeModel = M.getCodeModel();
150
151 return std::unique_ptr<TargetMachine>(TheTarget->createTargetMachine(
152 TheTriple, Conf.CPU, Features.getString(), Conf.Options, RelocModel,
153 CodeModel, Conf.CGOptLevel));
154 }
155
runNewPMPasses(const Config & Conf,Module & Mod,TargetMachine * TM,unsigned OptLevel,bool IsThinLTO,ModuleSummaryIndex * ExportSummary,const ModuleSummaryIndex * ImportSummary)156 static void runNewPMPasses(const Config &Conf, Module &Mod, TargetMachine *TM,
157 unsigned OptLevel, bool IsThinLTO,
158 ModuleSummaryIndex *ExportSummary,
159 const ModuleSummaryIndex *ImportSummary) {
160 Optional<PGOOptions> PGOOpt;
161 if (!Conf.SampleProfile.empty())
162 PGOOpt = PGOOptions(Conf.SampleProfile, "", Conf.ProfileRemapping,
163 PGOOptions::SampleUse, PGOOptions::NoCSAction, true);
164 else if (Conf.RunCSIRInstr) {
165 PGOOpt = PGOOptions("", Conf.CSIRProfile, Conf.ProfileRemapping,
166 PGOOptions::IRUse, PGOOptions::CSIRInstr);
167 } else if (!Conf.CSIRProfile.empty()) {
168 PGOOpt = PGOOptions(Conf.CSIRProfile, "", Conf.ProfileRemapping,
169 PGOOptions::IRUse, PGOOptions::CSIRUse);
170 }
171
172 PassInstrumentationCallbacks PIC;
173 StandardInstrumentations SI;
174 SI.registerCallbacks(PIC);
175 PassBuilder PB(TM, Conf.PTO, PGOOpt, &PIC);
176 AAManager AA;
177
178 // Parse a custom AA pipeline if asked to.
179 if (auto Err = PB.parseAAPipeline(AA, "default"))
180 report_fatal_error("Error parsing default AA pipeline");
181
182 LoopAnalysisManager LAM(Conf.DebugPassManager);
183 FunctionAnalysisManager FAM(Conf.DebugPassManager);
184 CGSCCAnalysisManager CGAM(Conf.DebugPassManager);
185 ModuleAnalysisManager MAM(Conf.DebugPassManager);
186
187 // Register the AA manager first so that our version is the one used.
188 FAM.registerPass([&] { return std::move(AA); });
189
190 // Register all the basic analyses with the managers.
191 PB.registerModuleAnalyses(MAM);
192 PB.registerCGSCCAnalyses(CGAM);
193 PB.registerFunctionAnalyses(FAM);
194 PB.registerLoopAnalyses(LAM);
195 PB.crossRegisterProxies(LAM, FAM, CGAM, MAM);
196
197 ModulePassManager MPM(Conf.DebugPassManager);
198 // FIXME (davide): verify the input.
199
200 PassBuilder::OptimizationLevel OL;
201
202 switch (OptLevel) {
203 default:
204 llvm_unreachable("Invalid optimization level");
205 case 0:
206 OL = PassBuilder::O0;
207 break;
208 case 1:
209 OL = PassBuilder::O1;
210 break;
211 case 2:
212 OL = PassBuilder::O2;
213 break;
214 case 3:
215 OL = PassBuilder::O3;
216 break;
217 }
218
219 if (IsThinLTO)
220 MPM = PB.buildThinLTODefaultPipeline(OL, Conf.DebugPassManager,
221 ImportSummary);
222 else
223 MPM = PB.buildLTODefaultPipeline(OL, Conf.DebugPassManager, ExportSummary);
224 MPM.run(Mod, MAM);
225
226 // FIXME (davide): verify the output.
227 }
228
runNewPMCustomPasses(Module & Mod,TargetMachine * TM,std::string PipelineDesc,std::string AAPipelineDesc,bool DisableVerify)229 static void runNewPMCustomPasses(Module &Mod, TargetMachine *TM,
230 std::string PipelineDesc,
231 std::string AAPipelineDesc,
232 bool DisableVerify) {
233 PassBuilder PB(TM);
234 AAManager AA;
235
236 // Parse a custom AA pipeline if asked to.
237 if (!AAPipelineDesc.empty())
238 if (auto Err = PB.parseAAPipeline(AA, AAPipelineDesc))
239 report_fatal_error("unable to parse AA pipeline description '" +
240 AAPipelineDesc + "': " + toString(std::move(Err)));
241
242 LoopAnalysisManager LAM;
243 FunctionAnalysisManager FAM;
244 CGSCCAnalysisManager CGAM;
245 ModuleAnalysisManager MAM;
246
247 // Register the AA manager first so that our version is the one used.
248 FAM.registerPass([&] { return std::move(AA); });
249
250 // Register all the basic analyses with the managers.
251 PB.registerModuleAnalyses(MAM);
252 PB.registerCGSCCAnalyses(CGAM);
253 PB.registerFunctionAnalyses(FAM);
254 PB.registerLoopAnalyses(LAM);
255 PB.crossRegisterProxies(LAM, FAM, CGAM, MAM);
256
257 ModulePassManager MPM;
258
259 // Always verify the input.
260 MPM.addPass(VerifierPass());
261
262 // Now, add all the passes we've been requested to.
263 if (auto Err = PB.parsePassPipeline(MPM, PipelineDesc))
264 report_fatal_error("unable to parse pass pipeline description '" +
265 PipelineDesc + "': " + toString(std::move(Err)));
266
267 if (!DisableVerify)
268 MPM.addPass(VerifierPass());
269 MPM.run(Mod, MAM);
270 }
271
runOldPMPasses(const Config & Conf,Module & Mod,TargetMachine * TM,bool IsThinLTO,ModuleSummaryIndex * ExportSummary,const ModuleSummaryIndex * ImportSummary)272 static void runOldPMPasses(const Config &Conf, Module &Mod, TargetMachine *TM,
273 bool IsThinLTO, ModuleSummaryIndex *ExportSummary,
274 const ModuleSummaryIndex *ImportSummary) {
275 legacy::PassManager passes;
276 passes.add(createTargetTransformInfoWrapperPass(TM->getTargetIRAnalysis()));
277
278 PassManagerBuilder PMB;
279 PMB.LibraryInfo = new TargetLibraryInfoImpl(Triple(TM->getTargetTriple()));
280 PMB.Inliner = createFunctionInliningPass();
281 PMB.ExportSummary = ExportSummary;
282 PMB.ImportSummary = ImportSummary;
283 // Unconditionally verify input since it is not verified before this
284 // point and has unknown origin.
285 PMB.VerifyInput = true;
286 PMB.VerifyOutput = !Conf.DisableVerify;
287 PMB.LoopVectorize = true;
288 PMB.SLPVectorize = true;
289 PMB.OptLevel = Conf.OptLevel;
290 PMB.PGOSampleUse = Conf.SampleProfile;
291 PMB.EnablePGOCSInstrGen = Conf.RunCSIRInstr;
292 if (!Conf.RunCSIRInstr && !Conf.CSIRProfile.empty()) {
293 PMB.EnablePGOCSInstrUse = true;
294 PMB.PGOInstrUse = Conf.CSIRProfile;
295 }
296 if (IsThinLTO)
297 PMB.populateThinLTOPassManager(passes);
298 else
299 PMB.populateLTOPassManager(passes);
300 passes.run(Mod);
301 }
302
opt(const Config & Conf,TargetMachine * TM,unsigned Task,Module & Mod,bool IsThinLTO,ModuleSummaryIndex * ExportSummary,const ModuleSummaryIndex * ImportSummary)303 bool opt(const Config &Conf, TargetMachine *TM, unsigned Task, Module &Mod,
304 bool IsThinLTO, ModuleSummaryIndex *ExportSummary,
305 const ModuleSummaryIndex *ImportSummary) {
306 // FIXME: Plumb the combined index into the new pass manager.
307 if (!Conf.OptPipeline.empty())
308 runNewPMCustomPasses(Mod, TM, Conf.OptPipeline, Conf.AAPipeline,
309 Conf.DisableVerify);
310 else if (Conf.UseNewPM)
311 runNewPMPasses(Conf, Mod, TM, Conf.OptLevel, IsThinLTO, ExportSummary,
312 ImportSummary);
313 else
314 runOldPMPasses(Conf, Mod, TM, IsThinLTO, ExportSummary, ImportSummary);
315 return !Conf.PostOptModuleHook || Conf.PostOptModuleHook(Task, Mod);
316 }
317
318 static cl::opt<bool> EmbedBitcode(
319 "lto-embed-bitcode", cl::init(false),
320 cl::desc("Embed LLVM bitcode in object files produced by LTO"));
321
EmitBitcodeSection(Module & M,const Config & Conf)322 static void EmitBitcodeSection(Module &M, const Config &Conf) {
323 if (!EmbedBitcode)
324 return;
325 SmallVector<char, 0> Buffer;
326 raw_svector_ostream OS(Buffer);
327 WriteBitcodeToFile(M, OS);
328
329 std::unique_ptr<MemoryBuffer> Buf(
330 new SmallVectorMemoryBuffer(std::move(Buffer)));
331 llvm::EmbedBitcodeInModule(M, Buf->getMemBufferRef(), /*EmbedBitcode*/ true,
332 /*EmbedMarker*/ false, /*CmdArgs*/ nullptr);
333 }
334
codegen(const Config & Conf,TargetMachine * TM,AddStreamFn AddStream,unsigned Task,Module & Mod)335 void codegen(const Config &Conf, TargetMachine *TM, AddStreamFn AddStream,
336 unsigned Task, Module &Mod) {
337 if (Conf.PreCodeGenModuleHook && !Conf.PreCodeGenModuleHook(Task, Mod))
338 return;
339
340 EmitBitcodeSection(Mod, Conf);
341
342 std::unique_ptr<ToolOutputFile> DwoOut;
343 SmallString<1024> DwoFile(Conf.SplitDwarfOutput);
344 if (!Conf.DwoDir.empty()) {
345 std::error_code EC;
346 if (auto EC = llvm::sys::fs::create_directories(Conf.DwoDir))
347 report_fatal_error("Failed to create directory " + Conf.DwoDir + ": " +
348 EC.message());
349
350 DwoFile = Conf.DwoDir;
351 sys::path::append(DwoFile, std::to_string(Task) + ".dwo");
352 TM->Options.MCOptions.SplitDwarfFile = DwoFile.str().str();
353 } else
354 TM->Options.MCOptions.SplitDwarfFile = Conf.SplitDwarfFile;
355
356 if (!DwoFile.empty()) {
357 std::error_code EC;
358 DwoOut = std::make_unique<ToolOutputFile>(DwoFile, EC, sys::fs::OF_None);
359 if (EC)
360 report_fatal_error("Failed to open " + DwoFile + ": " + EC.message());
361 }
362
363 auto Stream = AddStream(Task);
364 legacy::PassManager CodeGenPasses;
365 if (TM->addPassesToEmitFile(CodeGenPasses, *Stream->OS,
366 DwoOut ? &DwoOut->os() : nullptr,
367 Conf.CGFileType))
368 report_fatal_error("Failed to setup codegen");
369 CodeGenPasses.run(Mod);
370
371 if (DwoOut)
372 DwoOut->keep();
373 }
374
splitCodeGen(const Config & C,TargetMachine * TM,AddStreamFn AddStream,unsigned ParallelCodeGenParallelismLevel,std::unique_ptr<Module> Mod)375 void splitCodeGen(const Config &C, TargetMachine *TM, AddStreamFn AddStream,
376 unsigned ParallelCodeGenParallelismLevel,
377 std::unique_ptr<Module> Mod) {
378 ThreadPool CodegenThreadPool(ParallelCodeGenParallelismLevel);
379 unsigned ThreadCount = 0;
380 const Target *T = &TM->getTarget();
381
382 SplitModule(
383 std::move(Mod), ParallelCodeGenParallelismLevel,
384 [&](std::unique_ptr<Module> MPart) {
385 // We want to clone the module in a new context to multi-thread the
386 // codegen. We do it by serializing partition modules to bitcode
387 // (while still on the main thread, in order to avoid data races) and
388 // spinning up new threads which deserialize the partitions into
389 // separate contexts.
390 // FIXME: Provide a more direct way to do this in LLVM.
391 SmallString<0> BC;
392 raw_svector_ostream BCOS(BC);
393 WriteBitcodeToFile(*MPart, BCOS);
394
395 // Enqueue the task
396 CodegenThreadPool.async(
397 [&](const SmallString<0> &BC, unsigned ThreadId) {
398 LTOLLVMContext Ctx(C);
399 Expected<std::unique_ptr<Module>> MOrErr = parseBitcodeFile(
400 MemoryBufferRef(StringRef(BC.data(), BC.size()), "ld-temp.o"),
401 Ctx);
402 if (!MOrErr)
403 report_fatal_error("Failed to read bitcode");
404 std::unique_ptr<Module> MPartInCtx = std::move(MOrErr.get());
405
406 std::unique_ptr<TargetMachine> TM =
407 createTargetMachine(C, T, *MPartInCtx);
408
409 codegen(C, TM.get(), AddStream, ThreadId, *MPartInCtx);
410 },
411 // Pass BC using std::move to ensure that it get moved rather than
412 // copied into the thread's context.
413 std::move(BC), ThreadCount++);
414 },
415 false);
416
417 // Because the inner lambda (which runs in a worker thread) captures our local
418 // variables, we need to wait for the worker threads to terminate before we
419 // can leave the function scope.
420 CodegenThreadPool.wait();
421 }
422
initAndLookupTarget(const Config & C,Module & Mod)423 Expected<const Target *> initAndLookupTarget(const Config &C, Module &Mod) {
424 if (!C.OverrideTriple.empty())
425 Mod.setTargetTriple(C.OverrideTriple);
426 else if (Mod.getTargetTriple().empty())
427 Mod.setTargetTriple(C.DefaultTriple);
428
429 std::string Msg;
430 const Target *T = TargetRegistry::lookupTarget(Mod.getTargetTriple(), Msg);
431 if (!T)
432 return make_error<StringError>(Msg, inconvertibleErrorCode());
433 return T;
434 }
435 }
436
437 static Error
finalizeOptimizationRemarks(std::unique_ptr<ToolOutputFile> DiagOutputFile)438 finalizeOptimizationRemarks(std::unique_ptr<ToolOutputFile> DiagOutputFile) {
439 // Make sure we flush the diagnostic remarks file in case the linker doesn't
440 // call the global destructors before exiting.
441 if (!DiagOutputFile)
442 return Error::success();
443 DiagOutputFile->keep();
444 DiagOutputFile->os().flush();
445 return Error::success();
446 }
447
backend(const Config & C,AddStreamFn AddStream,unsigned ParallelCodeGenParallelismLevel,std::unique_ptr<Module> Mod,ModuleSummaryIndex & CombinedIndex)448 Error lto::backend(const Config &C, AddStreamFn AddStream,
449 unsigned ParallelCodeGenParallelismLevel,
450 std::unique_ptr<Module> Mod,
451 ModuleSummaryIndex &CombinedIndex) {
452 Expected<const Target *> TOrErr = initAndLookupTarget(C, *Mod);
453 if (!TOrErr)
454 return TOrErr.takeError();
455
456 std::unique_ptr<TargetMachine> TM = createTargetMachine(C, *TOrErr, *Mod);
457
458 // Setup optimization remarks.
459 auto DiagFileOrErr = lto::setupOptimizationRemarks(
460 Mod->getContext(), C.RemarksFilename, C.RemarksPasses, C.RemarksFormat,
461 C.RemarksWithHotness);
462 if (!DiagFileOrErr)
463 return DiagFileOrErr.takeError();
464 auto DiagnosticOutputFile = std::move(*DiagFileOrErr);
465
466 if (!C.CodeGenOnly) {
467 if (!opt(C, TM.get(), 0, *Mod, /*IsThinLTO=*/false,
468 /*ExportSummary=*/&CombinedIndex, /*ImportSummary=*/nullptr))
469 return finalizeOptimizationRemarks(std::move(DiagnosticOutputFile));
470 }
471
472 if (ParallelCodeGenParallelismLevel == 1) {
473 codegen(C, TM.get(), AddStream, 0, *Mod);
474 } else {
475 splitCodeGen(C, TM.get(), AddStream, ParallelCodeGenParallelismLevel,
476 std::move(Mod));
477 }
478 return finalizeOptimizationRemarks(std::move(DiagnosticOutputFile));
479 }
480
dropDeadSymbols(Module & Mod,const GVSummaryMapTy & DefinedGlobals,const ModuleSummaryIndex & Index)481 static void dropDeadSymbols(Module &Mod, const GVSummaryMapTy &DefinedGlobals,
482 const ModuleSummaryIndex &Index) {
483 std::vector<GlobalValue*> DeadGVs;
484 for (auto &GV : Mod.global_values())
485 if (GlobalValueSummary *GVS = DefinedGlobals.lookup(GV.getGUID()))
486 if (!Index.isGlobalValueLive(GVS)) {
487 DeadGVs.push_back(&GV);
488 convertToDeclaration(GV);
489 }
490
491 // Now that all dead bodies have been dropped, delete the actual objects
492 // themselves when possible.
493 for (GlobalValue *GV : DeadGVs) {
494 GV->removeDeadConstantUsers();
495 // Might reference something defined in native object (i.e. dropped a
496 // non-prevailing IR def, but we need to keep the declaration).
497 if (GV->use_empty())
498 GV->eraseFromParent();
499 }
500 }
501
thinBackend(const Config & Conf,unsigned Task,AddStreamFn AddStream,Module & Mod,const ModuleSummaryIndex & CombinedIndex,const FunctionImporter::ImportMapTy & ImportList,const GVSummaryMapTy & DefinedGlobals,MapVector<StringRef,BitcodeModule> & ModuleMap)502 Error lto::thinBackend(const Config &Conf, unsigned Task, AddStreamFn AddStream,
503 Module &Mod, const ModuleSummaryIndex &CombinedIndex,
504 const FunctionImporter::ImportMapTy &ImportList,
505 const GVSummaryMapTy &DefinedGlobals,
506 MapVector<StringRef, BitcodeModule> &ModuleMap) {
507 Expected<const Target *> TOrErr = initAndLookupTarget(Conf, Mod);
508 if (!TOrErr)
509 return TOrErr.takeError();
510
511 std::unique_ptr<TargetMachine> TM = createTargetMachine(Conf, *TOrErr, Mod);
512
513 // Setup optimization remarks.
514 auto DiagFileOrErr = lto::setupOptimizationRemarks(
515 Mod.getContext(), Conf.RemarksFilename, Conf.RemarksPasses,
516 Conf.RemarksFormat, Conf.RemarksWithHotness, Task);
517 if (!DiagFileOrErr)
518 return DiagFileOrErr.takeError();
519 auto DiagnosticOutputFile = std::move(*DiagFileOrErr);
520
521 if (Conf.CodeGenOnly) {
522 codegen(Conf, TM.get(), AddStream, Task, Mod);
523 return finalizeOptimizationRemarks(std::move(DiagnosticOutputFile));
524 }
525
526 if (Conf.PreOptModuleHook && !Conf.PreOptModuleHook(Task, Mod))
527 return finalizeOptimizationRemarks(std::move(DiagnosticOutputFile));
528
529 renameModuleForThinLTO(Mod, CombinedIndex);
530
531 dropDeadSymbols(Mod, DefinedGlobals, CombinedIndex);
532
533 thinLTOResolvePrevailingInModule(Mod, DefinedGlobals);
534
535 if (Conf.PostPromoteModuleHook && !Conf.PostPromoteModuleHook(Task, Mod))
536 return finalizeOptimizationRemarks(std::move(DiagnosticOutputFile));
537
538 if (!DefinedGlobals.empty())
539 thinLTOInternalizeModule(Mod, DefinedGlobals);
540
541 if (Conf.PostInternalizeModuleHook &&
542 !Conf.PostInternalizeModuleHook(Task, Mod))
543 return finalizeOptimizationRemarks(std::move(DiagnosticOutputFile));
544
545 auto ModuleLoader = [&](StringRef Identifier) {
546 assert(Mod.getContext().isODRUniquingDebugTypes() &&
547 "ODR Type uniquing should be enabled on the context");
548 auto I = ModuleMap.find(Identifier);
549 assert(I != ModuleMap.end());
550 return I->second.getLazyModule(Mod.getContext(),
551 /*ShouldLazyLoadMetadata=*/true,
552 /*IsImporting*/ true);
553 };
554
555 FunctionImporter Importer(CombinedIndex, ModuleLoader);
556 if (Error Err = Importer.importFunctions(Mod, ImportList).takeError())
557 return Err;
558
559 if (Conf.PostImportModuleHook && !Conf.PostImportModuleHook(Task, Mod))
560 return finalizeOptimizationRemarks(std::move(DiagnosticOutputFile));
561
562 if (!opt(Conf, TM.get(), Task, Mod, /*IsThinLTO=*/true,
563 /*ExportSummary=*/nullptr, /*ImportSummary=*/&CombinedIndex))
564 return finalizeOptimizationRemarks(std::move(DiagnosticOutputFile));
565
566 codegen(Conf, TM.get(), AddStream, Task, Mod);
567 return finalizeOptimizationRemarks(std::move(DiagnosticOutputFile));
568 }
569