From 45ee0a9afc6282000e06fa1edb89fe2159a7b34e Mon Sep 17 00:00:00 2001 From: Scott Linder Date: Wed, 15 Feb 2023 17:12:47 +0000 Subject: [PATCH] [LLD] Add --lto-CGO[0-3] option Allow controlling the CodeGenOpt::Level independent of the LTO optimization level in LLD via new options for the COFF, ELF, MachO, and wasm frontends to lld. Most are spelled as --lto-CGO[0-3], but COFF is spelled as -opt:lldltocgo=[0-3]. See D57422 for discussion surrounding the issue of how to set the CG opt level. The ultimate goal is to let each function control its CG opt level, but until then the current default means it is impossible to specify a CG opt level lower than 2 while using LTO. This option gives the user a means to control it for as long as it is not handled on a per-function basis. Reviewed By: MaskRay, #lld-macho, int3 Differential Revision: https://reviews.llvm.org/D141970 --- lld/COFF/Config.h | 2 ++ lld/COFF/Driver.cpp | 4 ++++ lld/COFF/LTO.cpp | 5 ++++- lld/Common/Args.cpp | 7 ++----- lld/ELF/Config.h | 1 + lld/ELF/Driver.cpp | 10 ++++++++-- lld/ELF/LTO.cpp | 2 +- lld/ELF/Options.td | 2 ++ lld/MachO/Config.h | 5 +++++ lld/MachO/Driver.cpp | 14 +++++++++++--- lld/MachO/LTO.cpp | 2 +- lld/MachO/Options.td | 4 ++++ lld/include/lld/Common/Args.h | 2 +- lld/test/COFF/lto-cgo.ll | 28 ++++++++++++++++++++++++++++ lld/test/ELF/lto/cgo.ll | 28 ++++++++++++++++++++++++++++ lld/test/MachO/lto-cgo.ll | 28 ++++++++++++++++++++++++++++ lld/test/wasm/lto/cgo.ll | 28 ++++++++++++++++++++++++++++ lld/wasm/Config.h | 5 +++++ lld/wasm/Driver.cpp | 10 ++++++++-- lld/wasm/LTO.cpp | 2 +- lld/wasm/Options.td | 2 ++ 21 files changed, 174 insertions(+), 17 deletions(-) create mode 100644 lld/test/COFF/lto-cgo.ll create mode 100644 lld/test/ELF/lto/cgo.ll create mode 100644 lld/test/MachO/lto-cgo.ll create mode 100644 lld/test/wasm/lto/cgo.ll diff --git a/lld/COFF/Config.h b/lld/COFF/Config.h index 4711573a5b76..1c35acf25ed6 100644 --- a/lld/COFF/Config.h +++ b/lld/COFF/Config.h @@ -162,6 +162,8 @@ struct Configuration { // Used for /opt:lldlto=N unsigned ltoo = 2; + // Used for /opt:lldltocgo=N + std::optional ltoCgo; // Used for /opt:lldltojobs=N std::string thinLTOJobs; diff --git a/lld/COFF/Driver.cpp b/lld/COFF/Driver.cpp index 464cb825d4e4..e0fc29879abe 100644 --- a/lld/COFF/Driver.cpp +++ b/lld/COFF/Driver.cpp @@ -1768,6 +1768,10 @@ void LinkerDriver::linkerMain(ArrayRef argsArr) { } else if (s.consume_front("lldlto=")) { if (s.getAsInteger(10, config->ltoo) || config->ltoo > 3) error("/opt:lldlto: invalid optimization level: " + s); + } else if (s.consume_front("lldltocgo=")) { + config->ltoCgo.emplace(); + if (s.getAsInteger(10, *config->ltoCgo) || *config->ltoCgo > 3) + error("/opt:lldltocgo: invalid codegen optimization level: " + s); } else if (s.consume_front("lldltojobs=")) { if (!get_threadpool_strategy(s)) error("/opt:lldltojobs: invalid job count: " + s); diff --git a/lld/COFF/LTO.cpp b/lld/COFF/LTO.cpp index b5643b885972..cfb964b6aa3b 100644 --- a/lld/COFF/LTO.cpp +++ b/lld/COFF/LTO.cpp @@ -88,7 +88,10 @@ lto::Config BitcodeCompiler::createConfig() { c.OptLevel = ctx.config.ltoo; c.CPU = getCPUStr(); c.MAttrs = getMAttrs(); - c.CGOptLevel = args::getCGOptLevel(ctx.config.ltoo); + std::optional optLevelOrNone = CodeGenOpt::getLevel( + ctx.config.ltoCgo.value_or(args::getCGOptLevel(ctx.config.ltoo))); + assert(optLevelOrNone && "Invalid optimization level!"); + c.CGOptLevel = *optLevelOrNone; c.AlwaysEmitRegularLTOObj = !ctx.config.ltoObjPath.empty(); c.DebugPassManager = ctx.config.ltoDebugPassManager; c.CSIRProfile = std::string(ctx.config.ltoCSProfileFile); diff --git a/lld/Common/Args.cpp b/lld/Common/Args.cpp index 388c15b3db3e..b6d050bb1f77 100644 --- a/lld/Common/Args.cpp +++ b/lld/Common/Args.cpp @@ -19,11 +19,8 @@ using namespace lld; // TODO(sbc): Remove this once CGOptLevel can be set completely based on bitcode // function metadata. -CodeGenOpt::Level lld::args::getCGOptLevel(int optLevelLTO) { - if (optLevelLTO == 3) - return CodeGenOpt::Aggressive; - assert(optLevelLTO < 3); - return CodeGenOpt::Default; +int lld::args::getCGOptLevel(int optLevelLTO) { + return std::clamp(optLevelLTO, 2, 3); } static int64_t getInteger(opt::InputArgList &args, unsigned key, diff --git a/lld/ELF/Config.h b/lld/ELF/Config.h index 66aa6656fe4e..61faea4e9bce 100644 --- a/lld/ELF/Config.h +++ b/lld/ELF/Config.h @@ -317,6 +317,7 @@ struct Config { uint64_t zStackSize; unsigned ltoPartitions; unsigned ltoo; + llvm::CodeGenOpt::Level ltoCgo; unsigned optimize; StringRef thinLTOJobs; unsigned timeTraceGranularity; diff --git a/lld/ELF/Driver.cpp b/lld/ELF/Driver.cpp index fe403962a385..93caf755196f 100644 --- a/lld/ELF/Driver.cpp +++ b/lld/ELF/Driver.cpp @@ -1139,6 +1139,14 @@ static void readConfigs(opt::InputArgList &args) { args.hasFlag(OPT_lto_whole_program_visibility, OPT_no_lto_whole_program_visibility, false); config->ltoo = args::getInteger(args, OPT_lto_O, 2); + if (config->ltoo > 3) + error("invalid optimization level for LTO: " + Twine(config->ltoo)); + unsigned ltoCgo = + args::getInteger(args, OPT_lto_CGO, args::getCGOptLevel(config->ltoo)); + if (auto level = CodeGenOpt::getLevel(ltoCgo)) + config->ltoCgo = *level; + else + error("invalid codegen optimization level for LTO: " + Twine(ltoCgo)); config->ltoObjPath = args.getLastArgValue(OPT_lto_obj_path_eq); config->ltoPartitions = args::getInteger(args, OPT_lto_partitions, 1); config->ltoSampleProfile = args.getLastArgValue(OPT_lto_sample_profile); @@ -1395,8 +1403,6 @@ static void readConfigs(opt::InputArgList &args) { config->thinLTOJobs = arg->getValue(); config->threadCount = parallel::strategy.compute_thread_count(); - if (config->ltoo > 3) - error("invalid optimization level for LTO: " + Twine(config->ltoo)); if (config->ltoPartitions == 0) error("--lto-partitions: number of threads must be > 0"); if (!get_threadpool_strategy(config->thinLTOJobs)) diff --git a/lld/ELF/LTO.cpp b/lld/ELF/LTO.cpp index 23777aeca92b..b51810dc91d7 100644 --- a/lld/ELF/LTO.cpp +++ b/lld/ELF/LTO.cpp @@ -127,7 +127,7 @@ static lto::Config createConfig() { c.OptLevel = config->ltoo; c.CPU = getCPUStr(); c.MAttrs = getMAttrs(); - c.CGOptLevel = args::getCGOptLevel(config->ltoo); + c.CGOptLevel = config->ltoCgo; c.PTO.LoopVectorization = c.OptLevel > 1; c.PTO.SLPVectorization = c.OptLevel > 1; diff --git a/lld/ELF/Options.td b/lld/ELF/Options.td index 8783bbc2fdab..87d84246ac45 100644 --- a/lld/ELF/Options.td +++ b/lld/ELF/Options.td @@ -558,6 +558,8 @@ def lto_newpm_passes: JJ<"lto-newpm-passes=">, HelpText<"Passes to run during LTO">; def lto_O: JJ<"lto-O">, MetaVarName<"">, HelpText<"Optimization level for LTO">; +def lto_CGO: JJ<"lto-CGO">, MetaVarName<"">, + HelpText<"Codegen optimization level for LTO">; def lto_partitions: JJ<"lto-partitions=">, HelpText<"Number of LTO codegen partitions">; def lto_cs_profile_generate: FF<"lto-cs-profile-generate">, diff --git a/lld/MachO/Config.h b/lld/MachO/Config.h index 220fb99d2e22..af46303f1ae2 100644 --- a/lld/MachO/Config.h +++ b/lld/MachO/Config.h @@ -26,6 +26,10 @@ #include +namespace llvm::CodeGenOpt { +enum Level : int; +} // namespace llvm::CodeGenOpt + namespace lld { namespace macho { @@ -165,6 +169,7 @@ struct Configuration { llvm::StringRef thinLTOJobs; llvm::StringRef umbrella; uint32_t ltoo = 2; + llvm::CodeGenOpt::Level ltoCgo; llvm::CachePruningPolicy thinLTOCachePolicy; llvm::StringRef thinLTOCacheDir; llvm::StringRef thinLTOIndexOnlyArg; diff --git a/lld/MachO/Driver.cpp b/lld/MachO/Driver.cpp index 65fea8958946..121fa851041c 100644 --- a/lld/MachO/Driver.cpp +++ b/lld/MachO/Driver.cpp @@ -1421,6 +1421,17 @@ bool macho::link(ArrayRef argsArr, llvm::raw_ostream &stdoutOS, target = createTargetInfo(args); depTracker = std::make_unique( args.getLastArgValue(OPT_dependency_info)); + + config->ltoo = args::getInteger(args, OPT_lto_O, 2); + if (config->ltoo > 3) + error("--lto-O: invalid optimization level: " + Twine(config->ltoo)); + unsigned ltoCgo = + args::getInteger(args, OPT_lto_CGO, args::getCGOptLevel(config->ltoo)); + if (auto level = CodeGenOpt::getLevel(ltoCgo)) + config->ltoCgo = *level; + else + error("--lto-CGO: invalid codegen optimization level: " + Twine(ltoCgo)); + if (errorCount()) return false; @@ -1558,9 +1569,6 @@ bool macho::link(ArrayRef argsArr, llvm::raw_ostream &stdoutOS, config->umbrella = arg->getValue(); } config->ltoObjPath = args.getLastArgValue(OPT_object_path_lto); - config->ltoo = args::getInteger(args, OPT_lto_O, 2); - if (config->ltoo > 3) - error("--lto-O: invalid optimization level: " + Twine(config->ltoo)); config->thinLTOCacheDir = args.getLastArgValue(OPT_cache_path_lto); config->thinLTOCachePolicy = getLTOCachePolicy(args); config->thinLTOEmitImportsFiles = args.hasArg(OPT_thinlto_emit_imports_files); diff --git a/lld/MachO/LTO.cpp b/lld/MachO/LTO.cpp index 2f5e9d06f396..6e3d4f3c230f 100644 --- a/lld/MachO/LTO.cpp +++ b/lld/MachO/LTO.cpp @@ -70,7 +70,7 @@ static lto::Config createConfig() { c.TimeTraceEnabled = config->timeTraceEnabled; c.TimeTraceGranularity = config->timeTraceGranularity; c.OptLevel = config->ltoo; - c.CGOptLevel = args::getCGOptLevel(config->ltoo); + c.CGOptLevel = config->ltoCgo; if (config->saveTemps) checkError(c.addSaveTemps(config->outputFile.str() + ".", /*UseInputModulePath=*/true)); diff --git a/lld/MachO/Options.td b/lld/MachO/Options.td index cb66f6277b5b..80a12f256b4b 100644 --- a/lld/MachO/Options.td +++ b/lld/MachO/Options.td @@ -84,6 +84,10 @@ def lto_O: Joined<["--"], "lto-O">, HelpText<"Set optimization level for LTO (default: 2)">, MetaVarName<"">, Group; +def lto_CGO: Joined<["--"], "lto-CGO">, + HelpText<"Set codegen optimization level for LTO (default: 2)">, + MetaVarName<"">, + Group; def thinlto_cache_policy_eq: Joined<["--"], "thinlto-cache-policy=">, HelpText<"Pruning policy for the ThinLTO cache">, Group; diff --git a/lld/include/lld/Common/Args.h b/lld/include/lld/Common/Args.h index 40c8ee4e9d0e..60f83fbbbf1a 100644 --- a/lld/include/lld/Common/Args.h +++ b/lld/include/lld/Common/Args.h @@ -23,7 +23,7 @@ class InputArgList; namespace lld { namespace args { -llvm::CodeGenOpt::Level getCGOptLevel(int optLevelLTO); +int getCGOptLevel(int optLevelLTO); int64_t getInteger(llvm::opt::InputArgList &args, unsigned key, int64_t Default); diff --git a/lld/test/COFF/lto-cgo.ll b/lld/test/COFF/lto-cgo.ll new file mode 100644 index 000000000000..6f45eab4880c --- /dev/null +++ b/lld/test/COFF/lto-cgo.ll @@ -0,0 +1,28 @@ +; REQUIRES: x86 + +; RUN: llvm-as %s -o %t.obj +; RUN: lld-link -opt:lldlto=0 %t.obj -dll -noentry -out:%t.dll -mllvm:-debug-pass=Structure 2>&1 | FileCheck --check-prefix=OPT %s +; RUN: lld-link -opt:lldltocgo=0 %t.obj -dll -noentry -out:%t.dll -mllvm:-debug-pass=Structure 2>&1 | FileCheck --check-prefix=NOOPT %s +; RUN: lld-link -opt:lldlto=3 %t.obj -dll -noentry -out:%t.dll -mllvm:-debug-pass=Structure 2>&1 | FileCheck --check-prefix=OPT %s +; RUN: lld-link -opt:lldltocgo=3 %t.obj -dll -noentry -out:%t.dll -mllvm:-debug-pass=Structure 2>&1 | FileCheck --check-prefix=OPT %s +; RUN: lld-link -opt:lldlto=0 -opt:lldltocgo=0 %t.obj -dll -noentry -out:%t.dll -mllvm:-debug-pass=Structure 2>&1 | FileCheck --check-prefix=NOOPT %s +; RUN: lld-link -opt:lldlto=3 -opt:lldltocgo=0 %t.obj -dll -noentry -out:%t.dll -mllvm:-debug-pass=Structure 2>&1 | FileCheck --check-prefix=NOOPT %s +; RUN: lld-link -opt:lldlto=0 -opt:lldltocgo=3 %t.obj -dll -noentry -out:%t.dll -mllvm:-debug-pass=Structure 2>&1 | FileCheck --check-prefix=OPT %s +; RUN: lld-link -opt:lldlto=3 -opt:lldltocgo=3 %t.obj -dll -noentry -out:%t.dll -mllvm:-debug-pass=Structure 2>&1 | FileCheck --check-prefix=OPT %s +; RUN: lld-link -opt:lldlto=0 -opt:lldltocgo=0 -opt:lldltocgo=2 %t.obj -dll -noentry -out:%t.dll -mllvm:-debug-pass=Structure 2>&1 | FileCheck --check-prefix=OPT %s +; RUN: not lld-link -opt:lldlto=4 %t.obj -dll -noentry -out:%t.dll -mllvm:-debug-pass=Structure 2>&1 | FileCheck --check-prefix=ERROR-O4 %s +; RUN: not lld-link -opt:lldltocgo=4 %t.obj -dll -noentry -out:%t.dll -mllvm:-debug-pass=Structure 2>&1 | FileCheck --check-prefix=ERROR-CGO4 %s +; RUN: not lld-link -opt:lldlto=4 -opt:lldltocgo=4 %t.obj -dll -noentry -out:%t.dll -mllvm:-debug-pass=Structure 2>&1 | FileCheck --check-prefixes=ERROR-O4,ERROR-CGO4 %s + +; NOOPT: Fast Register Allocator +; OPT: Greedy Register Allocator +; ERROR-O4: lld-link: error: /opt:lldlto: invalid optimization level: 4 +; ERROR-CGO4: lld-link: error: /opt:lldltocgo: invalid codegen optimization level: 4 + +target datalayout = "e-m:w-p270:32:32-p271:32:32-p272:64:64-i64:64-f80:128-n8:16:32:64-S128" +target triple = "x86_64-pc-windows-msvc" + +define void @_start() { +entry: + ret void +} diff --git a/lld/test/ELF/lto/cgo.ll b/lld/test/ELF/lto/cgo.ll new file mode 100644 index 000000000000..1ff15864b78e --- /dev/null +++ b/lld/test/ELF/lto/cgo.ll @@ -0,0 +1,28 @@ +; REQUIRES: x86 + +; RUN: llvm-as %s -o %t.o +; RUN: ld.lld --lto-O0 %t.o -o %t -mllvm -debug-pass=Structure 2>&1 | FileCheck --check-prefix=OPT %s +; RUN: ld.lld --lto-CGO0 %t.o -o %t -mllvm -debug-pass=Structure 2>&1 | FileCheck --check-prefix=NOOPT %s +; RUN: ld.lld --lto-O3 %t.o -o %t -mllvm -debug-pass=Structure 2>&1 | FileCheck --check-prefix=OPT %s +; RUN: ld.lld --lto-CGO3 %t.o -o %t -mllvm -debug-pass=Structure 2>&1 | FileCheck --check-prefix=OPT %s +; RUN: ld.lld --lto-O0 --lto-CGO0 %t.o -o %t -mllvm -debug-pass=Structure 2>&1 | FileCheck --check-prefix=NOOPT %s +; RUN: ld.lld --lto-O3 --lto-CGO0 %t.o -o %t -mllvm -debug-pass=Structure 2>&1 | FileCheck --check-prefix=NOOPT %s +; RUN: ld.lld --lto-O0 --lto-CGO3 %t.o -o %t -mllvm -debug-pass=Structure 2>&1 | FileCheck --check-prefix=OPT %s +; RUN: ld.lld --lto-O3 --lto-CGO3 %t.o -o %t -mllvm -debug-pass=Structure 2>&1 | FileCheck --check-prefix=OPT %s +; RUN: ld.lld --lto-O0 --lto-CGO0 --lto-CGO2 %t.o -o %t -mllvm -debug-pass=Structure 2>&1 | FileCheck --check-prefix=OPT %s +; RUN: not ld.lld --lto-O4 %t.o -o %t -mllvm -debug-pass=Structure 2>&1 | FileCheck --check-prefix=ERROR-O4 %s +; RUN: not ld.lld --lto-CGO4 %t.o -o %t -mllvm -debug-pass=Structure 2>&1 | FileCheck --check-prefix=ERROR-CGO4 %s +; RUN: not ld.lld --lto-O4 --lto-CGO4 %t.o -o %t -mllvm -debug-pass=Structure 2>&1 | FileCheck --check-prefixes=ERROR-O4,ERROR-CGO4 %s + +; NOOPT: Fast Register Allocator +; OPT: Greedy Register Allocator +; ERROR-O4: ld.lld: error: invalid optimization level for LTO: 4 +; ERROR-CGO4: ld.lld: error: invalid codegen optimization level for LTO: 4 + +target triple = "x86_64-unknown-linux-gnu" +target datalayout = "e-m:e-p270:32:32-p271:32:32-p272:64:64-i64:64-f80:128-n8:16:32:64-S128" + +define void @_start() { +entry: + ret void +} diff --git a/lld/test/MachO/lto-cgo.ll b/lld/test/MachO/lto-cgo.ll new file mode 100644 index 000000000000..b19d607e17e0 --- /dev/null +++ b/lld/test/MachO/lto-cgo.ll @@ -0,0 +1,28 @@ +; REQUIRES: x86 + +; RUN: llvm-as %s -o %t.o +; RUN: %lld -dylib --lto-O0 %t.o -o %t -mllvm -debug-pass=Structure 2>&1 | FileCheck --check-prefix=OPT %s +; RUN: %lld -dylib --lto-CGO0 %t.o -o %t -mllvm -debug-pass=Structure 2>&1 | FileCheck --check-prefix=NOOPT %s +; RUN: %lld -dylib --lto-O3 %t.o -o %t -mllvm -debug-pass=Structure 2>&1 | FileCheck --check-prefix=OPT %s +; RUN: %lld -dylib --lto-CGO3 %t.o -o %t -mllvm -debug-pass=Structure 2>&1 | FileCheck --check-prefix=OPT %s +; RUN: %lld -dylib --lto-O0 --lto-CGO0 %t.o -o %t -mllvm -debug-pass=Structure 2>&1 | FileCheck --check-prefix=NOOPT %s +; RUN: %lld -dylib --lto-O3 --lto-CGO0 %t.o -o %t -mllvm -debug-pass=Structure 2>&1 | FileCheck --check-prefix=NOOPT %s +; RUN: %lld -dylib --lto-O0 --lto-CGO3 %t.o -o %t -mllvm -debug-pass=Structure 2>&1 | FileCheck --check-prefix=OPT %s +; RUN: %lld -dylib --lto-O3 --lto-CGO3 %t.o -o %t -mllvm -debug-pass=Structure 2>&1 | FileCheck --check-prefix=OPT %s +; RUN: %lld -dylib --lto-O0 --lto-CGO0 --lto-CGO2 %t.o -o %t -mllvm -debug-pass=Structure 2>&1 | FileCheck --check-prefix=OPT %s +; RUN: not %lld -dylib --lto-O4 %t.o -o %t -mllvm -debug-pass=Structure 2>&1 | FileCheck --check-prefix=ERROR-O4 %s +; RUN: not %lld -dylib --lto-CGO4 %t.o -o %t -mllvm -debug-pass=Structure 2>&1 | FileCheck --check-prefix=ERROR-CGO4 %s +; RUN: not %lld -dylib --lto-O4 --lto-CGO4 %t.o -o %t -mllvm -debug-pass=Structure 2>&1 | FileCheck --check-prefixes=ERROR-O4,ERROR-CGO4 %s + +; NOOPT: Fast Register Allocator +; OPT: Greedy Register Allocator +; ERROR-O4: ld64.lld: error: --lto-O: invalid optimization level: 4 +; ERROR-CGO4: ld64.lld: error: --lto-CGO: invalid codegen optimization level: 4 + +target triple = "x86_64-apple-darwin" +target datalayout = "e-m:o-p270:32:32-p271:32:32-p272:64:64-i64:64-f80:128-n8:16:32:64-S128" + +define void @_start() { +entry: + ret void +} diff --git a/lld/test/wasm/lto/cgo.ll b/lld/test/wasm/lto/cgo.ll new file mode 100644 index 000000000000..c37ae6e8bcf3 --- /dev/null +++ b/lld/test/wasm/lto/cgo.ll @@ -0,0 +1,28 @@ +; REQUIRES: x86 + +; RUN: llvm-as %s -o %t.o +; RUN: wasm-ld --lto-O0 %t.o -o %t -mllvm -debug-pass=Structure 2>&1 | FileCheck --check-prefix=OPT %s +; RUN: wasm-ld --lto-CGO0 %t.o -o %t -mllvm -debug-pass=Structure 2>&1 | FileCheck --check-prefix=NOOPT %s +; RUN: wasm-ld --lto-O3 %t.o -o %t -mllvm -debug-pass=Structure 2>&1 | FileCheck --check-prefix=OPT %s +; RUN: wasm-ld --lto-CGO3 %t.o -o %t -mllvm -debug-pass=Structure 2>&1 | FileCheck --check-prefix=OPT %s +; RUN: wasm-ld --lto-O0 --lto-CGO0 %t.o -o %t -mllvm -debug-pass=Structure 2>&1 | FileCheck --check-prefix=NOOPT %s +; RUN: wasm-ld --lto-O3 --lto-CGO0 %t.o -o %t -mllvm -debug-pass=Structure 2>&1 | FileCheck --check-prefix=NOOPT %s +; RUN: wasm-ld --lto-O0 --lto-CGO3 %t.o -o %t -mllvm -debug-pass=Structure 2>&1 | FileCheck --check-prefix=OPT %s +; RUN: wasm-ld --lto-O3 --lto-CGO3 %t.o -o %t -mllvm -debug-pass=Structure 2>&1 | FileCheck --check-prefix=OPT %s +; RUN: wasm-ld --lto-O0 --lto-CGO0 --lto-CGO2 %t.o -o %t -mllvm -debug-pass=Structure 2>&1 | FileCheck --check-prefix=OPT %s +; RUN: not wasm-ld --lto-O4 %t.o -o %t -mllvm -debug-pass=Structure 2>&1 | FileCheck --check-prefix=ERROR-O4 %s +; RUN: not wasm-ld --lto-CGO4 %t.o -o %t -mllvm -debug-pass=Structure 2>&1 | FileCheck --check-prefix=ERROR-CGO4 %s +; RUN: not wasm-ld --lto-O4 --lto-CGO4 %t.o -o %t -mllvm -debug-pass=Structure 2>&1 | FileCheck --check-prefixes=ERROR-O4,ERROR-CGO4 %s + +; NOOPT-NOT: WebAssembly Optimize Returned +; OPT: WebAssembly Optimize Returned +; ERROR-O4: wasm-ld: error: invalid optimization level for LTO: 4 +; ERROR-CGO4: wasm-ld: error: invalid codegen optimization level for LTO: 4 + +target datalayout = "e-m:e-p:32:32-p10:8:8-p20:8:8-i64:64-n32:64-S128" +target triple = "wasm32-unknown-unknown-wasm" + +define void @_start() { +entry: + ret void +} diff --git a/lld/wasm/Config.h b/lld/wasm/Config.h index 858a97860dbe..87217dddcb1e 100644 --- a/lld/wasm/Config.h +++ b/lld/wasm/Config.h @@ -16,6 +16,10 @@ #include "llvm/Support/CachePruning.h" #include +namespace llvm::CodeGenOpt { +enum Level : int; +} // namespace llvm::CodeGenOpt + namespace lld { namespace wasm { @@ -63,6 +67,7 @@ struct Configuration { uint64_t zStackSize; unsigned ltoPartitions; unsigned ltoo; + llvm::CodeGenOpt::Level ltoCgo; unsigned optimize; llvm::StringRef thinLTOJobs; bool ltoDebugPassManager; diff --git a/lld/wasm/Driver.cpp b/lld/wasm/Driver.cpp index e117e632d60f..709fd9923b53 100644 --- a/lld/wasm/Driver.cpp +++ b/lld/wasm/Driver.cpp @@ -424,6 +424,14 @@ static void readConfigs(opt::InputArgList &args) { config->importTable = args.hasArg(OPT_import_table); config->importUndefined = args.hasArg(OPT_import_undefined); config->ltoo = args::getInteger(args, OPT_lto_O, 2); + if (config->ltoo > 3) + error("invalid optimization level for LTO: " + Twine(config->ltoo)); + unsigned ltoCgo = + args::getInteger(args, OPT_lto_CGO, args::getCGOptLevel(config->ltoo)); + if (auto level = CodeGenOpt::getLevel(ltoCgo)) + config->ltoCgo = *level; + else + error("invalid codegen optimization level for LTO: " + Twine(ltoCgo)); config->ltoPartitions = args::getInteger(args, OPT_lto_partitions, 1); config->ltoDebugPassManager = args.hasArg(OPT_lto_debug_pass_manager); config->mapFile = args.getLastArgValue(OPT_Map); @@ -560,8 +568,6 @@ static void checkOptions(opt::InputArgList &args) { error("--compress-relocations is incompatible with output debug" " information. Please pass --strip-debug or --strip-all"); - if (config->ltoo > 3) - error("invalid optimization level for LTO: " + Twine(config->ltoo)); if (config->ltoPartitions == 0) error("--lto-partitions: number of threads must be > 0"); if (!get_threadpool_strategy(config->thinLTOJobs)) diff --git a/lld/wasm/LTO.cpp b/lld/wasm/LTO.cpp index 150e663ce7ee..d5ec3f70a1df 100644 --- a/lld/wasm/LTO.cpp +++ b/lld/wasm/LTO.cpp @@ -51,7 +51,7 @@ static std::unique_ptr createLTO() { c.DiagHandler = diagnosticHandler; c.OptLevel = config->ltoo; c.MAttrs = getMAttrs(); - c.CGOptLevel = args::getCGOptLevel(config->ltoo); + c.CGOptLevel = config->ltoCgo; c.DebugPassManager = config->ltoDebugPassManager; if (config->relocatable) diff --git a/lld/wasm/Options.td b/lld/wasm/Options.td index a47c852148d4..b30ae99e6eb0 100644 --- a/lld/wasm/Options.td +++ b/lld/wasm/Options.td @@ -256,6 +256,8 @@ def: JoinedOrSeparate<["-"], "u">, Alias; // LTO-related options. def lto_O: JJ<"lto-O">, MetaVarName<"">, HelpText<"Optimization level for LTO">; +def lto_CGO: JJ<"lto-CGO">, MetaVarName<"">, + HelpText<"Codegen optimization level for LTO">; def lto_partitions: JJ<"lto-partitions=">, HelpText<"Number of LTO codegen partitions">; def disable_verify: F<"disable-verify">;