Mercurial > hg > CbC > CbC_llvm
diff lld/MachO/Driver.cpp @ 207:2e18cbf3894f
LLVM12
author | Shinji KONO <kono@ie.u-ryukyu.ac.jp> |
---|---|
date | Tue, 08 Jun 2021 06:07:14 +0900 |
parents | 0572611fdcc8 |
children | 5f17cb93ff66 |
line wrap: on
line diff
--- a/lld/MachO/Driver.cpp Mon May 25 11:55:54 2020 +0900 +++ b/lld/MachO/Driver.cpp Tue Jun 08 06:07:14 2021 +0900 @@ -9,10 +9,14 @@ #include "Driver.h" #include "Config.h" #include "InputFiles.h" +#include "LTO.h" +#include "MarkLive.h" +#include "ObjC.h" #include "OutputSection.h" #include "OutputSegment.h" #include "SymbolTable.h" #include "Symbols.h" +#include "SyntheticSections.h" #include "Target.h" #include "Writer.h" @@ -21,92 +25,227 @@ #include "lld/Common/ErrorHandler.h" #include "lld/Common/LLVM.h" #include "lld/Common/Memory.h" +#include "lld/Common/Reproduce.h" #include "lld/Common/Version.h" #include "llvm/ADT/DenseSet.h" #include "llvm/ADT/StringExtras.h" #include "llvm/ADT/StringRef.h" #include "llvm/BinaryFormat/MachO.h" #include "llvm/BinaryFormat/Magic.h" +#include "llvm/Config/llvm-config.h" +#include "llvm/LTO/LTO.h" #include "llvm/Object/Archive.h" #include "llvm/Option/ArgList.h" -#include "llvm/Option/Option.h" +#include "llvm/Support/CommandLine.h" +#include "llvm/Support/FileSystem.h" +#include "llvm/Support/Host.h" #include "llvm/Support/MemoryBuffer.h" +#include "llvm/Support/Parallel.h" #include "llvm/Support/Path.h" +#include "llvm/Support/TarWriter.h" +#include "llvm/Support/TargetSelect.h" +#include "llvm/Support/TimeProfiler.h" +#include "llvm/TextAPI/PackedVersion.h" + +#include <algorithm> using namespace llvm; using namespace llvm::MachO; +using namespace llvm::object; +using namespace llvm::opt; using namespace llvm::sys; using namespace lld; using namespace lld::macho; -Configuration *lld::macho::config; +Configuration *macho::config; +DependencyTracker *macho::depTracker; -// Create prefix string literals used in Options.td -#define PREFIX(NAME, VALUE) const char *NAME[] = VALUE; -#include "Options.inc" -#undef PREFIX +static HeaderFileType getOutputType(const InputArgList &args) { + // TODO: -r, -dylinker, -preload... + Arg *outputArg = args.getLastArg(OPT_bundle, OPT_dylib, OPT_execute); + if (outputArg == nullptr) + return MH_EXECUTE; -// Create table mapping all options defined in Options.td -static const opt::OptTable::Info optInfo[] = { -#define OPTION(X1, X2, ID, KIND, GROUP, ALIAS, X7, X8, X9, X10, X11, X12) \ - {X1, X2, X10, X11, OPT_##ID, opt::Option::KIND##Class, \ - X9, X8, OPT_##GROUP, OPT_##ALIAS, X7, X12}, -#include "Options.inc" -#undef OPTION -}; + switch (outputArg->getOption().getID()) { + case OPT_bundle: + return MH_BUNDLE; + case OPT_dylib: + return MH_DYLIB; + case OPT_execute: + return MH_EXECUTE; + default: + llvm_unreachable("internal error"); + } +} + +static Optional<StringRef> findLibrary(StringRef name) { + if (config->searchDylibsFirst) { + if (Optional<StringRef> path = findPathCombination( + "lib" + name, config->librarySearchPaths, {".tbd", ".dylib"})) + return path; + return findPathCombination("lib" + name, config->librarySearchPaths, + {".a"}); + } + return findPathCombination("lib" + name, config->librarySearchPaths, + {".tbd", ".dylib", ".a"}); +} -MachOOptTable::MachOOptTable() : OptTable(optInfo) {} - -opt::InputArgList MachOOptTable::parse(ArrayRef<const char *> argv) { - // Make InputArgList from string vectors. - unsigned missingIndex; - unsigned missingCount; - SmallVector<const char *, 256> vec(argv.data(), argv.data() + argv.size()); +static Optional<std::string> findFramework(StringRef name) { + SmallString<260> symlink; + StringRef suffix; + std::tie(name, suffix) = name.split(","); + for (StringRef dir : config->frameworkSearchPaths) { + symlink = dir; + path::append(symlink, name + ".framework", name); - opt::InputArgList args = ParseArgs(vec, missingIndex, missingCount); + if (!suffix.empty()) { + // NOTE: we must resolve the symlink before trying the suffixes, because + // there are no symlinks for the suffixed paths. + SmallString<260> location; + if (!fs::real_path(symlink, location)) { + // only append suffix if realpath() succeeds + Twine suffixed = location + suffix; + if (fs::exists(suffixed)) + return suffixed.str(); + } + // Suffix lookup failed, fall through to the no-suffix case. + } - if (missingCount) - error(Twine(args.getArgString(missingIndex)) + ": missing argument"); + if (Optional<std::string> path = resolveDylibPath(symlink)) + return path; + } + return {}; +} - for (opt::Arg *arg : args.filtered(OPT_UNKNOWN)) - error("unknown argument: " + arg->getSpelling()); - return args; +static bool warnIfNotDirectory(StringRef option, StringRef path) { + if (!fs::exists(path)) { + warn("directory not found for option -" + option + path); + return false; + } else if (!fs::is_directory(path)) { + warn("option -" + option + path + " references a non-directory path"); + return false; + } + return true; } -// This is for -lfoo. We'll look for libfoo.dylib from search paths. -static Optional<std::string> findDylib(StringRef name) { - for (StringRef dir : config->searchPaths) { - std::string path = (dir + "/lib" + name + ".dylib").str(); - if (fs::exists(path)) - return path; +static std::vector<StringRef> +getSearchPaths(unsigned optionCode, InputArgList &args, + const std::vector<StringRef> &roots, + const SmallVector<StringRef, 2> &systemPaths) { + std::vector<StringRef> paths; + StringRef optionLetter{optionCode == OPT_F ? "F" : "L"}; + for (StringRef path : args::getStrings(args, optionCode)) { + // NOTE: only absolute paths are re-rooted to syslibroot(s) + bool found = false; + if (path::is_absolute(path, path::Style::posix)) { + for (StringRef root : roots) { + SmallString<261> buffer(root); + path::append(buffer, path); + // Do not warn about paths that are computed via the syslib roots + if (fs::is_directory(buffer)) { + paths.push_back(saver.save(buffer.str())); + found = true; + } + } + } + if (!found && warnIfNotDirectory(optionLetter, path)) + paths.push_back(path); } - error("library not found for -l" + name); - return None; + + // `-Z` suppresses the standard "system" search paths. + if (args.hasArg(OPT_Z)) + return paths; + + for (const StringRef &path : systemPaths) { + for (const StringRef &root : roots) { + SmallString<261> buffer(root); + path::append(buffer, path); + if (fs::is_directory(buffer)) + paths.push_back(saver.save(buffer.str())); + } + } + return paths; +} + +static std::vector<StringRef> getSystemLibraryRoots(InputArgList &args) { + std::vector<StringRef> roots; + for (const Arg *arg : args.filtered(OPT_syslibroot)) + roots.push_back(arg->getValue()); + // NOTE: the final `-syslibroot` being `/` will ignore all roots + if (roots.size() && roots.back() == "/") + roots.clear(); + // NOTE: roots can never be empty - add an empty root to simplify the library + // and framework search path computation. + if (roots.empty()) + roots.emplace_back(""); + return roots; +} + +static std::vector<StringRef> +getLibrarySearchPaths(InputArgList &args, const std::vector<StringRef> &roots) { + return getSearchPaths(OPT_L, args, roots, {"/usr/lib", "/usr/local/lib"}); } -static TargetInfo *createTargetInfo(opt::InputArgList &args) { - StringRef s = args.getLastArgValue(OPT_arch, "x86_64"); - if (s != "x86_64") - error("missing or unsupported -arch " + s); - return createX86_64TargetInfo(); +static std::vector<StringRef> +getFrameworkSearchPaths(InputArgList &args, + const std::vector<StringRef> &roots) { + return getSearchPaths(OPT_F, args, roots, + {"/Library/Frameworks", "/System/Library/Frameworks"}); } -static std::vector<StringRef> getSearchPaths(opt::InputArgList &args) { - std::vector<StringRef> ret{args::getStrings(args, OPT_L)}; - if (!args.hasArg(OPT_Z)) { - ret.push_back("/usr/lib"); - ret.push_back("/usr/local/lib"); +namespace { +struct ArchiveMember { + MemoryBufferRef mbref; + uint32_t modTime; +}; +} // namespace + +// Returns slices of MB by parsing MB as an archive file. +// Each slice consists of a member file in the archive. +static std::vector<ArchiveMember> getArchiveMembers(MemoryBufferRef mb) { + std::unique_ptr<Archive> file = + CHECK(Archive::create(mb), + mb.getBufferIdentifier() + ": failed to parse archive"); + Archive *archive = file.get(); + make<std::unique_ptr<Archive>>(std::move(file)); // take ownership + + std::vector<ArchiveMember> v; + Error err = Error::success(); + + // Thin archives refer to .o files, so --reproduce needs the .o files too. + bool addToTar = archive->isThin() && tar; + + for (const Archive::Child &c : archive->children(err)) { + MemoryBufferRef mbref = + CHECK(c.getMemoryBufferRef(), + mb.getBufferIdentifier() + + ": could not get the buffer for a child of the archive"); + if (addToTar) + tar->append(relativeToRoot(check(c.getFullName())), mbref.getBuffer()); + uint32_t modTime = toTimeT( + CHECK(c.getLastModified(), mb.getBufferIdentifier() + + ": could not get the modification " + "time for a child of the archive")); + v.push_back({mbref, modTime}); } - return ret; + if (err) + fatal(mb.getBufferIdentifier() + + ": Archive::children failed: " + toString(std::move(err))); + + return v; } -static void addFile(StringRef path) { +static InputFile *addFile(StringRef path, bool forceLoadArchive, + bool isExplicit = true, + bool isBundleLoader = false) { Optional<MemoryBufferRef> buffer = readFile(path); if (!buffer) - return; + return nullptr; MemoryBufferRef mbref = *buffer; + InputFile *newFile = nullptr; - switch (identify_magic(mbref.getBuffer())) { + file_magic magic = identify_magic(mbref.getBuffer()); + switch (magic) { case file_magic::archive: { std::unique_ptr<object::Archive> file = CHECK( object::Archive::create(mbref), path + ": failed to parse archive"); @@ -114,39 +253,178 @@ if (!file->isEmpty() && !file->hasSymbolTable()) error(path + ": archive has no index; run ranlib to add one"); - inputFiles.push_back(make<ArchiveFile>(std::move(file))); + if (config->allLoad || forceLoadArchive) { + if (Optional<MemoryBufferRef> buffer = readFile(path)) { + for (const ArchiveMember &member : getArchiveMembers(*buffer)) { + if (Optional<InputFile *> file = loadArchiveMember( + member.mbref, member.modTime, path, /*objCOnly=*/false)) { + inputFiles.insert(*file); + printArchiveMemberLoad( + (forceLoadArchive ? "-force_load" : "-all_load"), + inputFiles.back()); + } + } + } + } else if (config->forceLoadObjC) { + for (const object::Archive::Symbol &sym : file->symbols()) + if (sym.getName().startswith(objc::klass)) + symtab->addUndefined(sym.getName(), /*file=*/nullptr, + /*isWeakRef=*/false); + + // TODO: no need to look for ObjC sections for a given archive member if + // we already found that it contains an ObjC symbol. We should also + // consider creating a LazyObjFile class in order to avoid double-loading + // these files here and below (as part of the ArchiveFile). + if (Optional<MemoryBufferRef> buffer = readFile(path)) { + for (const ArchiveMember &member : getArchiveMembers(*buffer)) { + if (Optional<InputFile *> file = loadArchiveMember( + member.mbref, member.modTime, path, /*objCOnly=*/true)) { + inputFiles.insert(*file); + printArchiveMemberLoad("-ObjC", inputFiles.back()); + } + } + } + } + + newFile = make<ArchiveFile>(std::move(file)); break; } case file_magic::macho_object: - inputFiles.push_back(make<ObjFile>(mbref)); + newFile = make<ObjFile>(mbref, getModTime(path), ""); break; case file_magic::macho_dynamically_linked_shared_lib: - inputFiles.push_back(make<DylibFile>(mbref)); + case file_magic::macho_dynamically_linked_shared_lib_stub: + case file_magic::tapi_file: + if (DylibFile * dylibFile = loadDylib(mbref)) { + if (isExplicit) + dylibFile->explicitlyLinked = true; + newFile = dylibFile; + } + break; + case file_magic::bitcode: + newFile = make<BitcodeFile>(mbref); + break; + case file_magic::macho_executable: + case file_magic::macho_bundle: + // We only allow executable and bundle type here if it is used + // as a bundle loader. + if (!isBundleLoader) + error(path + ": unhandled file type"); + if (DylibFile *dylibFile = loadDylib(mbref, nullptr, isBundleLoader)) + newFile = dylibFile; break; default: error(path + ": unhandled file type"); } + if (newFile) { + // printArchiveMemberLoad() prints both .a and .o names, so no need to + // print the .a name here. + if (config->printEachFile && magic != file_magic::archive && + !isa<DylibFile>(newFile)) + message(toString(newFile)); + inputFiles.insert(newFile); + } + return newFile; +} + +static void addLibrary(StringRef name, bool isNeeded, bool isWeak, + bool isReexport, bool isExplicit) { + if (Optional<StringRef> path = findLibrary(name)) { + if (auto *dylibFile = dyn_cast_or_null<DylibFile>( + addFile(*path, /*forceLoadArchive=*/false, isExplicit))) { + if (isNeeded) + dylibFile->forceNeeded = true; + if (isWeak) + dylibFile->forceWeakImport = true; + if (isReexport) { + config->hasReexports = true; + dylibFile->reexport = true; + } + } + return; + } + error("library not found for -l" + name); } -static std::array<StringRef, 6> archNames{"arm", "arm64", "i386", - "x86_64", "ppc", "ppc64"}; -static bool isArchString(StringRef s) { - static DenseSet<StringRef> archNamesSet(archNames.begin(), archNames.end()); - return archNamesSet.find(s) != archNamesSet.end(); +static void addFramework(StringRef name, bool isNeeded, bool isWeak, + bool isReexport, bool isExplicit) { + if (Optional<std::string> path = findFramework(name)) { + if (auto *dylibFile = dyn_cast_or_null<DylibFile>( + addFile(*path, /*forceLoadArchive=*/false, isExplicit))) { + if (isNeeded) + dylibFile->forceNeeded = true; + if (isWeak) + dylibFile->forceWeakImport = true; + if (isReexport) { + config->hasReexports = true; + dylibFile->reexport = true; + } + } + return; + } + error("framework not found for -framework " + name); +} + +// Parses LC_LINKER_OPTION contents, which can add additional command line +// flags. +void macho::parseLCLinkerOption(InputFile *f, unsigned argc, StringRef data) { + SmallVector<const char *, 4> argv; + size_t offset = 0; + for (unsigned i = 0; i < argc && offset < data.size(); ++i) { + argv.push_back(data.data() + offset); + offset += strlen(data.data() + offset) + 1; + } + if (argv.size() != argc || offset > data.size()) + fatal(toString(f) + ": invalid LC_LINKER_OPTION"); + + MachOOptTable table; + unsigned missingIndex, missingCount; + InputArgList args = table.ParseArgs(argv, missingIndex, missingCount); + if (missingCount) + fatal(Twine(args.getArgString(missingIndex)) + ": missing argument"); + for (const Arg *arg : args.filtered(OPT_UNKNOWN)) + error("unknown argument: " + arg->getAsString(args)); + + for (const Arg *arg : args) { + switch (arg->getOption().getID()) { + case OPT_l: + addLibrary(arg->getValue(), /*isNeeded=*/false, /*isWeak=*/false, + /*isReexport=*/false, /*isExplicit=*/false); + break; + case OPT_framework: + addFramework(arg->getValue(), /*isNeeded=*/false, /*isWeak=*/false, + /*isReexport=*/false, /*isExplicit=*/false); + break; + default: + error(arg->getSpelling() + " is not allowed in LC_LINKER_OPTION"); + } + } +} + +static void addFileList(StringRef path) { + Optional<MemoryBufferRef> buffer = readFile(path); + if (!buffer) + return; + MemoryBufferRef mbref = *buffer; + for (StringRef path : args::getLines(mbref)) + addFile(rerootPath(path), /*forceLoadArchive=*/false); } // An order file has one entry per line, in the following format: // -// <arch>:<object file>:<symbol name> +// <cpu>:<object file>:<symbol name> // -// <arch> and <object file> are optional. If not specified, then that entry -// matches any symbol of that name. +// <cpu> and <object file> are optional. If not specified, then that entry +// matches any symbol of that name. Parsing this format is not quite +// straightforward because the symbol name itself can contain colons, so when +// encountering a colon, we consider the preceding characters to decide if it +// can be a valid CPU type or file path. // // If a symbol is matched by multiple entries, then it takes the lowest-ordered // entry (the one nearest to the front of the list.) // // The file can also have line comments that start with '#'. -void parseOrderFile(StringRef path) { +static void parseOrderFile(StringRef path) { Optional<MemoryBufferRef> buffer = readFile(path); if (!buffer) { error("Could not read order file at " + path); @@ -155,59 +433,38 @@ MemoryBufferRef mbref = *buffer; size_t priority = std::numeric_limits<size_t>::max(); - for (StringRef rest : args::getLines(mbref)) { - StringRef arch, objectFile, symbol; + for (StringRef line : args::getLines(mbref)) { + StringRef objectFile, symbol; + line = line.take_until([](char c) { return c == '#'; }); // ignore comments + line = line.ltrim(); - std::array<StringRef, 3> fields; - uint8_t fieldCount = 0; - while (rest != "" && fieldCount < 3) { - std::pair<StringRef, StringRef> p = getToken(rest, ": \t\n\v\f\r"); - StringRef tok = p.first; - rest = p.second; - - // Check if we have a comment - if (tok == "" || tok[0] == '#') - break; - - fields[fieldCount++] = tok; - } + CPUType cpuType = StringSwitch<CPUType>(line) + .StartsWith("i386:", CPU_TYPE_I386) + .StartsWith("x86_64:", CPU_TYPE_X86_64) + .StartsWith("arm:", CPU_TYPE_ARM) + .StartsWith("arm64:", CPU_TYPE_ARM64) + .StartsWith("ppc:", CPU_TYPE_POWERPC) + .StartsWith("ppc64:", CPU_TYPE_POWERPC64) + .Default(CPU_TYPE_ANY); - switch (fieldCount) { - case 3: - arch = fields[0]; - objectFile = fields[1]; - symbol = fields[2]; - break; - case 2: - (isArchString(fields[0]) ? arch : objectFile) = fields[0]; - symbol = fields[1]; - break; - case 1: - symbol = fields[0]; - break; - case 0: - break; - default: - llvm_unreachable("too many fields in order file"); + if (cpuType != CPU_TYPE_ANY && cpuType != target->cpuType) + continue; + + // Drop the CPU type as well as the colon + if (cpuType != CPU_TYPE_ANY) + line = line.drop_until([](char c) { return c == ':'; }).drop_front(); + + constexpr std::array<StringRef, 2> fileEnds = {".o:", ".o):"}; + for (StringRef fileEnd : fileEnds) { + size_t pos = line.find(fileEnd); + if (pos != StringRef::npos) { + // Split the string around the colon + objectFile = line.take_front(pos + fileEnd.size() - 1); + line = line.drop_front(pos + fileEnd.size()); + break; + } } - - if (!arch.empty()) { - if (!isArchString(arch)) { - error("invalid arch \"" + arch + "\" in order file: expected one of " + - llvm::join(archNames, ", ")); - continue; - } - - // TODO: Update when we extend support for other archs - if (arch != "x86_64") - continue; - } - - if (!objectFile.empty() && !objectFile.endswith(".o")) { - error("invalid object file name \"" + objectFile + - "\" in order file: should end with .o"); - continue; - } + symbol = line.trim(); if (!symbol.empty()) { SymbolPriorityEntry &entry = config->priorities[symbol]; @@ -222,12 +479,16 @@ } // We expect sub-library names of the form "libfoo", which will match a dylib -// with a path of .*/libfoo.dylib. -static bool markSubLibrary(StringRef searchName) { +// with a path of .*/libfoo.{dylib, tbd}. +// XXX ld64 seems to ignore the extension entirely when matching sub-libraries; +// I'm not sure what the use case for that is. +static bool markReexport(StringRef searchName, ArrayRef<StringRef> extensions) { for (InputFile *file : inputFiles) { if (auto *dylibFile = dyn_cast<DylibFile>(file)) { StringRef filename = path::filename(dylibFile->getName()); - if (filename.consume_front(searchName) && filename == ".dylib") { + if (filename.consume_front(searchName) && + (filename.empty() || + find(extensions, filename) != extensions.end())) { dylibFile->reexport = true; return true; } @@ -236,111 +497,826 @@ return false; } -static void handlePlatformVersion(opt::ArgList::iterator &it, - const opt::ArgList::iterator &end) { - // -platform_version takes 3 args, which LLVM's option library doesn't - // support directly. So this explicitly handles that. - // FIXME: stash skipped args for later use. - for (int i = 0; i < 3; ++i) { - ++it; - if (it == end || (*it)->getOption().getID() != OPT_INPUT) - fatal("usage: -platform_version platform min_version sdk_version"); +// This function is called on startup. We need this for LTO since +// LTO calls LLVM functions to compile bitcode files to native code. +// Technically this can be delayed until we read bitcode files, but +// we don't bother to do lazily because the initialization is fast. +static void initLLVM() { + InitializeAllTargets(); + InitializeAllTargetMCs(); + InitializeAllAsmPrinters(); + InitializeAllAsmParsers(); +} + +static void compileBitcodeFiles() { + TimeTraceScope timeScope("LTO"); + auto *lto = make<BitcodeCompiler>(); + for (InputFile *file : inputFiles) + if (auto *bitcodeFile = dyn_cast<BitcodeFile>(file)) + lto->add(*bitcodeFile); + + for (ObjFile *file : lto->compile()) + inputFiles.insert(file); +} + +// Replaces common symbols with defined symbols residing in __common sections. +// This function must be called after all symbol names are resolved (i.e. after +// all InputFiles have been loaded.) As a result, later operations won't see +// any CommonSymbols. +static void replaceCommonSymbols() { + TimeTraceScope timeScope("Replace common symbols"); + for (Symbol *sym : symtab->getSymbols()) { + auto *common = dyn_cast<CommonSymbol>(sym); + if (common == nullptr) + continue; + + auto *isec = make<InputSection>(); + isec->file = common->getFile(); + isec->name = section_names::common; + isec->segname = segment_names::data; + isec->align = common->align; + // Casting to size_t will truncate large values on 32-bit architectures, + // but it's not really worth supporting the linking of 64-bit programs on + // 32-bit archs. + isec->data = {nullptr, static_cast<size_t>(common->size)}; + isec->flags = S_ZEROFILL; + inputSections.push_back(isec); + + // FIXME: CommonSymbol should store isReferencedDynamically, noDeadStrip + // and pass them on here. + replaceSymbol<Defined>(sym, sym->getName(), isec->file, isec, /*value=*/0, + /*size=*/0, + /*isWeakDef=*/false, + /*isExternal=*/true, common->privateExtern, + /*isThumb=*/false, + /*isReferencedDynamically=*/false, + /*noDeadStrip=*/false); + } +} + +static void initializeSectionRenameMap() { + if (config->dataConst) { + SmallVector<StringRef> v{section_names::got, + section_names::authGot, + section_names::authPtr, + section_names::nonLazySymbolPtr, + section_names::const_, + section_names::cfString, + section_names::moduleInitFunc, + section_names::moduleTermFunc, + section_names::objcClassList, + section_names::objcNonLazyClassList, + section_names::objcCatList, + section_names::objcNonLazyCatList, + section_names::objcProtoList, + section_names::objcImageInfo}; + for (StringRef s : v) + config->sectionRenameMap[{segment_names::data, s}] = { + segment_names::dataConst, s}; + } + config->sectionRenameMap[{segment_names::text, section_names::staticInit}] = { + segment_names::text, section_names::text}; + config->sectionRenameMap[{segment_names::import, section_names::pointers}] = { + config->dataConst ? segment_names::dataConst : segment_names::data, + section_names::nonLazySymbolPtr}; +} + +static inline char toLowerDash(char x) { + if (x >= 'A' && x <= 'Z') + return x - 'A' + 'a'; + else if (x == ' ') + return '-'; + return x; +} + +static std::string lowerDash(StringRef s) { + return std::string(map_iterator(s.begin(), toLowerDash), + map_iterator(s.end(), toLowerDash)); +} + +// Has the side-effect of setting Config::platformInfo. +static PlatformKind parsePlatformVersion(const ArgList &args) { + const Arg *arg = args.getLastArg(OPT_platform_version); + if (!arg) { + error("must specify -platform_version"); + return PlatformKind::unknown; + } + + StringRef platformStr = arg->getValue(0); + StringRef minVersionStr = arg->getValue(1); + StringRef sdkVersionStr = arg->getValue(2); + + // TODO(compnerd) see if we can generate this case list via XMACROS + PlatformKind platform = + StringSwitch<PlatformKind>(lowerDash(platformStr)) + .Cases("macos", "1", PlatformKind::macOS) + .Cases("ios", "2", PlatformKind::iOS) + .Cases("tvos", "3", PlatformKind::tvOS) + .Cases("watchos", "4", PlatformKind::watchOS) + .Cases("bridgeos", "5", PlatformKind::bridgeOS) + .Cases("mac-catalyst", "6", PlatformKind::macCatalyst) + .Cases("ios-simulator", "7", PlatformKind::iOSSimulator) + .Cases("tvos-simulator", "8", PlatformKind::tvOSSimulator) + .Cases("watchos-simulator", "9", PlatformKind::watchOSSimulator) + .Cases("driverkit", "10", PlatformKind::driverKit) + .Default(PlatformKind::unknown); + if (platform == PlatformKind::unknown) + error(Twine("malformed platform: ") + platformStr); + // TODO: check validity of version strings, which varies by platform + // NOTE: ld64 accepts version strings with 5 components + // llvm::VersionTuple accepts no more than 4 components + // Has Apple ever published version strings with 5 components? + if (config->platformInfo.minimum.tryParse(minVersionStr)) + error(Twine("malformed minimum version: ") + minVersionStr); + if (config->platformInfo.sdk.tryParse(sdkVersionStr)) + error(Twine("malformed sdk version: ") + sdkVersionStr); + return platform; +} + +// Has the side-effect of setting Config::target. +static TargetInfo *createTargetInfo(InputArgList &args) { + StringRef archName = args.getLastArgValue(OPT_arch); + if (archName.empty()) + fatal("must specify -arch"); + PlatformKind platform = parsePlatformVersion(args); + + config->platformInfo.target = + MachO::Target(getArchitectureFromName(archName), platform); + + uint32_t cpuType; + uint32_t cpuSubtype; + std::tie(cpuType, cpuSubtype) = getCPUTypeFromArchitecture(config->arch()); + + switch (cpuType) { + case CPU_TYPE_X86_64: + return createX86_64TargetInfo(); + case CPU_TYPE_ARM64: + return createARM64TargetInfo(); + case CPU_TYPE_ARM64_32: + return createARM64_32TargetInfo(); + case CPU_TYPE_ARM: + return createARMTargetInfo(cpuSubtype); + default: + fatal("missing or unsupported -arch " + archName); + } +} + +static UndefinedSymbolTreatment +getUndefinedSymbolTreatment(const ArgList &args) { + StringRef treatmentStr = args.getLastArgValue(OPT_undefined); + auto treatment = + StringSwitch<UndefinedSymbolTreatment>(treatmentStr) + .Cases("error", "", UndefinedSymbolTreatment::error) + .Case("warning", UndefinedSymbolTreatment::warning) + .Case("suppress", UndefinedSymbolTreatment::suppress) + .Case("dynamic_lookup", UndefinedSymbolTreatment::dynamic_lookup) + .Default(UndefinedSymbolTreatment::unknown); + if (treatment == UndefinedSymbolTreatment::unknown) { + warn(Twine("unknown -undefined TREATMENT '") + treatmentStr + + "', defaulting to 'error'"); + treatment = UndefinedSymbolTreatment::error; + } else if (config->namespaceKind == NamespaceKind::twolevel && + (treatment == UndefinedSymbolTreatment::warning || + treatment == UndefinedSymbolTreatment::suppress)) { + if (treatment == UndefinedSymbolTreatment::warning) + error("'-undefined warning' only valid with '-flat_namespace'"); + else + error("'-undefined suppress' only valid with '-flat_namespace'"); + treatment = UndefinedSymbolTreatment::error; + } + return treatment; +} + +static void warnIfDeprecatedOption(const Option &opt) { + if (!opt.getGroup().isValid()) + return; + if (opt.getGroup().getID() == OPT_grp_deprecated) { + warn("Option `" + opt.getPrefixedName() + "' is deprecated in ld64:"); + warn(opt.getHelpText()); } } -bool macho::link(llvm::ArrayRef<const char *> argsArr, bool canExitEarly, +static void warnIfUnimplementedOption(const Option &opt) { + if (!opt.getGroup().isValid() || !opt.hasFlag(DriverFlag::HelpHidden)) + return; + switch (opt.getGroup().getID()) { + case OPT_grp_deprecated: + // warn about deprecated options elsewhere + break; + case OPT_grp_undocumented: + warn("Option `" + opt.getPrefixedName() + + "' is undocumented. Should lld implement it?"); + break; + case OPT_grp_obsolete: + warn("Option `" + opt.getPrefixedName() + + "' is obsolete. Please modernize your usage."); + break; + case OPT_grp_ignored: + warn("Option `" + opt.getPrefixedName() + "' is ignored."); + break; + default: + warn("Option `" + opt.getPrefixedName() + + "' is not yet implemented. Stay tuned..."); + break; + } +} + +static const char *getReproduceOption(InputArgList &args) { + if (const Arg *arg = args.getLastArg(OPT_reproduce)) + return arg->getValue(); + return getenv("LLD_REPRODUCE"); +} + +static void parseClangOption(StringRef opt, const Twine &msg) { + std::string err; + raw_string_ostream os(err); + + const char *argv[] = {"lld", opt.data()}; + if (cl::ParseCommandLineOptions(2, argv, "", &os)) + return; + os.flush(); + error(msg + ": " + StringRef(err).trim()); +} + +static uint32_t parseDylibVersion(const ArgList &args, unsigned id) { + const Arg *arg = args.getLastArg(id); + if (!arg) + return 0; + + if (config->outputType != MH_DYLIB) { + error(arg->getAsString(args) + ": only valid with -dylib"); + return 0; + } + + PackedVersion version; + if (!version.parse32(arg->getValue())) { + error(arg->getAsString(args) + ": malformed version"); + return 0; + } + + return version.rawValue(); +} + +static uint32_t parseProtection(StringRef protStr) { + uint32_t prot = 0; + for (char c : protStr) { + switch (c) { + case 'r': + prot |= VM_PROT_READ; + break; + case 'w': + prot |= VM_PROT_WRITE; + break; + case 'x': + prot |= VM_PROT_EXECUTE; + break; + case '-': + break; + default: + error("unknown -segprot letter '" + Twine(c) + "' in " + protStr); + return 0; + } + } + return prot; +} + +static std::vector<SectionAlign> parseSectAlign(const opt::InputArgList &args) { + std::vector<SectionAlign> sectAligns; + for (const Arg *arg : args.filtered(OPT_sectalign)) { + StringRef segName = arg->getValue(0); + StringRef sectName = arg->getValue(1); + StringRef alignStr = arg->getValue(2); + if (alignStr.startswith("0x") || alignStr.startswith("0X")) + alignStr = alignStr.drop_front(2); + uint32_t align; + if (alignStr.getAsInteger(16, align)) { + error("-sectalign: failed to parse '" + StringRef(arg->getValue(2)) + + "' as number"); + continue; + } + if (!isPowerOf2_32(align)) { + error("-sectalign: '" + StringRef(arg->getValue(2)) + + "' (in base 16) not a power of two"); + continue; + } + sectAligns.push_back({segName, sectName, align}); + } + return sectAligns; +} + +static bool dataConstDefault(const InputArgList &args) { + switch (config->outputType) { + case MH_EXECUTE: + return !args.hasArg(OPT_no_pie); + case MH_BUNDLE: + // FIXME: return false when -final_name ... + // has prefix "/System/Library/UserEventPlugins/" + // or matches "/usr/libexec/locationd" "/usr/libexec/terminusd" + return true; + case MH_DYLIB: + return true; + case MH_OBJECT: + return false; + default: + llvm_unreachable( + "unsupported output type for determining data-const default"); + } + return false; +} + +void SymbolPatterns::clear() { + literals.clear(); + globs.clear(); +} + +void SymbolPatterns::insert(StringRef symbolName) { + if (symbolName.find_first_of("*?[]") == StringRef::npos) + literals.insert(CachedHashStringRef(symbolName)); + else if (Expected<GlobPattern> pattern = GlobPattern::create(symbolName)) + globs.emplace_back(*pattern); + else + error("invalid symbol-name pattern: " + symbolName); +} + +bool SymbolPatterns::matchLiteral(StringRef symbolName) const { + return literals.contains(CachedHashStringRef(symbolName)); +} + +bool SymbolPatterns::matchGlob(StringRef symbolName) const { + for (const llvm::GlobPattern &glob : globs) + if (glob.match(symbolName)) + return true; + return false; +} + +bool SymbolPatterns::match(StringRef symbolName) const { + return matchLiteral(symbolName) || matchGlob(symbolName); +} + +static void handleSymbolPatterns(InputArgList &args, + SymbolPatterns &symbolPatterns, + unsigned singleOptionCode, + unsigned listFileOptionCode) { + for (const Arg *arg : args.filtered(singleOptionCode)) + symbolPatterns.insert(arg->getValue()); + for (const Arg *arg : args.filtered(listFileOptionCode)) { + StringRef path = arg->getValue(); + Optional<MemoryBufferRef> buffer = readFile(path); + if (!buffer) { + error("Could not read symbol file: " + path); + continue; + } + MemoryBufferRef mbref = *buffer; + for (StringRef line : args::getLines(mbref)) { + line = line.take_until([](char c) { return c == '#'; }).trim(); + if (!line.empty()) + symbolPatterns.insert(line); + } + } +} + +void createFiles(const InputArgList &args) { + TimeTraceScope timeScope("Load input files"); + // This loop should be reserved for options whose exact ordering matters. + // Other options should be handled via filtered() and/or getLastArg(). + for (const Arg *arg : args) { + const Option &opt = arg->getOption(); + warnIfDeprecatedOption(opt); + warnIfUnimplementedOption(opt); + + switch (opt.getID()) { + case OPT_INPUT: + addFile(rerootPath(arg->getValue()), /*forceLoadArchive=*/false); + break; + case OPT_needed_library: + if (auto *dylibFile = dyn_cast_or_null<DylibFile>( + addFile(rerootPath(arg->getValue()), false))) + dylibFile->forceNeeded = true; + break; + case OPT_reexport_library: + if (auto *dylibFile = dyn_cast_or_null<DylibFile>(addFile( + rerootPath(arg->getValue()), /*forceLoadArchive=*/false))) { + config->hasReexports = true; + dylibFile->reexport = true; + } + break; + case OPT_weak_library: + if (auto *dylibFile = dyn_cast_or_null<DylibFile>( + addFile(rerootPath(arg->getValue()), /*forceLoadArchive=*/false))) + dylibFile->forceWeakImport = true; + break; + case OPT_filelist: + addFileList(arg->getValue()); + break; + case OPT_force_load: + addFile(rerootPath(arg->getValue()), /*forceLoadArchive=*/true); + break; + case OPT_l: + case OPT_needed_l: + case OPT_reexport_l: + case OPT_weak_l: + addLibrary(arg->getValue(), opt.getID() == OPT_needed_l, + opt.getID() == OPT_weak_l, opt.getID() == OPT_reexport_l, + /*isExplicit=*/true); + break; + case OPT_framework: + case OPT_needed_framework: + case OPT_reexport_framework: + case OPT_weak_framework: + addFramework(arg->getValue(), opt.getID() == OPT_needed_framework, + opt.getID() == OPT_weak_framework, + opt.getID() == OPT_reexport_framework, /*isExplicit=*/true); + break; + default: + break; + } + } +} + +bool macho::link(ArrayRef<const char *> argsArr, bool canExitEarly, raw_ostream &stdoutOS, raw_ostream &stderrOS) { lld::stdoutOS = &stdoutOS; lld::stderrOS = &stderrOS; + errorHandler().cleanupCallback = []() { freeArena(); }; + + errorHandler().logName = args::getFilenameWithoutExe(argsArr[0]); stderrOS.enable_colors(stderrOS.has_colors()); - // TODO: Set up error handler properly, e.g. the errorLimitExceededMsg MachOOptTable parser; - opt::InputArgList args = parser.parse(argsArr.slice(1)); + InputArgList args = parser.parse(argsArr.slice(1)); + + errorHandler().errorLimitExceededMsg = + "too many errors emitted, stopping now " + "(use --error-limit=0 to see all errors)"; + errorHandler().errorLimit = args::getInteger(args, OPT_error_limit_eq, 20); + errorHandler().verbose = args.hasArg(OPT_verbose); + + if (args.hasArg(OPT_help_hidden)) { + parser.printHelp(argsArr[0], /*showHidden=*/true); + return true; + } + if (args.hasArg(OPT_help)) { + parser.printHelp(argsArr[0], /*showHidden=*/false); + return true; + } + if (args.hasArg(OPT_version)) { + message(getLLDVersion()); + return true; + } config = make<Configuration>(); symtab = make<SymbolTable>(); target = createTargetInfo(args); + depTracker = + make<DependencyTracker>(args.getLastArgValue(OPT_dependency_info)); - config->entry = symtab->addUndefined(args.getLastArgValue(OPT_e, "_main")); - config->outputFile = args.getLastArgValue(OPT_o, "a.out"); - config->installName = - args.getLastArgValue(OPT_install_name, config->outputFile); - config->searchPaths = getSearchPaths(args); - config->outputType = args.hasArg(OPT_dylib) ? MH_DYLIB : MH_EXECUTE; + // Must be set before any InputSections and Symbols are created. + config->deadStrip = args.hasArg(OPT_dead_strip); - if (args.hasArg(OPT_v)) { - message(getLLDVersion()); - std::vector<StringRef> &searchPaths = config->searchPaths; - message("Library search paths:\n" + - llvm::join(searchPaths.begin(), searchPaths.end(), "\n")); - freeArena(); - return !errorCount(); - } - - for (opt::ArgList::iterator it = args.begin(), end = args.end(); it != end; - ++it) { - const opt::Arg *arg = *it; - switch (arg->getOption().getID()) { - case OPT_INPUT: - addFile(arg->getValue()); - break; - case OPT_l: - if (Optional<std::string> path = findDylib(arg->getValue())) - addFile(*path); - break; - case OPT_platform_version: { - handlePlatformVersion(it, end); // Can advance "it". - break; - } + config->systemLibraryRoots = getSystemLibraryRoots(args); + if (const char *path = getReproduceOption(args)) { + // Note that --reproduce is a debug option so you can ignore it + // if you are trying to understand the whole picture of the code. + Expected<std::unique_ptr<TarWriter>> errOrWriter = + TarWriter::create(path, path::stem(path)); + if (errOrWriter) { + tar = std::move(*errOrWriter); + tar->append("response.txt", createResponseFile(args)); + tar->append("version.txt", getLLDVersion() + "\n"); + } else { + error("--reproduce: " + toString(errOrWriter.takeError())); } } - // Now that all dylibs have been loaded, search for those that should be - // re-exported. - for (opt::Arg *arg : args.filtered(OPT_sub_library)) { - config->hasReexports = true; - StringRef searchName = arg->getValue(); - if (!markSubLibrary(searchName)) - error("-sub_library " + searchName + " does not match a supplied dylib"); + if (auto *arg = args.getLastArg(OPT_threads_eq)) { + StringRef v(arg->getValue()); + unsigned threads = 0; + if (!llvm::to_integer(v, threads, 0) || threads == 0) + error(arg->getSpelling() + ": expected a positive integer, but got '" + + arg->getValue() + "'"); + parallel::strategy = hardware_concurrency(threads); + config->thinLTOJobs = v; + } + if (auto *arg = args.getLastArg(OPT_thinlto_jobs_eq)) + config->thinLTOJobs = arg->getValue(); + if (!get_threadpool_strategy(config->thinLTOJobs)) + error("--thinlto-jobs: invalid job count: " + config->thinLTOJobs); + + for (const Arg *arg : args.filtered(OPT_u)) { + config->explicitUndefineds.push_back(symtab->addUndefined( + arg->getValue(), /*file=*/nullptr, /*isWeakRef=*/false)); + } + + for (const Arg *arg : args.filtered(OPT_U)) + symtab->addDynamicLookup(arg->getValue()); + + config->mapFile = args.getLastArgValue(OPT_map); + config->outputFile = args.getLastArgValue(OPT_o, "a.out"); + config->astPaths = args.getAllArgValues(OPT_add_ast_path); + config->headerPad = args::getHex(args, OPT_headerpad, /*Default=*/32); + config->headerPadMaxInstallNames = + args.hasArg(OPT_headerpad_max_install_names); + config->printEachFile = args.hasArg(OPT_t); + config->printWhyLoad = args.hasArg(OPT_why_load); + config->outputType = getOutputType(args); + if (const Arg *arg = args.getLastArg(OPT_bundle_loader)) { + if (config->outputType != MH_BUNDLE) + error("-bundle_loader can only be used with MachO bundle output"); + addFile(arg->getValue(), /*forceLoadArchive=*/false, /*isExplicit=*/false, + /*isBundleLoader=*/true); + } + config->ltoObjPath = args.getLastArgValue(OPT_object_path_lto); + config->ltoNewPassManager = + args.hasFlag(OPT_no_lto_legacy_pass_manager, OPT_lto_legacy_pass_manager, + LLVM_ENABLE_NEW_PASS_MANAGER); + config->runtimePaths = args::getStrings(args, OPT_rpath); + config->allLoad = args.hasArg(OPT_all_load); + config->forceLoadObjC = args.hasArg(OPT_ObjC); + config->deadStripDylibs = args.hasArg(OPT_dead_strip_dylibs); + config->demangle = args.hasArg(OPT_demangle); + config->implicitDylibs = !args.hasArg(OPT_no_implicit_dylibs); + config->emitFunctionStarts = !args.hasArg(OPT_no_function_starts); + config->emitBitcodeBundle = args.hasArg(OPT_bitcode_bundle); + + // FIXME: Add a commandline flag for this too. + config->zeroModTime = getenv("ZERO_AR_DATE"); + + std::array<PlatformKind, 3> encryptablePlatforms{ + PlatformKind::iOS, PlatformKind::watchOS, PlatformKind::tvOS}; + config->emitEncryptionInfo = + args.hasFlag(OPT_encryptable, OPT_no_encryption, + is_contained(encryptablePlatforms, config->platform())); + +#ifndef LLVM_HAVE_LIBXAR + if (config->emitBitcodeBundle) + error("-bitcode_bundle unsupported because LLD wasn't built with libxar"); +#endif + + if (const Arg *arg = args.getLastArg(OPT_install_name)) { + if (config->outputType != MH_DYLIB) + warn(arg->getAsString(args) + ": ignored, only has effect with -dylib"); + else + config->installName = arg->getValue(); + } else if (config->outputType == MH_DYLIB) { + config->installName = config->outputFile; + } + + if (args.hasArg(OPT_mark_dead_strippable_dylib)) { + if (config->outputType != MH_DYLIB) + warn("-mark_dead_strippable_dylib: ignored, only has effect with -dylib"); + else + config->markDeadStrippableDylib = true; + } + + if (const Arg *arg = args.getLastArg(OPT_static, OPT_dynamic)) + config->staticLink = (arg->getOption().getID() == OPT_static); + + if (const Arg *arg = + args.getLastArg(OPT_flat_namespace, OPT_twolevel_namespace)) + config->namespaceKind = arg->getOption().getID() == OPT_twolevel_namespace + ? NamespaceKind::twolevel + : NamespaceKind::flat; + + config->undefinedSymbolTreatment = getUndefinedSymbolTreatment(args); + + if (config->outputType == MH_EXECUTE) + config->entry = symtab->addUndefined(args.getLastArgValue(OPT_e, "_main"), + /*file=*/nullptr, + /*isWeakRef=*/false); + + config->librarySearchPaths = + getLibrarySearchPaths(args, config->systemLibraryRoots); + config->frameworkSearchPaths = + getFrameworkSearchPaths(args, config->systemLibraryRoots); + if (const Arg *arg = + args.getLastArg(OPT_search_paths_first, OPT_search_dylibs_first)) + config->searchDylibsFirst = + arg->getOption().getID() == OPT_search_dylibs_first; + + config->dylibCompatibilityVersion = + parseDylibVersion(args, OPT_compatibility_version); + config->dylibCurrentVersion = parseDylibVersion(args, OPT_current_version); + + config->dataConst = + args.hasFlag(OPT_data_const, OPT_no_data_const, dataConstDefault(args)); + // Populate config->sectionRenameMap with builtin default renames. + // Options -rename_section and -rename_segment are able to override. + initializeSectionRenameMap(); + // Reject every special character except '.' and '$' + // TODO(gkm): verify that this is the proper set of invalid chars + StringRef invalidNameChars("!\"#%&'()*+,-/:;<=>?@[\\]^`{|}~"); + auto validName = [invalidNameChars](StringRef s) { + if (s.find_first_of(invalidNameChars) != StringRef::npos) + error("invalid name for segment or section: " + s); + return s; + }; + for (const Arg *arg : args.filtered(OPT_rename_section)) { + config->sectionRenameMap[{validName(arg->getValue(0)), + validName(arg->getValue(1))}] = { + validName(arg->getValue(2)), validName(arg->getValue(3))}; + } + for (const Arg *arg : args.filtered(OPT_rename_segment)) { + config->segmentRenameMap[validName(arg->getValue(0))] = + validName(arg->getValue(1)); + } + + config->sectionAlignments = parseSectAlign(args); + + for (const Arg *arg : args.filtered(OPT_segprot)) { + StringRef segName = arg->getValue(0); + uint32_t maxProt = parseProtection(arg->getValue(1)); + uint32_t initProt = parseProtection(arg->getValue(2)); + if (maxProt != initProt && config->arch() != AK_i386) + error("invalid argument '" + arg->getAsString(args) + + "': max and init must be the same for non-i386 archs"); + if (segName == segment_names::linkEdit) + error("-segprot cannot be used to change __LINKEDIT's protections"); + config->segmentProtections.push_back({segName, maxProt, initProt}); } - StringRef orderFile = args.getLastArgValue(OPT_order_file); - if (!orderFile.empty()) - parseOrderFile(orderFile); + handleSymbolPatterns(args, config->exportedSymbols, OPT_exported_symbol, + OPT_exported_symbols_list); + handleSymbolPatterns(args, config->unexportedSymbols, OPT_unexported_symbol, + OPT_unexported_symbols_list); + if (!config->exportedSymbols.empty() && !config->unexportedSymbols.empty()) { + error("cannot use both -exported_symbol* and -unexported_symbol* options\n" + ">>> ignoring unexports"); + config->unexportedSymbols.clear(); + } + // Explicitly-exported literal symbols must be defined, but might + // languish in an archive if unreferenced elsewhere. Light a fire + // under those lazy symbols! + for (const CachedHashStringRef &cachedName : config->exportedSymbols.literals) + symtab->addUndefined(cachedName.val(), /*file=*/nullptr, + /*isWeakRef=*/false); - // dyld requires us to load libSystem. Since we may run tests on non-OSX - // systems which do not have libSystem, we mock it out here. - // TODO: Replace this with a stub tbd file once we have TAPI support. - if (StringRef(getenv("LLD_IN_TEST")) == "1" && - config->outputType == MH_EXECUTE) { - inputFiles.push_back(DylibFile::createLibSystemMock()); + config->saveTemps = args.hasArg(OPT_save_temps); + + config->adhocCodesign = args.hasFlag( + OPT_adhoc_codesign, OPT_no_adhoc_codesign, + (config->arch() == AK_arm64 || config->arch() == AK_arm64e) && + config->platform() == PlatformKind::macOS); + + if (args.hasArg(OPT_v)) { + message(getLLDVersion()); + message(StringRef("Library search paths:") + + (config->librarySearchPaths.empty() + ? "" + : "\n\t" + join(config->librarySearchPaths, "\n\t"))); + message(StringRef("Framework search paths:") + + (config->frameworkSearchPaths.empty() + ? "" + : "\n\t" + join(config->frameworkSearchPaths, "\n\t"))); } - if (config->outputType == MH_EXECUTE && !isa<Defined>(config->entry)) { - error("undefined symbol: " + config->entry->getName()); - return false; + config->progName = argsArr[0]; + + config->timeTraceEnabled = args.hasArg( + OPT_time_trace, OPT_time_trace_granularity_eq, OPT_time_trace_file_eq); + config->timeTraceGranularity = + args::getInteger(args, OPT_time_trace_granularity_eq, 500); + + // Initialize time trace profiler. + if (config->timeTraceEnabled) + timeTraceProfilerInitialize(config->timeTraceGranularity, config->progName); + + { + TimeTraceScope timeScope("ExecuteLinker"); + + initLLVM(); // must be run before any call to addFile() + createFiles(args); + + config->isPic = config->outputType == MH_DYLIB || + config->outputType == MH_BUNDLE || + (config->outputType == MH_EXECUTE && + args.hasFlag(OPT_pie, OPT_no_pie, true)); + + // Now that all dylibs have been loaded, search for those that should be + // re-exported. + { + auto reexportHandler = [](const Arg *arg, + const std::vector<StringRef> &extensions) { + config->hasReexports = true; + StringRef searchName = arg->getValue(); + if (!markReexport(searchName, extensions)) + error(arg->getSpelling() + " " + searchName + + " does not match a supplied dylib"); + }; + std::vector<StringRef> extensions = {".tbd"}; + for (const Arg *arg : args.filtered(OPT_sub_umbrella)) + reexportHandler(arg, extensions); + + extensions.push_back(".dylib"); + for (const Arg *arg : args.filtered(OPT_sub_library)) + reexportHandler(arg, extensions); + } + + // Parse LTO options. + if (const Arg *arg = args.getLastArg(OPT_mcpu)) + parseClangOption(saver.save("-mcpu=" + StringRef(arg->getValue())), + arg->getSpelling()); + + for (const Arg *arg : args.filtered(OPT_mllvm)) + parseClangOption(arg->getValue(), arg->getSpelling()); + + compileBitcodeFiles(); + replaceCommonSymbols(); + + StringRef orderFile = args.getLastArgValue(OPT_order_file); + if (!orderFile.empty()) + parseOrderFile(orderFile); + + if (config->entry) + if (auto *undefined = dyn_cast<Undefined>(config->entry)) + treatUndefinedSymbol(*undefined, "the entry point"); + + // FIXME: This prints symbols that are undefined both in input files and + // via -u flag twice. + for (const Symbol *sym : config->explicitUndefineds) { + if (const auto *undefined = dyn_cast<Undefined>(sym)) + treatUndefinedSymbol(*undefined, "-u"); + } + // Literal exported-symbol names must be defined, but glob + // patterns need not match. + for (const CachedHashStringRef &cachedName : + config->exportedSymbols.literals) { + if (const Symbol *sym = symtab->find(cachedName)) + if (const auto *undefined = dyn_cast<Undefined>(sym)) + treatUndefinedSymbol(*undefined, "-exported_symbol(s_list)"); + } + + // FIXME: should terminate the link early based on errors encountered so + // far? + + createSyntheticSections(); + createSyntheticSymbols(); + + if (!config->exportedSymbols.empty()) { + for (Symbol *sym : symtab->getSymbols()) { + if (auto *defined = dyn_cast<Defined>(sym)) { + StringRef symbolName = defined->getName(); + if (config->exportedSymbols.match(symbolName)) { + if (defined->privateExtern) { + error("cannot export hidden symbol " + symbolName + + "\n>>> defined in " + toString(defined->getFile())); + } + } else { + defined->privateExtern = true; + } + } + } + } else if (!config->unexportedSymbols.empty()) { + for (Symbol *sym : symtab->getSymbols()) + if (auto *defined = dyn_cast<Defined>(sym)) + if (config->unexportedSymbols.match(defined->getName())) + defined->privateExtern = true; + } + + for (const Arg *arg : args.filtered(OPT_sectcreate)) { + StringRef segName = arg->getValue(0); + StringRef sectName = arg->getValue(1); + StringRef fileName = arg->getValue(2); + Optional<MemoryBufferRef> buffer = readFile(fileName); + if (buffer) + inputFiles.insert(make<OpaqueFile>(*buffer, segName, sectName)); + } + + { + TimeTraceScope timeScope("Gathering input sections"); + // Gather all InputSections into one vector. + for (const InputFile *file : inputFiles) { + for (const SubsectionMap &map : file->subsections) + for (const SubsectionEntry &subsectionEntry : map) + inputSections.push_back(subsectionEntry.isec); + } + } + + if (config->deadStrip) + markLive(); + + // Write to an output file. + if (target->wordSize == 8) + writeResult<LP64>(); + else + writeResult<ILP32>(); + + depTracker->write(getLLDVersion(), inputFiles, config->outputFile); } - createSyntheticSections(); + if (config->timeTraceEnabled) { + if (auto E = timeTraceProfilerWrite( + args.getLastArgValue(OPT_time_trace_file_eq).str(), + config->outputFile)) { + handleAllErrors(std::move(E), + [&](const StringError &SE) { error(SE.getMessage()); }); + } - // Initialize InputSections. - for (InputFile *file : inputFiles) { - for (SubsectionMap &map : file->subsections) { - for (auto &p : map) { - InputSection *isec = p.second; - inputSections.push_back(isec); - } - } + timeTraceProfilerCleanup(); } - // Write to an output file. - writeResult(); - if (canExitEarly) exitLld(errorCount() ? 1 : 0); - freeArena(); return !errorCount(); }