Skip to content

[lld][MachO] Multi-threaded I/O. Twice as fast linking a large project. #147134

New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Open
wants to merge 35 commits into
base: main
Choose a base branch
from
Open
Show file tree
Hide file tree
Changes from all commits
Commits
Show all changes
35 commits
Select commit Hold shift + click to select a range
c55b5b2
Multi-threaded disk i/o.
johnno1962 Jul 5, 2025
3d11a33
Afterthoughts.
johnno1962 Jul 6, 2025
02fb145
multiThreadedPageIn of library archives.
johnno1962 Jul 6, 2025
a8eeead
Multi-thread i/o in background.
johnno1962 Jul 8, 2025
55e26a8
Response to first review.
johnno1962 Jul 9, 2025
817036b
Second review.
johnno1962 Jul 12, 2025
c07e168
Seems to make a difference.
johnno1962 Jul 12, 2025
eb4827c
Update lld/MachO/Driver.cpp
johnno1962 Jul 15, 2025
ce93ae3
De-Obfuscate loop and thread reaping.
johnno1962 Jul 15, 2025
c47e5c3
Avoiding possible deadlock.
johnno1962 Jul 17, 2025
5caf5a6
Update lld/MachO/Options.td
johnno1962 Jul 17, 2025
890c492
Update lld/MachO/Driver.cpp
johnno1962 Jul 17, 2025
9714785
Update lld/MachO/Driver.cpp
johnno1962 Jul 17, 2025
85fd77f
Update lld/MachO/Driver.cpp
johnno1962 Jul 17, 2025
6f5f7cb
Fourth review.
johnno1962 Jul 17, 2025
e3e0369
Switch to std::atomic_int.
johnno1962 Jul 17, 2025
febf5a9
Switch to std::unique_ptr.
johnno1962 Jul 17, 2025
a5f7a42
Remove a couple of warnings.
johnno1962 Jul 18, 2025
6b874b2
Try LLVM_ATTRIBUTE_UNUSED
johnno1962 Jul 18, 2025
84154d4
Update lld/MachO/Driver.cpp
johnno1962 Jul 18, 2025
ed9f07e
Comparing inner loops.
johnno1962 Jul 18, 2025
ff732ed
Is this valid C++??
johnno1962 Jul 19, 2025
ef23af2
In search of a work queue abstraction.
johnno1962 Jul 21, 2025
4bf74e8
OK to use Process::GetEnv?
johnno1962 Jul 21, 2025
ed9bdb7
Formatting of benchmarks.
johnno1962 Jul 22, 2025
4cab9be
Encapsulate SerialBackgroundQueue. Remove DEBUG output.
johnno1962 Jul 25, 2025
f7c8008
Revert LLVM_DEBUG as gives error: use of undeclared identifier 'DEBUG…
johnno1962 Jul 25, 2025
a6dd0bc
Update lld/MachO/Driver.cpp
johnno1962 Jul 26, 2025
cf5c3fb
Add NDEBUGs
johnno1962 Jul 26, 2025
5901e7d
Update lld/MachO/Driver.cpp
johnno1962 Jul 30, 2025
39cffd0
Update lld/MachO/Driver.cpp
johnno1962 Jul 30, 2025
0af2bde
Update lld/MachO/Options.td
johnno1962 Jul 30, 2025
bb91c53
Fifth review followups.
johnno1962 Jul 30, 2025
432fb04
Headers no longer used
johnno1962 Aug 6, 2025
30b8c13
Threads becomes workers.
johnno1962 Aug 7, 2025
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
1 change: 1 addition & 0 deletions lld/MachO/Config.h
Original file line number Diff line number Diff line change
Expand Up @@ -186,6 +186,7 @@ struct Configuration {
bool interposable = false;
bool errorForArchMismatch = false;
bool ignoreAutoLink = false;
int readWorkers = 0;
// ld64 allows invalid auto link options as long as the link succeeds. LLD
// does not, but there are cases in the wild where the invalid linker options
// exist. This allows users to ignore the specific invalid options in the case
Expand Down
178 changes: 168 additions & 10 deletions lld/MachO/Driver.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -44,8 +44,10 @@
#include "llvm/Support/FileSystem.h"
#include "llvm/Support/Parallel.h"
#include "llvm/Support/Path.h"
#include "llvm/Support/Process.h"
#include "llvm/Support/TarWriter.h"
#include "llvm/Support/TargetSelect.h"
#include "llvm/Support/Threading.h"
#include "llvm/Support/TimeProfiler.h"
#include "llvm/TargetParser/Host.h"
#include "llvm/TextAPI/Architecture.h"
Expand Down Expand Up @@ -282,11 +284,117 @@ static void saveThinArchiveToRepro(ArchiveFile const *file) {
": Archive::children failed: " + toString(std::move(e)));
}

static InputFile *addFile(StringRef path, LoadType loadType,
bool isLazy = false, bool isExplicit = true,
bool isBundleLoader = false,
bool isForceHidden = false) {
std::optional<MemoryBufferRef> buffer = readFile(path);
// An input whose contents have already been read but whose processing has
// been postponed so that its pages can be preloaded first (see deferFile).
// The same record is also appended to the archiveContents list while an
// archive is being processed.
// NOTE: instances are brace-initialised as {path, isLazy, buffer}, so the
// field order below must not change.
struct DeferredFile {
// Path the record was created for (presumably the archive's path when the
// record describes an archive member -- confirm against processFile).
StringRef path;
// Lazy-loading flag that is handed to processFile when the file is processed.
bool isLazy;
// The contents of the file.
MemoryBufferRef buffer;
};
// Ordered list of deferred inputs.
using DeferredFiles = std::vector<DeferredFile>;

// Runs queued work items one at a time, in FIFO order, on a single background
// thread. The thread is started on demand and exits once the queue is drained;
// the next call to queueWork() reaps it and, if needed, starts a fresh one.
//
// queueWork() is meant to be called from one producer thread only: the
// `running` pointer is read and written by the producer without further
// synchronisation.
class SerialBackgroundQueue {
  std::deque<std::function<void()>> queue;
  // Worker thread, or nullptr when none has been started or the previous one
  // has been reaped. Explicitly initialised so that instances with automatic
  // storage duration are well-defined too.
  std::thread *running = nullptr;
  std::mutex mutex;

  // Body of the worker thread: execute items until the queue is empty.
  void drain() {
    std::unique_lock<std::mutex> lock(mutex);
    while (!queue.empty()) {
      // The (moved-from) entry stays at the front while the item executes so
      // that queue.empty() keeps reporting "busy" to the producer.
      std::function<void()> work = std::move(queue.front());
      lock.unlock();
      work();
      lock.lock();
      queue.pop_front();
    }
  }

public:
  SerialBackgroundQueue() = default;

  // Wait for outstanding work before the queue and mutex are destroyed;
  // otherwise the worker could touch members that no longer exist.
  ~SerialBackgroundQueue() {
    if (running) {
      running->join();
      delete running;
    }
  }

  // Append `work` to the queue and make sure a worker thread is processing
  // it. Passing an empty function only reaps a worker that has already
  // drained the queue.
  void queueWork(std::function<void()> work) {
    std::unique_lock<std::mutex> lock(mutex);
    if (running && queue.empty()) {
      // The worker has finished (or is about to notice the empty queue).
      // Join without holding the mutex so it can take it one last time.
      lock.unlock();
      running->join();
      lock.lock();
      delete running;
      running = nullptr;
    }

    if (!work)
      return;

    queue.emplace_back(std::move(work));
    if (!running)
      running = new std::thread([this] { drain(); });
  }
};

// Most input files have been mapped by now, but their pages have not been
// brought into memory yet. Touch every page of every deferred file from
// config->readWorkers tasks so the page-ins happen up front, in parallel,
// rather than stalling the process on disk i/o later.
void multiThreadedPageInBackground(DeferredFiles &deferred) {
  static const size_t pageSize = Process::getPageSizeEstimate();
  static const size_t largeArchive = 10 * 1024 * 1024;
#ifndef NDEBUG
  using namespace std::chrono;
  std::atomic_int filesTouched = 0;
  static std::atomic_uint64_t totalBytes = 0;
  auto startTime = high_resolution_clock::now();
#endif

  auto preloadDeferredFile = [&](const DeferredFile &deferredFile) {
    const StringRef contents = deferredFile.buffer.getBuffer();
    // Buffers above the size threshold are not preloaded.
    if (contents.size() > largeArchive)
      return;
#ifndef NDEBUG
    totalBytes += contents.size();
    filesTouched += 1;
#endif

    // Read one byte from each page of the mapping; storing it into a volatile
    // local keeps the load from being optimised away.
    const char *const limit = contents.data() + contents.size();
    for (const char *cursor = contents.data(); cursor < limit;
         cursor += pageSize)
      LLVM_ATTRIBUTE_UNUSED volatile char touched = *cursor;
  };
#if LLVM_ENABLE_THREADS
  { // Scope whose exit waits for the task group to finish.
    std::atomic_size_t nextIndex = 0;
    llvm::parallel::TaskGroup workers;
    for (int w = 0; w < config->readWorkers; w++)
      workers.spawn([&nextIndex, &preloadDeferredFile, &deferred]() {
        // Each task keeps claiming the next unclaimed file until none remain.
        for (size_t i = nextIndex.fetch_add(1); i < deferred.size();
             i = nextIndex.fetch_add(1))
          preloadDeferredFile(deferred[i]);
      });
  }
#endif
#ifndef NDEBUG
  auto elapsed = high_resolution_clock::now() - startTime;
  if (Process::GetEnv("LLD_MULTI_THREAD_PAGE"))
    llvm::dbgs() << "multiThreadedPageIn " << totalBytes << "/" << filesTouched
                 << "/" << deferred.size() << "/"
                 << duration_cast<milliseconds>(elapsed).count() / 1000.
                 << "\n";
#endif
}

// Schedule a page-in of `deferred` on the shared background queue and return
// immediately. Requests are served one after another in the order queued.
static void multiThreadedPageIn(const DeferredFiles &deferred) {
  static SerialBackgroundQueue pageInQueue;
  // The caller's vector may be modified or destroyed before the work runs, so
  // the closure owns its own copy. Marking the closure `mutable` lets that
  // copy be passed as the non-const reference multiThreadedPageInBackground
  // expects, instead of copying the whole vector a second time.
  pageInQueue.queueWork([files = deferred]() mutable {
    multiThreadedPageInBackground(files);
  });
}

static InputFile *processFile(std::optional<MemoryBufferRef> buffer,
DeferredFiles *archiveContents, StringRef path,
LoadType loadType, bool isLazy = false,
bool isExplicit = true,
bool isBundleLoader = false,
bool isForceHidden = false) {
if (!buffer)
return nullptr;
MemoryBufferRef mbref = *buffer;
Expand Down Expand Up @@ -379,6 +487,8 @@ static InputFile *addFile(StringRef path, LoadType loadType,
continue;
}

if (archiveContents)
archiveContents->push_back({path, isLazy, *mb});
if (!hasObjCSection(*mb))
continue;
if (Error e = file->fetch(c, "-ObjC"))
Expand All @@ -390,7 +500,8 @@ static InputFile *addFile(StringRef path, LoadType loadType,
": Archive::children failed: " + toString(std::move(e)));
}
}
file->addLazySymbols();
if (!archiveContents || archiveContents->empty())
file->addLazySymbols();
loadedArchives[path] = ArchiveFileInfo{file, isCommandLineLoad};
newFile = file;
break;
Expand Down Expand Up @@ -441,6 +552,24 @@ static InputFile *addFile(StringRef path, LoadType loadType,
return newFile;
}

// Read `path` and process it immediately, without recording archive contents
// for later preloading. Returns whatever processFile returns, which is
// nullptr when the file could not be read.
static InputFile *addFile(StringRef path, LoadType loadType,
                          bool isLazy = false, bool isExplicit = true,
                          bool isBundleLoader = false,
                          bool isForceHidden = false) {
  std::optional<MemoryBufferRef> contents = readFile(path);
  return processFile(contents, /*archiveContents=*/nullptr, path, loadType,
                     isLazy, isExplicit, isBundleLoader, isForceHidden);
}

// Read `path` and either process it straight away (when read workers are
// disabled) or append it to `deferred` for processing later. Unreadable files
// are skipped.
static void deferFile(StringRef path, bool isLazy, DeferredFiles &deferred) {
  std::optional<MemoryBufferRef> contents = readFile(path);
  if (!contents)
    return;

  // With preloading disabled there is nothing to gain from postponing.
  if (!config->readWorkers) {
    processFile(contents, nullptr, path, LoadType::CommandLine, isLazy);
    return;
  }
  deferred.push_back({path, isLazy, *contents});
}

static std::vector<StringRef> missingAutolinkWarnings;
static void addLibrary(StringRef name, bool isNeeded, bool isWeak,
bool isReexport, bool isHidden, bool isExplicit,
Expand Down Expand Up @@ -564,13 +693,14 @@ void macho::resolveLCLinkerOptions() {
}
}

static void addFileList(StringRef path, bool isLazy) {
// Read the file list at `path` and pass every line it contains, rerooted, to
// deferFile. Nothing happens if the list itself cannot be read.
static void addFileList(StringRef path, bool isLazy,
                        DeferredFiles &deferredFiles) {
  std::optional<MemoryBufferRef> listing = readFile(path);
  if (!listing)
    return;
  MemoryBufferRef listRef = *listing;
  for (StringRef entry : args::getLines(listRef))
    deferFile(rerootPath(entry), isLazy, deferredFiles);
}

// We expect sub-library names of the form "libfoo", which will match a dylib
Expand Down Expand Up @@ -1222,14 +1352,16 @@ static void createFiles(const InputArgList &args) {
bool isLazy = false;
// If we've processed an opening --start-lib, without a matching --end-lib
bool inLib = false;
DeferredFiles deferredFiles;

for (const Arg *arg : args) {
const Option &opt = arg->getOption();
warnIfDeprecatedOption(opt);
warnIfUnimplementedOption(opt);

switch (opt.getID()) {
case OPT_INPUT:
addFile(rerootPath(arg->getValue()), LoadType::CommandLine, isLazy);
deferFile(rerootPath(arg->getValue()), isLazy, deferredFiles);
break;
case OPT_needed_library:
if (auto *dylibFile = dyn_cast_or_null<DylibFile>(
Expand All @@ -1249,7 +1381,7 @@ static void createFiles(const InputArgList &args) {
dylibFile->forceWeakImport = true;
break;
case OPT_filelist:
addFileList(arg->getValue(), isLazy);
addFileList(arg->getValue(), isLazy, deferredFiles);
break;
case OPT_force_load:
addFile(rerootPath(arg->getValue()), LoadType::CommandLineForce);
Expand Down Expand Up @@ -1295,6 +1427,24 @@ static void createFiles(const InputArgList &args) {
break;
}
}

if (config->readWorkers) {
  // Kick off the background page-in of everything that was deferred, then
  // process the files on this thread while that is in progress.
  multiThreadedPageIn(deferredFiles);

  DeferredFiles archiveContents;
  std::vector<ArchiveFile *> archives;
  for (auto &file : deferredFiles) {
    InputFile *inputFile =
        processFile(file.buffer, &archiveContents, file.path,
                    LoadType::CommandLine, file.isLazy);
    // processFile may return nullptr, and dyn_cast asserts on a null
    // argument, so use the null-tolerant form.
    if (auto *archive = dyn_cast_or_null<ArchiveFile>(inputFile))
      archives.push_back(archive);
  }

  // Preload whatever the archives recorded, then register their lazy symbols
  // (processFile skips that step when it has recorded archive contents).
  if (!archiveContents.empty())
    multiThreadedPageIn(archiveContents);
  for (auto *archive : archives)
    archive->addLazySymbols();
}
}

static void gatherInputSections() {
Expand Down Expand Up @@ -1687,6 +1837,14 @@ bool link(ArrayRef<const char *> argsArr, llvm::raw_ostream &stdoutOS,
}
}

if (auto *arg = args.getLastArg(OPT_read_workers)) {
  StringRef v(arg->getValue());
  // Parse directly into the signed type of config->readWorkers. This makes
  // the negative check meaningful (it was always false on an unsigned value)
  // and rejects values that would not fit instead of narrowing them.
  // 0 is accepted and leaves the feature disabled.
  int workers = 0;
  if (!llvm::to_integer(v, workers, 0) || workers < 0)
    error(arg->getSpelling() + ": expected a positive integer, but got '" +
          arg->getValue() + "'");
  else
    config->readWorkers = workers;
}
if (auto *arg = args.getLastArg(OPT_threads_eq)) {
StringRef v(arg->getValue());
unsigned threads = 0;
Expand Down
3 changes: 3 additions & 0 deletions lld/MachO/Options.td
Original file line number Diff line number Diff line change
Expand Up @@ -396,6 +396,9 @@ def dead_strip : Flag<["-"], "dead_strip">,
def interposable : Flag<["-"], "interposable">,
HelpText<"Indirects access to all exported symbols in an image">,
Group<grp_opts>;
// --read-workers=<n>: the driver parses the value into config->readWorkers;
// a non-zero value defers command-line inputs so their pages can be preloaded
// in the background before they are processed.
def read_workers : Joined<["--"], "read-workers=">,
HelpText<"Approximate number of workers to use to eagerly preload input files content into memory. Use 0 to disable this feature. Default is disabled.">,
Group<grp_lld>;
def order_file : Separate<["-"], "order_file">,
MetaVarName<"<file>">,
HelpText<"Layout functions and data according to specification in <file>">,
Expand Down