-
Notifications
You must be signed in to change notification settings - Fork 15.2k
[lld][MachO]Multi-threaded i/o. Twice as fast linking a large project. #147134
New issue
Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.
By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.
Already on GitHub? Sign in to your account
Changes from all commits
c55b5b2
3d11a33
02fb145
a8eeead
55e26a8
817036b
c07e168
eb4827c
ce93ae3
c47e5c3
5caf5a6
890c492
9714785
85fd77f
6f5f7cb
e3e0369
febf5a9
a5f7a42
6b874b2
84154d4
ed9f07e
ff732ed
ef23af2
4bf74e8
ed9bdb7
4cab9be
f7c8008
a6dd0bc
cf5c3fb
5901e7d
39cffd0
0af2bde
bb91c53
432fb04
30b8c13
File filter
Filter by extension
Conversations
Jump to
Diff view
Diff view
There are no files selected for viewing
Original file line number | Diff line number | Diff line change |
---|---|---|
|
@@ -44,8 +44,10 @@ | |
#include "llvm/Support/FileSystem.h" | ||
#include "llvm/Support/Parallel.h" | ||
#include "llvm/Support/Path.h" | ||
#include "llvm/Support/Process.h" | ||
#include "llvm/Support/TarWriter.h" | ||
#include "llvm/Support/TargetSelect.h" | ||
#include "llvm/Support/Threading.h" | ||
#include "llvm/Support/TimeProfiler.h" | ||
#include "llvm/TargetParser/Host.h" | ||
#include "llvm/TextAPI/Architecture.h" | ||
|
@@ -282,11 +284,117 @@ static void saveThinArchiveToRepro(ArchiveFile const *file) { | |
": Archive::children failed: " + toString(std::move(e))); | ||
} | ||
|
||
static InputFile *addFile(StringRef path, LoadType loadType, | ||
bool isLazy = false, bool isExplicit = true, | ||
bool isBundleLoader = false, | ||
bool isForceHidden = false) { | ||
std::optional<MemoryBufferRef> buffer = readFile(path); | ||
struct DeferredFile { | ||
StringRef path; | ||
bool isLazy; | ||
MemoryBufferRef buffer; | ||
}; | ||
using DeferredFiles = std::vector<DeferredFile>; | ||
|
||
// Runs queued jobs one at a time, in FIFO order, on a background thread.
//
// A worker thread is started when a job is queued and no worker is active; it
// exits once the queue is empty. A finished worker is joined lazily by the
// next call to queueWork(), or by the destructor.
//
// NOTE: the worker handle is joined outside the lock, so calling queueWork()
// concurrently from several threads is not supported.
class SerialBackgroundQueue {
  std::deque<std::function<void()>> queue;
  std::thread running; // Not joinable when no worker has been started.
  std::mutex mutex;    // Guards `queue`.

  // Worker body: execute jobs until the queue is empty.
  void drain() {
    std::unique_lock<std::mutex> lock(mutex);
    while (!queue.empty()) {
      std::function<void()> job = std::move(queue.front());
      lock.unlock();
      job();
      lock.lock();
      // The entry is removed only after the job has finished. While a job is
      // in flight the queue is therefore never empty, so queueWork() does not
      // try to join (and block on) a worker that is still busy.
      queue.pop_front();
    }
  }

public:
  SerialBackgroundQueue() = default;
  SerialBackgroundQueue(const SerialBackgroundQueue &) = delete;
  SerialBackgroundQueue &operator=(const SerialBackgroundQueue &) = delete;

  // Waits for any remaining jobs; destroying a joinable std::thread would
  // otherwise terminate the program.
  ~SerialBackgroundQueue() {
    if (running.joinable())
      running.join();
  }

  // Appends `work` to the queue, starting a worker if none is active.
  // Passing an empty function only reaps a worker that has run out of jobs.
  void queueWork(std::function<void()> work) {
    std::unique_lock<std::mutex> lock(mutex);

    // An empty queue with a live handle means the worker has finished or is
    // about to; reap it so a fresh one can be started below.
    if (running.joinable() && queue.empty()) {
      lock.unlock();
      running.join();
      lock.lock();
    }

    if (!work)
      return;

    queue.emplace_back(std::move(work));
    if (!running.joinable())
      running = std::thread([this] { drain(); });
  }
};
|
||
// Most input files have been mapped but not yet paged in.
// Reading one byte from every page of each buffer, spread over several
// worker tasks, forces the page-ins up front so the process is not stalled
// waiting on disk buffer i/o later.
void multiThreadedPageInBackground(DeferredFiles &deferred) {
  static const size_t pageSize = Process::getPageSizeEstimate();
  static const size_t largeArchive = 10 * 1024 * 1024;
#ifndef NDEBUG
  using namespace std::chrono;
  std::atomic_int touchedFileCount = 0;
  static std::atomic_uint64_t totalBytes = 0;
  auto startTime = high_resolution_clock::now();
#endif

  auto touchPages = [&](const DeferredFile &entry) {
    StringRef contents = entry.buffer.getBuffer();
    // Buffers above the size threshold are left alone.
    if (contents.size() > largeArchive)
      return;
#ifndef NDEBUG
    totalBytes += contents.size();
    touchedFileCount += 1;
#endif

    // Reference all file's mmap'd pages to load them into memory.
    // NOTE(review): a sanitizer bot run reported a possible use-after-free on
    // this read. Reviewers suspected the page-in thread can still be running
    // when the buffers are deallocated -- confirm buffer lifetime.
    const char *cursor = contents.data();
    const char *const limit = cursor + contents.size();
    while (cursor < limit) {
      LLVM_ATTRIBUTE_UNUSED volatile char sink = *cursor;
      cursor += pageSize;
    }
  };
#if LLVM_ENABLE_THREADS
  { // Create scope for waiting for the taskGroup
    std::atomic_size_t nextIndex = 0;
    llvm::parallel::TaskGroup taskGroup;
    for (int worker = 0; worker < config->readWorkers; worker++)
      taskGroup.spawn([&nextIndex, &touchPages, &deferred]() {
        // Each task keeps claiming the next unprocessed entry until the
        // shared counter runs past the end of the list.
        for (size_t claimed = nextIndex.fetch_add(1);
             claimed < deferred.size(); claimed = nextIndex.fetch_add(1))
          touchPages(deferred[claimed]);
      });
  }
#endif
#ifndef NDEBUG
  auto elapsed = high_resolution_clock::now() - startTime;
  if (Process::GetEnv("LLD_MULTI_THREAD_PAGE"))
    llvm::dbgs() << "multiThreadedPageIn " << totalBytes << "/"
                 << touchedFileCount << "/" << deferred.size() << "/"
                 << duration_cast<milliseconds>(elapsed).count() / 1000.
                 << "\n";
#endif
}
|
||
static void multiThreadedPageIn(const DeferredFiles &deferred) { | ||
static SerialBackgroundQueue pageInQueue; | ||
pageInQueue.queueWork([=]() { | ||
DeferredFiles files = deferred; | ||
multiThreadedPageInBackground(files); | ||
}); | ||
} | ||
|
||
static InputFile *processFile(std::optional<MemoryBufferRef> buffer, | ||
DeferredFiles *archiveContents, StringRef path, | ||
LoadType loadType, bool isLazy = false, | ||
bool isExplicit = true, | ||
bool isBundleLoader = false, | ||
bool isForceHidden = false) { | ||
if (!buffer) | ||
return nullptr; | ||
MemoryBufferRef mbref = *buffer; | ||
|
@@ -379,6 +487,8 @@ static InputFile *addFile(StringRef path, LoadType loadType, | |
continue; | ||
} | ||
|
||
if (archiveContents) | ||
archiveContents->push_back({path, isLazy, *mb}); | ||
if (!hasObjCSection(*mb)) | ||
continue; | ||
if (Error e = file->fetch(c, "-ObjC")) | ||
|
@@ -390,7 +500,8 @@ static InputFile *addFile(StringRef path, LoadType loadType, | |
": Archive::children failed: " + toString(std::move(e))); | ||
} | ||
} | ||
file->addLazySymbols(); | ||
if (!archiveContents || archiveContents->empty()) | ||
file->addLazySymbols(); | ||
loadedArchives[path] = ArchiveFileInfo{file, isCommandLineLoad}; | ||
newFile = file; | ||
break; | ||
|
@@ -441,6 +552,24 @@ static InputFile *addFile(StringRef path, LoadType loadType, | |
return newFile; | ||
} | ||
|
||
// Reads the file at `path` and processes it immediately. No archive-content
// list is collected (the archiveContents argument is null); every other
// argument is forwarded to processFile unchanged.
static InputFile *addFile(StringRef path, LoadType loadType,
                          bool isLazy = false, bool isExplicit = true,
                          bool isBundleLoader = false,
                          bool isForceHidden = false) {
  std::optional<MemoryBufferRef> contents = readFile(path);
  return processFile(contents, /*archiveContents=*/nullptr, path, loadType,
                     isLazy, isExplicit, isBundleLoader, isForceHidden);
}
|
||
// Reads the file at `path`. With read workers configured the file is only
// recorded in `deferred`; otherwise it is processed right away as a
// command-line load. A file that cannot be read is skipped.
static void deferFile(StringRef path, bool isLazy, DeferredFiles &deferred) {
  std::optional<MemoryBufferRef> contents = readFile(path);
  if (!contents.has_value())
    return;

  // No read workers: nothing to defer, handle the file now.
  if (!config->readWorkers) {
    processFile(contents, nullptr, path, LoadType::CommandLine, isLazy);
    return;
  }

  deferred.push_back({path, isLazy, *contents});
}
|
||
static std::vector<StringRef> missingAutolinkWarnings; | ||
static void addLibrary(StringRef name, bool isNeeded, bool isWeak, | ||
bool isReexport, bool isHidden, bool isExplicit, | ||
|
@@ -564,13 +693,14 @@ void macho::resolveLCLinkerOptions() { | |
} | ||
} | ||
|
||
static void addFileList(StringRef path, bool isLazy) { | ||
static void addFileList(StringRef path, bool isLazy, | ||
DeferredFiles &deferredFiles) { | ||
std::optional<MemoryBufferRef> buffer = readFile(path); | ||
if (!buffer) | ||
return; | ||
MemoryBufferRef mbref = *buffer; | ||
for (StringRef path : args::getLines(mbref)) | ||
addFile(rerootPath(path), LoadType::CommandLine, isLazy); | ||
deferFile(rerootPath(path), isLazy, deferredFiles); | ||
} | ||
|
||
// We expect sub-library names of the form "libfoo", which will match a dylib | ||
|
@@ -1222,14 +1352,16 @@ static void createFiles(const InputArgList &args) { | |
bool isLazy = false; | ||
// If we've processed an opening --start-lib, without a matching --end-lib | ||
bool inLib = false; | ||
DeferredFiles deferredFiles; | ||
|
||
for (const Arg *arg : args) { | ||
const Option &opt = arg->getOption(); | ||
warnIfDeprecatedOption(opt); | ||
warnIfUnimplementedOption(opt); | ||
|
||
switch (opt.getID()) { | ||
case OPT_INPUT: | ||
addFile(rerootPath(arg->getValue()), LoadType::CommandLine, isLazy); | ||
deferFile(rerootPath(arg->getValue()), isLazy, deferredFiles); | ||
break; | ||
case OPT_needed_library: | ||
if (auto *dylibFile = dyn_cast_or_null<DylibFile>( | ||
|
@@ -1249,7 +1381,7 @@ static void createFiles(const InputArgList &args) { | |
dylibFile->forceWeakImport = true; | ||
break; | ||
case OPT_filelist: | ||
addFileList(arg->getValue(), isLazy); | ||
addFileList(arg->getValue(), isLazy, deferredFiles); | ||
break; | ||
case OPT_force_load: | ||
addFile(rerootPath(arg->getValue()), LoadType::CommandLineForce); | ||
|
@@ -1295,6 +1427,24 @@ static void createFiles(const InputArgList &args) { | |
break; | ||
} | ||
} | ||
|
||
if (config->readWorkers) { | ||
multiThreadedPageIn(deferredFiles); | ||
|
||
DeferredFiles archiveContents; | ||
std::vector<ArchiveFile *> archives; | ||
for (auto &file : deferredFiles) { | ||
auto inputFile = processFile(file.buffer, &archiveContents, file.path, | ||
LoadType::CommandLine, file.isLazy); | ||
if (ArchiveFile *archive = dyn_cast<ArchiveFile>(inputFile)) | ||
archives.push_back(archive); | ||
} | ||
|
||
if (!archiveContents.empty()) | ||
multiThreadedPageIn(archiveContents); | ||
for (auto *archive : archives) | ||
archive->addLazySymbols(); | ||
} | ||
} | ||
|
||
static void gatherInputSections() { | ||
|
@@ -1687,6 +1837,14 @@ bool link(ArrayRef<const char *> argsArr, llvm::raw_ostream &stdoutOS, | |
} | ||
} | ||
|
||
if (auto *arg = args.getLastArg(OPT_read_workers)) { | ||
StringRef v(arg->getValue()); | ||
unsigned threads = 0; | ||
if (!llvm::to_integer(v, threads, 0) || threads < 0) | ||
johnno1962 marked this conversation as resolved.
Show resolved
Hide resolved
|
||
error(arg->getSpelling() + ": expected a positive integer, but got '" + | ||
arg->getValue() + "'"); | ||
config->readWorkers = threads; | ||
} | ||
if (auto *arg = args.getLastArg(OPT_threads_eq)) { | ||
StringRef v(arg->getValue()); | ||
unsigned threads = 0; | ||
|
Uh oh!
There was an error while loading. Please reload this page.