@@ -98,7 +98,8 @@ class InProcessFunctionExecutorImpl : public BenchmarkRunner::FunctionExecutor {
9898public:
9999 static Expected<std::unique_ptr<InProcessFunctionExecutorImpl>>
100100 create (const LLVMState &State, object::OwningBinary<object::ObjectFile> Obj,
101- BenchmarkRunner::ScratchSpace *Scratch) {
101+ BenchmarkRunner::ScratchSpace *Scratch,
102+ std::optional<int > BenchmarkProcessCPU) {
102103 Expected<ExecutableFunction> EF =
103104 ExecutableFunction::create (State.createTargetMachine (), std::move (Obj));
104105
@@ -190,27 +191,31 @@ class SubProcessFunctionExecutorImpl
190191public:
191192 static Expected<std::unique_ptr<SubProcessFunctionExecutorImpl>>
192193 create (const LLVMState &State, object::OwningBinary<object::ObjectFile> Obj,
193- const BenchmarkKey &Key) {
194+ const BenchmarkKey &Key, std::optional< int > BenchmarkProcessCPU ) {
194195 Expected<ExecutableFunction> EF =
195196 ExecutableFunction::create (State.createTargetMachine (), std::move (Obj));
196197 if (!EF)
197198 return EF.takeError ();
198199
199200 return std::unique_ptr<SubProcessFunctionExecutorImpl>(
200- new SubProcessFunctionExecutorImpl (State, std::move (*EF), Key));
201+ new SubProcessFunctionExecutorImpl (State, std::move (*EF), Key,
202+ BenchmarkProcessCPU));
201203 }
202204
203205private:
204206 SubProcessFunctionExecutorImpl (const LLVMState &State,
205207 ExecutableFunction Function,
206- const BenchmarkKey &Key)
207- : State(State), Function(std::move(Function)), Key(Key) {}
208+ const BenchmarkKey &Key,
209+ std::optional<int > BenchmarkCPU)
210+ : State(State), Function(std::move(Function)), Key(Key),
211+ BenchmarkProcessCPU (BenchmarkCPU) {}
208212
/// Exit codes the forked child process uses to report why it terminated
/// before running the benchmark. Values start at 1 (presumably so that 0
/// keeps its usual "success" meaning -- confirm against the parent-side
/// handling).
enum ChildProcessExitCodeE {
  CounterFDReadFailed = 1,
  RSeqDisableFailed = 2,
  // Mapping memory for the assembled snippet failed.
  FunctionDataMappingFailed = 3,
  // Setting up auxiliary memory failed.
  AuxiliaryMemorySetupFailed = 4,
  // Pinning the benchmarking process to the requested CPU failed.
  SetCPUAffinityFailed = 5
};
215220
216221 StringRef childProcessExitCodeToString (int ExitCode) const {
@@ -223,6 +228,8 @@ class SubProcessFunctionExecutorImpl
223228 return " Failed to map memory for assembled snippet" ;
224229 case ChildProcessExitCodeE::AuxiliaryMemorySetupFailed:
225230 return " Failed to setup auxiliary memory" ;
231+ case ChildProcessExitCodeE::SetCPUAffinityFailed:
232+ return " Failed to set CPU affinity of the benchmarking process" ;
226233 default :
227234 return " Child process returned with unknown exit code" ;
228235 }
@@ -384,6 +391,29 @@ class SubProcessFunctionExecutorImpl
384391 return make_error<SnippetSignal>(ChildSignalInfo.si_signo );
385392 }
386393
394+ static void setCPUAffinityIfRequested (int CPUToUse) {
395+ // Set the CPU affinity for the child process, so that we ensure that if
396+ // the user specified a CPU the process should run on, the benchmarking
397+ // process is running on that CPU.
398+ cpu_set_t CPUMask;
399+ CPU_ZERO (&CPUMask);
400+ CPU_SET (CPUToUse, &CPUMask);
401+ // TODO(boomanaiden154): Rewrite this to use LLVM primitives once they
402+ // are available.
403+ int SetAffinityReturn = sched_setaffinity (0 , sizeof (CPUMask), &CPUMask);
404+ if (SetAffinityReturn == -1 ) {
405+ exit (ChildProcessExitCodeE::SetCPUAffinityFailed);
406+ }
407+
408+ // Check (if assertions are enabled) that we are actually running on the
409+ // CPU that was specified by the user.
410+ unsigned int CurrentCPU;
411+ assert (getcpu (&CurrentCPU, nullptr ) == 0 &&
412+ " Expected getcpu call to succeed." );
413+ assert (static_cast <int >(CurrentCPU) == CPUToUse &&
414+ " Expected current CPU to equal the CPU requested by the user" );
415+ }
416+
387417 Error createSubProcessAndRunBenchmark (
388418 StringRef CounterName, SmallVectorImpl<int64_t > &CounterValues,
389419 ArrayRef<const char *> ValidationCounters,
@@ -416,6 +446,10 @@ class SubProcessFunctionExecutorImpl
416446 }
417447
418448 if (ParentOrChildPID == 0 ) {
449+ if (BenchmarkProcessCPU.has_value ()) {
450+ setCPUAffinityIfRequested (*BenchmarkProcessCPU);
451+ }
452+
419453 // We are in the child process, close the write end of the pipe.
420454 close (PipeFiles[1 ]);
421455 // Unregister handlers, signal handling is now handled through ptrace in
@@ -538,6 +572,7 @@ class SubProcessFunctionExecutorImpl
538572 const LLVMState &State;
539573 const ExecutableFunction Function;
540574 const BenchmarkKey &Key;
575+ const std::optional<int > BenchmarkProcessCPU;
541576};
542577#endif // __linux__
543578} // namespace
@@ -615,11 +650,15 @@ BenchmarkRunner::getRunnableConfiguration(
615650Expected<std::unique_ptr<BenchmarkRunner::FunctionExecutor>>
616651BenchmarkRunner::createFunctionExecutor (
617652 object::OwningBinary<object::ObjectFile> ObjectFile,
618- const BenchmarkKey &Key) const {
653+ const BenchmarkKey &Key, std::optional< int > BenchmarkProcessCPU ) const {
619654 switch (ExecutionMode) {
620655 case ExecutionModeE::InProcess: {
656+ if (BenchmarkProcessCPU.has_value ())
657+ return make_error<Failure>(" The inprocess execution mode does not "
658+ " support benchmark core pinning." );
659+
621660 auto InProcessExecutorOrErr = InProcessFunctionExecutorImpl::create (
622- State, std::move (ObjectFile), Scratch.get ());
661+ State, std::move (ObjectFile), Scratch.get (), BenchmarkProcessCPU );
623662 if (!InProcessExecutorOrErr)
624663 return InProcessExecutorOrErr.takeError ();
625664
@@ -628,7 +667,7 @@ BenchmarkRunner::createFunctionExecutor(
628667 case ExecutionModeE::SubProcess: {
629668#ifdef __linux__
630669 auto SubProcessExecutorOrErr = SubProcessFunctionExecutorImpl::create (
631- State, std::move (ObjectFile), Key);
670+ State, std::move (ObjectFile), Key, BenchmarkProcessCPU );
632671 if (!SubProcessExecutorOrErr)
633672 return SubProcessExecutorOrErr.takeError ();
634673
@@ -643,8 +682,8 @@ BenchmarkRunner::createFunctionExecutor(
643682}
644683
645684std::pair<Error, Benchmark> BenchmarkRunner::runConfiguration (
646- RunnableConfiguration &&RC,
647- const std::optional<StringRef> &DumpFile ) const {
685+ RunnableConfiguration &&RC, const std::optional<StringRef> &DumpFile,
686+ std::optional<int > BenchmarkProcessCPU ) const {
648687 Benchmark &BenchmarkResult = RC.BenchmarkResult ;
649688 object::OwningBinary<object::ObjectFile> &ObjectFile = RC.ObjectFile ;
650689
@@ -665,7 +704,8 @@ std::pair<Error, Benchmark> BenchmarkRunner::runConfiguration(
665704 }
666705
667706 Expected<std::unique_ptr<BenchmarkRunner::FunctionExecutor>> Executor =
668- createFunctionExecutor (std::move (ObjectFile), RC.BenchmarkResult .Key );
707+ createFunctionExecutor (std::move (ObjectFile), RC.BenchmarkResult .Key ,
708+ BenchmarkProcessCPU);
669709 if (!Executor)
670710 return {Executor.takeError (), std::move (BenchmarkResult)};
671711 auto NewMeasurements = runMeasurements (**Executor);
0 commit comments