//===--- Compilation.cpp - Compilation Task Data Structure ----------------===// // // This source file is part of the Swift.org open source project // // Copyright (c) 2014 - 2018 Apple Inc. and the Swift project authors // Licensed under Apache License v2.0 with Runtime Library Exception // // See https://swift.org/LICENSE.txt for license information // See https://swift.org/CONTRIBUTORS.txt for the list of Swift project authors // //===----------------------------------------------------------------------===// #include "swift/Driver/Compilation.h" #include "swift/AST/DiagnosticEngine.h" #include "swift/AST/DiagnosticsDriver.h" #include "swift/AST/FineGrainedDependencies.h" #include "swift/AST/FineGrainedDependencyFormat.h" #include "swift/Basic/Assertions.h" #include "swift/Basic/OutputFileMap.h" #include "swift/Basic/ParseableOutput.h" #include "swift/Basic/Program.h" #include "swift/Basic/STLExtras.h" #include "swift/Basic/Statistic.h" #include "swift/Basic/TaskQueue.h" #include "swift/Basic/Version.h" #include "swift/Basic/type_traits.h" #include "swift/Driver/Action.h" #include "swift/Driver/Driver.h" #include "swift/Driver/Job.h" #include "swift/Driver/ToolChain.h" #include "swift/Option/Options.h" #include "llvm/ADT/DenseSet.h" #include "llvm/ADT/MapVector.h" #include "llvm/ADT/SetVector.h" #include "llvm/ADT/StringExtras.h" #include "llvm/ADT/TinyPtrVector.h" #include "llvm/Option/Arg.h" #include "llvm/Option/ArgList.h" #include "llvm/Support/Chrono.h" #include "llvm/Support/Compiler.h" #include "llvm/Support/FileSystem.h" #include "llvm/Support/Path.h" #include "llvm/Support/Timer.h" #include "llvm/Support/YAMLParser.h" #include "llvm/Support/raw_ostream.h" #include #include #if defined(_WIN32) #include #include #endif #define DEBUG_TYPE "batch-mode" // Batch-mode has a sub-mode for testing that randomizes batch partitions, // by user-provided seed. That is the only thing randomized here. #include using namespace swift; using namespace swift::sys; using namespace swift::driver; using namespace swift::parseable_output; using namespace llvm::opt; struct LogJob { const Job *j; LogJob(const Job *j) : j(j) {} }; struct LogJobArray { const ArrayRef js; LogJobArray(const ArrayRef js) : js(js) {} }; struct LogJobSet { const SmallPtrSetImpl &js; LogJobSet(const SmallPtrSetImpl &js) : js(js) {} }; llvm::raw_ostream &operator<<(llvm::raw_ostream &os, const LogJob &lj) { lj.j->printSummary(os); return os; } llvm::raw_ostream &operator<<(llvm::raw_ostream &os, const LogJobArray &ljs) { os << "["; interleave(ljs.js, [&](Job const *j) { os << LogJob(j); }, [&]() { os << ' '; }); os << "]"; return os; } llvm::raw_ostream &operator<<(llvm::raw_ostream &os, const LogJobSet &ljs) { os << "{"; interleave(ljs.js, [&](Job const *j) { os << LogJob(j); }, [&]() { os << ' '; }); os << "}"; return os; } // clang-format off Compilation::Compilation(DiagnosticEngine &Diags, const ToolChain &TC, OutputInfo const &OI, OutputLevel Level, std::unique_ptr InputArgs, std::unique_ptr TranslatedArgs, InputFileList InputsWithTypes, size_t FilelistThreshold, bool EnableBatchMode, unsigned BatchSeed, std::optional BatchCount, std::optional BatchSizeLimit, bool SaveTemps, bool ShowDriverTimeCompilation, std::unique_ptr StatsReporter, bool OnlyOneDependencyFile) : Diags(Diags), TheToolChain(TC), TheOutputInfo(OI), Level(Level), RawInputArgs(std::move(InputArgs)), TranslatedArgs(std::move(TranslatedArgs)), InputFilesWithTypes(std::move(InputsWithTypes)), EnableBatchMode(EnableBatchMode), BatchSeed(BatchSeed), BatchCount(BatchCount), BatchSizeLimit(BatchSizeLimit), SaveTemps(SaveTemps), ShowDriverTimeCompilation(ShowDriverTimeCompilation), Stats(std::move(StatsReporter)), FilelistThreshold(FilelistThreshold), OnlyOneDependencyFile(OnlyOneDependencyFile) { } // clang-format on static bool writeFilelistIfNecessary(const Job *job, const ArgList &args, DiagnosticEngine &diags); using CommandSetVector = llvm::SetVector; using BatchPartition = std::vector>; namespace { static DetailedTaskDescription constructDetailedTaskDescription(const driver::Job &Cmd) { std::string Executable = Cmd.getExecutable(); SmallVector Arguments; std::string CommandLine; SmallVector Inputs; SmallVector Outputs; for (const auto &A : Cmd.getArguments()) { Arguments.push_back(A); } llvm::raw_string_ostream wrapper(CommandLine); Cmd.printCommandLine(wrapper, ""); wrapper.flush(); for (const Action *A : Cmd.getSource().getInputs()) { if (const auto *IA = dyn_cast(A)) Inputs.push_back(CommandInput(IA->getInputArg().getValue())); } for (const driver::Job *J : Cmd.getInputs()) { auto OutFiles = J->getOutput().getPrimaryOutputFilenames(); if (const auto *BJAction = dyn_cast(&Cmd.getSource())) { Inputs.push_back(CommandInput(OutFiles[BJAction->getInputIndex()])); } else { for (llvm::StringRef FileName : OutFiles) { Inputs.push_back(CommandInput(FileName)); } } } // TODO: set up Outputs appropriately. file_types::ID PrimaryOutputType = Cmd.getOutput().getPrimaryOutputType(); if (PrimaryOutputType != file_types::TY_Nothing) { for (llvm::StringRef OutputFileName : Cmd.getOutput().getPrimaryOutputFilenames()) { Outputs.push_back(OutputPair(PrimaryOutputType, OutputFileName.str())); } } file_types::forAllTypes([&](file_types::ID Ty) { for (auto Output : Cmd.getOutput().getAdditionalOutputsForType(Ty)) { Outputs.push_back(OutputPair(Ty, Output.str())); } }); return DetailedTaskDescription{Executable, Arguments, CommandLine, Inputs, Outputs}; } } // namespace namespace swift { namespace driver { class PerformJobsState { /// The containing Compilation object. Compilation &Comp; /// All jobs which have been scheduled for execution (whether or not /// they've finished execution), or which have been determined that they /// don't need to run. CommandSet ScheduledCommands; /// A temporary buffer to hold commands that were scheduled but haven't been /// added to the Task Queue yet, because we might try batching them together /// first. CommandSetVector PendingExecution; /// Set of synthetic BatchJobs that serve to cluster subsets of jobs waiting /// in PendingExecution. Also used to identify (then unpack) BatchJobs back /// to their underlying non-Batch Jobs, when running a callback from /// TaskQueue. CommandSet BatchJobs; /// Persistent counter for allocating quasi-PIDs to Jobs combined into /// BatchJobs. Quasi-PIDs are _negative_ PID-like unique keys used to /// masquerade BatchJob constituents as (quasi)processes, when writing /// parseable output to consumers that don't understand the idea of a batch /// job. They are negative in order to avoid possibly colliding with real /// PIDs (which are always positive). We start at -1000 here as a crude but /// harmless hedge against colliding with an errno value that might slip /// into the stream of real PIDs (say, due to a TaskQueue bug). int64_t NextBatchQuasiPID = parseable_output::QUASI_PID_START; /// All jobs which have finished execution or which have been determined /// that they don't need to run. CommandSet FinishedCommands; /// A map from a Job to the commands it is known to be blocking. /// /// The blocked jobs should be scheduled as soon as possible. llvm::SmallDenseMap, 16> BlockingCommands; /// A map from commands that didn't get to run to whether or not they affect /// downstream commands. /// /// Only intended for source files. llvm::SmallDenseMap UnfinishedCommands; private: /// TaskQueue for execution. std::unique_ptr TQ; /// Cumulative result of PerformJobs(), accumulated from subprocesses. int ResultCode = EXIT_SUCCESS; /// True if any Job crashed. bool AnyAbnormalExit = false; /// Timers for monitoring execution time of subprocesses. llvm::TimerGroup DriverTimerGroup {"driver", "Driver Compilation Time"}; llvm::SmallDenseMap, 16> DriverTimers; const Job *findUnfinishedJob(ArrayRef JL) { for (const Job *Cmd : JL) { if (!FinishedCommands.count(Cmd)) return Cmd; } return nullptr; } /// Schedule the given Job if it has not been scheduled and if all of /// its inputs are in FinishedCommands. void scheduleCommandIfNecessaryAndPossible(const Job *Cmd) { if (ScheduledCommands.count(Cmd)) { if (Comp.getShowJobLifecycle()) { llvm::outs() << "Already scheduled: " << LogJob(Cmd) << "\n"; } return; } if (auto Blocking = findUnfinishedJob(Cmd->getInputs())) { BlockingCommands[Blocking].push_back(Cmd); if (Comp.getShowJobLifecycle()) { llvm::outs() << "Blocked by: " << LogJob(Blocking) << ", now blocking jobs: " << LogJobArray(BlockingCommands[Blocking]) << "\n"; } return; } // Adding to scheduled means we've committed to its completion (not // distinguished from skipping). We never remove it once inserted. ScheduledCommands.insert(Cmd); // Adding to pending means it should be in the next round of additions to // the task queue (either batched or singularly); we remove Jobs from // PendingExecution once we hand them over to the TaskQueue. PendingExecution.insert(Cmd); } // Sort for ease of testing template void scheduleCommandsInSortedOrder(const Jobs &jobs) { llvm::SmallVector sortedJobs; Comp.sortJobsToMatchCompilationInputs(jobs, sortedJobs); for (const Job *Cmd : sortedJobs) scheduleCommandIfNecessaryAndPossible(Cmd); } void addPendingJobToTaskQueue(const Job *Cmd) { // FIXME: Failing here should not take down the whole process. bool success = writeFilelistIfNecessary(Cmd, Comp.getArgs(), Comp.getDiags()); assert(success && "failed to write filelist"); (void)success; assert(Cmd->getExtraEnvironment().empty() && "not implemented for compilations with multiple jobs"); if (Comp.getShowJobLifecycle()) llvm::outs() << "Added to TaskQueue: " << LogJob(Cmd) << "\n"; TQ->addTask(Cmd->getExecutable(), Cmd->getArgumentsForTaskExecution(), std::nullopt, (void *)Cmd); } /// When a task finishes, check other Jobs that may be blocked. void markFinished(const Job *Cmd, bool Skipped=false) { if (Comp.getShowJobLifecycle()) { llvm::outs() << "Job " << (Skipped ? "skipped" : "finished") << ": " << LogJob(Cmd) << "\n"; } FinishedCommands.insert(Cmd); if (auto *Stats = Comp.getStatsReporter()) { auto &D = Stats->getDriverCounters(); if (Skipped) ++D.NumDriverJobsSkipped; else ++D.NumDriverJobsRun; } auto BlockedIter = BlockingCommands.find(Cmd); if (BlockedIter != BlockingCommands.end()) { auto AllBlocked = std::move(BlockedIter->second); if (Comp.getShowJobLifecycle()) { llvm::outs() << "Scheduling maybe-unblocked jobs: " << LogJobArray(AllBlocked) << "\n"; } BlockingCommands.erase(BlockedIter); scheduleCommandsInSortedOrder(AllBlocked); } } bool isBatchJob(const Job *MaybeBatchJob) const { return BatchJobs.count(MaybeBatchJob) != 0; } /// Callback which will be called immediately after a task has started. This /// callback may be used to provide output indicating that the task began. void taskBegan(ProcessId Pid, void *Context) { // TODO: properly handle task began. const Job *BeganCmd = (const Job *)Context; if (Comp.getShowDriverTimeCompilation()) { llvm::SmallString<128> TimerName; llvm::raw_svector_ostream OS(TimerName); OS << LogJob(BeganCmd); DriverTimers.insert({ BeganCmd, std::unique_ptr( new llvm::Timer("task", OS.str(), DriverTimerGroup)) }); DriverTimers[BeganCmd]->startTimer(); } switch (Comp.getOutputLevel()) { case OutputLevel::Normal: break; // For command line or verbose output, print out each command as it // begins execution. case OutputLevel::PrintJobs: BeganCmd->printCommandLineAndEnvironment(llvm::outs()); break; case OutputLevel::Verbose: BeganCmd->printCommandLine(llvm::errs()); break; case OutputLevel::Parseable: BeganCmd->forEachContainedJobAndPID(Pid, [&](const Job *J, Job::PID P) { auto TascDesc = constructDetailedTaskDescription(*J); parseable_output::emitBeganMessage(llvm::errs(), J->getSource().getClassName(), TascDesc, P, TaskProcessInformation(Pid)); }); break; } } /// Check to see if a job produced a zero-length serialized diagnostics /// file, which is used to indicate batch-constituents that were batched /// together with a failing constituent but did not, themselves, produce any /// errors. bool jobWasBatchedWithFailingJobs(const Job *J) const { auto DiaPath = J->getOutput().getAnyOutputForType(file_types::TY_SerializedDiagnostics); if (DiaPath.empty()) return false; if (!llvm::sys::fs::is_regular_file(DiaPath)) return false; uint64_t Size; auto EC = llvm::sys::fs::file_size(DiaPath, Size); if (EC) return false; return Size == 0; } /// If a batch-constituent job happens to be batched together with a job /// that exits with an error, the batch-constituent may be considered /// "cancelled". bool jobIsCancelledBatchConstituent(int ReturnCode, const Job *ContainerJob, const Job *ConstituentJob) { return ReturnCode != 0 && isBatchJob(ContainerJob) && jobWasBatchedWithFailingJobs(ConstituentJob); } /// Unpack a \c BatchJob that has finished into its constituent \c Job /// members, and call \c taskFinished on each, propagating any \c /// TaskFinishedResponse other than \c /// TaskFinishedResponse::ContinueExecution from any of the constituent /// calls. TaskFinishedResponse unpackAndFinishBatch(int ReturnCode, StringRef Output, StringRef Errors, const BatchJob *B) { if (Comp.getShowJobLifecycle()) llvm::outs() << "Batch job finished: " << LogJob(B) << "\n"; auto res = TaskFinishedResponse::ContinueExecution; for (const Job *J : B->getCombinedJobs()) { if (Comp.getShowJobLifecycle()) llvm::outs() << " ==> Unpacked batch constituent finished: " << LogJob(J) << "\n"; auto r = taskFinished( llvm::sys::ProcessInfo::InvalidPid, ReturnCode, Output, Errors, TaskProcessInformation(llvm::sys::ProcessInfo::InvalidPid), (void *)J); if (r != TaskFinishedResponse::ContinueExecution) res = r; } return res; } void emitParseableOutputForEachFinishedJob(ProcessId Pid, int ReturnCode, StringRef Output, const Job *FinishedCmd, TaskProcessInformation ProcInfo) { FinishedCmd->forEachContainedJobAndPID(Pid, [&](const Job *J, Job::PID P) { if (jobIsCancelledBatchConstituent(ReturnCode, FinishedCmd, J)) { // Simulate SIGINT-interruption to parseable-output consumer for any // constituent of a failing batch job that produced no errors of its // own. parseable_output::emitSignalledMessage(llvm::errs(), J->getSource().getClassName(), "cancelled batch constituent", "", SIGINT, P, ProcInfo); } else { parseable_output::emitFinishedMessage(llvm::errs(), J->getSource().getClassName(), Output.str(), ReturnCode, P, ProcInfo); } }); } /// Callback which will be called immediately after a task has finished /// execution. Determines if execution should continue, and also schedule /// any additional Jobs which we now know we need to run. TaskFinishedResponse taskFinished(ProcessId Pid, int ReturnCode, StringRef Output, StringRef Errors, TaskProcessInformation ProcInfo, void *Context) { const Job *const FinishedCmd = (const Job *)Context; if (Pid != llvm::sys::ProcessInfo::InvalidPid) { if (Comp.getShowDriverTimeCompilation()) { DriverTimers[FinishedCmd]->stopTimer(); } processOutputOfFinishedProcess(Pid, ReturnCode, FinishedCmd, Output, ProcInfo); } if (Comp.getStatsReporter() && ProcInfo.getResourceUsage().has_value()) Comp.getStatsReporter()->recordJobMaxRSS( ProcInfo.getResourceUsage()->Maxrss); if (isBatchJob(FinishedCmd)) { return unpackAndFinishBatch(ReturnCode, Output, Errors, static_cast(FinishedCmd)); } if (ReturnCode != EXIT_SUCCESS) return taskFailed(FinishedCmd, ReturnCode); // When a task finishes, we need to reevaluate the other commands that // might have been blocked. markFinished(FinishedCmd); return TaskFinishedResponse::ContinueExecution; } TaskFinishedResponse taskFailed(const Job *FinishedCmd, const int ReturnCode) { // The task failed, so return true without performing any further // dependency analysis. // Store this task's ReturnCode as our Result if we haven't stored // anything yet. if (ResultCode == EXIT_SUCCESS) ResultCode = ReturnCode; if (!isa(FinishedCmd->getSource()) || ReturnCode != EXIT_FAILURE) { Comp.getDiags().diagnose(SourceLoc(), diag::error_command_failed, FinishedCmd->getSource().getClassName(), ReturnCode); } // See how ContinueBuildingAfterErrors gets set up in Driver.cpp for // more info. assert((Comp.getContinueBuildingAfterErrors() || !Comp.getBatchModeEnabled()) && "batch mode diagnostics require ContinueBuildingAfterErrors"); return Comp.getContinueBuildingAfterErrors() ? TaskFinishedResponse::ContinueExecution : TaskFinishedResponse::StopExecution; } #if defined(_WIN32) struct FileBinaryModeRAII { FileBinaryModeRAII(FILE *F) : F(F) { PrevMode = _setmode(_fileno(F), _O_BINARY); } ~FileBinaryModeRAII() { _setmode(_fileno(F), PrevMode); } FILE *F; int PrevMode; }; #else struct FileBinaryModeRAII { FileBinaryModeRAII(FILE *) {} }; #endif void processOutputOfFinishedProcess(ProcessId Pid, int ReturnCode, const Job *const FinishedCmd, StringRef Output, TaskProcessInformation ProcInfo) { switch (Comp.getOutputLevel()) { case OutputLevel::PrintJobs: // Only print the jobs, not the outputs break; case OutputLevel::Normal: case OutputLevel::Verbose: // Send the buffered output to stderr, though only if we // support getting buffered output. if (TaskQueue::supportsBufferingOutput()) { // Temporarily change stderr to binary mode to avoid double // LF -> CR LF conversions on the outputs from child // processes, which have already this conversion appplied. // This makes a difference only for Windows. FileBinaryModeRAII F(stderr); llvm::errs() << Output; } break; case OutputLevel::Parseable: emitParseableOutputForEachFinishedJob(Pid, ReturnCode, Output, FinishedCmd, ProcInfo); break; } } TaskFinishedResponse taskSignalled(ProcessId Pid, StringRef ErrorMsg, StringRef Output, StringRef Errors, void *Context, std::optional Signal, TaskProcessInformation ProcInfo) { const Job *SignalledCmd = (const Job *)Context; if (Comp.getShowDriverTimeCompilation()) { DriverTimers[SignalledCmd]->stopTimer(); } if (Comp.getOutputLevel() == OutputLevel::Parseable) { // Parseable output was requested. SignalledCmd->forEachContainedJobAndPID(Pid, [&](const Job *J, Job::PID P) { parseable_output::emitSignalledMessage(llvm::errs(), J->getSource().getClassName(), ErrorMsg, Output, Signal, P, ProcInfo); }); } else { // Otherwise, send the buffered output to stderr, though only if we // support getting buffered output. if (TaskQueue::supportsBufferingOutput()) llvm::errs() << Output; } if (Comp.getStatsReporter() && ProcInfo.getResourceUsage().has_value()) Comp.getStatsReporter()->recordJobMaxRSS( ProcInfo.getResourceUsage()->Maxrss); if (!ErrorMsg.empty()) Comp.getDiags().diagnose(SourceLoc(), diag::error_unable_to_execute_command, ErrorMsg); if (Signal.has_value()) { Comp.getDiags().diagnose(SourceLoc(), diag::error_command_signalled, SignalledCmd->getSource().getClassName(), Signal.value()); } else { Comp.getDiags() .diagnose(SourceLoc(), diag::error_command_signalled_without_signal_number, SignalledCmd->getSource().getClassName()); } // Since the task signalled, unconditionally set result to -2. ResultCode = -2; AnyAbnormalExit = true; return TaskFinishedResponse::StopExecution; } public: PerformJobsState(Compilation &Comp, std::unique_ptr &&TaskQueue) : Comp(Comp), TQ(std::move(TaskQueue)) {} /// Schedule and run initial, additional, and batch jobs. void runJobs() { scheduleJobsBeforeBatching(); formBatchJobsAndAddPendingJobsToTaskQueue(); runTaskQueueToCompletion(); } private: void scheduleJobsBeforeBatching() { scheduleJobsForNonIncrementalCompilation(); } void scheduleJobsForNonIncrementalCompilation() { for (const Job *Cmd : Comp.getJobs()) scheduleCommandIfNecessaryAndPossible(Cmd); } /// Insert all jobs in \p Cmds (of descriptive name \p Kind) to the \c /// TaskQueue, and clear \p Cmds. template void transferJobsToTaskQueue(Container &Cmds, StringRef Kind) { for (const Job *Cmd : Cmds) { if (Comp.getShowJobLifecycle()) llvm::outs() << "Adding " << Kind << " job to task queue: " << LogJob(Cmd) << "\n"; addPendingJobToTaskQueue(Cmd); } Cmds.clear(); } /// Partition the jobs in \c PendingExecution into those that are \p /// Batchable and those that are \p NonBatchable, clearing \p /// PendingExecution. void getPendingBatchableJobs(CommandSetVector &Batchable, CommandSetVector &NonBatchable) { for (const Job *Cmd : PendingExecution) { if (Comp.getToolChain().jobIsBatchable(Comp, Cmd)) { if (Comp.getShowJobLifecycle()) llvm::outs() << "Batchable: " << LogJob(Cmd) << "\n"; Batchable.insert(Cmd); } else { if (Comp.getShowJobLifecycle()) llvm::outs() << "Not batchable: " << LogJob(Cmd) << "\n"; NonBatchable.insert(Cmd); } } } /// If \p Batch is nonempty, construct a new \c BatchJob from its /// contents by calling \p ToolChain::constructBatchJob, then insert the /// new \c BatchJob into \p Batches. void formBatchJobFromPartitionBatch(std::vector &Batches, std::vector const &Batch) { if (Batch.empty()) return; if (Comp.getShowJobLifecycle()) llvm::outs() << "Forming batch job from " << Batch.size() << " constituents\n"; auto const &TC = Comp.getToolChain(); auto J = TC.constructBatchJob(Batch, NextBatchQuasiPID, Comp); if (J) Batches.push_back(Comp.addJob(std::move(J))); } /// Build a vector of partition indices, one per Job: the i'th index says /// which batch of the partition the i'th Job will be assigned to. If we are /// shuffling due to -driver-batch-seed, the returned indices will not be /// arranged in contiguous runs. We shuffle partition-indices here, not /// elements themselves, to preserve the invariant that each batch is a /// subsequence of the full set of inputs, not just a subset. std::vector assignJobsToPartitions(size_t PartitionSize, size_t NumJobs) { size_t Remainder = NumJobs % PartitionSize; size_t TargetSize = NumJobs / PartitionSize; std::vector PartitionIndex; PartitionIndex.reserve(NumJobs); for (size_t P = 0; P < PartitionSize; ++P) { // Spread remainder evenly across partitions by adding 1 to the target // size of the first Remainder of them. size_t FillCount = TargetSize + ((P < Remainder) ? 1 : 0); std::fill_n(std::back_inserter(PartitionIndex), FillCount, P); } if (Comp.getBatchSeed() != 0) { std::minstd_rand gen(Comp.getBatchSeed()); std::shuffle(PartitionIndex.begin(), PartitionIndex.end(), gen); } assert(PartitionIndex.size() == NumJobs); return PartitionIndex; } /// Create \c NumberOfParallelCommands batches and assign each job to a /// batch either filling each partition in order or, if seeded with a /// nonzero value, pseudo-randomly (but deterministically and nearly-evenly). void partitionIntoBatches(const llvm::SmallVectorImpl &Batchable, BatchPartition &Partition) { if (Comp.getShowJobLifecycle()) { llvm::outs() << "Found " << Batchable.size() << " batchable jobs\n"; llvm::outs() << "Forming into " << Partition.size() << " batches\n"; } assert(!Partition.empty()); auto PartitionIndex = assignJobsToPartitions(Partition.size(), Batchable.size()); assert(PartitionIndex.size() == Batchable.size()); auto const &TC = Comp.getToolChain(); for_each(Batchable, PartitionIndex, [&](const Job *Cmd, size_t Idx) { assert(Idx < Partition.size()); std::vector &P = Partition[Idx]; if (P.empty() || TC.jobsAreBatchCombinable(Comp, P[0], Cmd)) { if (Comp.getShowJobLifecycle()) llvm::outs() << "Adding " << LogJob(Cmd) << " to batch " << Idx << '\n'; P.push_back(Cmd); } else { // Strange but theoretically possible that we have a batchable job // that's not combinable with others; tack a new batch on for it. if (Comp.getShowJobLifecycle()) llvm::outs() << "Adding " << LogJob(Cmd) << " to new batch " << Partition.size() << '\n'; Partition.push_back(std::vector()); Partition.back().push_back(Cmd); } }); } // Selects the number of partitions based on the user-provided batch // count and/or the number of parallel tasks we can run, subject to a // fixed per-batch safety cap, to avoid overcommitting memory. size_t pickNumberOfPartitions() { // If the user asked for something, use that. if (Comp.getBatchCount().has_value()) return Comp.getBatchCount().value(); // This is a long comment to justify a simple calculation. // // Because there is a secondary "outer" build system potentially also // scheduling multiple drivers in parallel on separate build targets // -- while we, the driver, schedule our own subprocesses -- we might // be creating up to $NCPU^2 worth of _memory pressure_. // // Oversubscribing CPU is typically no problem these days, but // oversubscribing memory can lead to paging, which on modern systems // is quite bad. // // In practice, $NCPU^2 processes doesn't _quite_ happen: as core // count rises, it usually exceeds the number of large targets // without any dependencies between them (which are the only thing we // have to worry about): you might have (say) 2 large independent // modules * 2 architectures, but that's only an $NTARGET value of 4, // which is much less than $NCPU if you're on a 24 or 36-way machine. // // So the actual number of concurrent processes is: // // NCONCUR := $NCPU * min($NCPU, $NTARGET) // // Empirically, a frontend uses about 512kb RAM per non-primary file // and about 10mb per primary. The number of non-primaries per // process is a constant in a given module, but the number of // primaries -- the "batch size" -- is inversely proportional to the // batch count (default: $NCPU). As a result, the memory pressure // we can expect is: // // $NCONCUR * (($NONPRIMARYMEM * $NFILE) + // ($PRIMARYMEM * ($NFILE/$NCPU))) // // If we tabulate this across some plausible values, we see // unfortunate memory-pressure results: // // $NFILE // +--------------------- // $NTARGET $NCPU | 100 500 1000 // ----------------+--------------------- // 2 2 | 2gb 11gb 22gb // 4 4 | 4gb 24gb 48gb // 4 8 | 5gb 28gb 56gb // 4 16 | 7gb 36gb 72gb // 4 36 | 11gb 56gb 112gb // // As it happens, the lower parts of the table are dominated by // number of processes rather than the files-per-batch (the batches // are already quite small due to the high core count) and the left // side of the table is dealing with modules too small to worry // about. But the middle and upper-right quadrant is problematic: 4 // and 8 core machines do not typically have 24-48gb of RAM, it'd be // nice not to page on them when building a 4-target project with // 500-file modules. // // Turns we can do that if we just cap the batch size statically at, // say, 25 files per batch, we get a better formula: // // $NCONCUR * (($NONPRIMARYMEM * $NFILE) + // ($PRIMARYMEM * min(25, ($NFILE/$NCPU)))) // // $NFILE // +--------------------- // $NTARGET $NCPU | 100 500 1000 // ----------------+--------------------- // 2 2 | 1gb 2gb 3gb // 4 4 | 4gb 8gb 12gb // 4 8 | 5gb 16gb 24gb // 4 16 | 7gb 32gb 48gb // 4 36 | 11gb 56gb 108gb // // This means that the "performance win" of batch mode diminishes // slightly: the batching factor in the equation drops from // ($NFILE/$NCPU) to min(25, $NFILE/$NCPU). In practice this seems to // not cost too much: the additional factor in number of subprocesses // run is the following: // // $NFILE // +--------------------- // $NTARGET $NCPU | 100 500 1000 // ----------------+--------------------- // 2 2 | 2x 10x 20x // 4 4 | - 5x 10x // 4 8 | - 2.5x 5x // 4 16 | - 1.25x 2.5x // 4 36 | - - 1.1x // // Where - means "no difference" because the batches were already // smaller than 25. // // Even in the worst case here, the 1000-file module on 2-core // machine is being built with only 40 subprocesses, rather than the // pre-batch-mode 1000. I.e. it's still running 96% fewer // subprocesses than before. And significantly: it's doing so while // not exceeding the RAM of a typical 2-core laptop. // An explanation of why the partition calculation isn't integer division. // Using an example, a module of 26 files exceeds the limit of 25 and must // be compiled in 2 batches. Integer division yields 26/25 = 1 batch, but // a single batch of 26 exceeds the limit. The calculation must round up, // which can be calculated using: `(x + y - 1) / y` auto DivideRoundingUp = [](size_t Num, size_t Div) -> size_t { return (Num + Div - 1) / Div; }; size_t DefaultSizeLimit = 25; size_t NumTasks = TQ->getNumberOfParallelTasks(); size_t NumFiles = PendingExecution.size(); size_t SizeLimit = Comp.getBatchSizeLimit().value_or(DefaultSizeLimit); return std::max(NumTasks, DivideRoundingUp(NumFiles, SizeLimit)); } /// Select jobs that are batch-combinable from \c PendingExecution, combine /// them together into \p BatchJob instances (also inserted into \p /// BatchJobs), and enqueue all \c PendingExecution jobs (whether batched or /// not) into the \c TaskQueue for execution. void formBatchJobsAndAddPendingJobsToTaskQueue() { // If batch mode is not enabled, just transfer the set of pending jobs to // the task queue, as-is. if (!Comp.getBatchModeEnabled()) { transferJobsToTaskQueue(PendingExecution, "standard"); return; } size_t NumPartitions = pickNumberOfPartitions(); CommandSetVector Batchable, NonBatchable; std::vector Batches; // Split the batchable from non-batchable pending jobs. getPendingBatchableJobs(Batchable, NonBatchable); // Partition the batchable jobs into sets. BatchPartition Partition(NumPartitions); partitionIntoBatches(Batchable.takeVector(), Partition); // Construct a BatchJob from each batch in the partition. for (auto const &Batch : Partition) { formBatchJobFromPartitionBatch(Batches, Batch); } PendingExecution.clear(); // Save batches so we can locate and decompose them on task-exit. for (const Job *Cmd : Batches) BatchJobs.insert(Cmd); // Enqueue the resulting jobs, batched and non-batched alike. transferJobsToTaskQueue(Batches, "batch"); transferJobsToTaskQueue(NonBatchable, "non-batch"); } void runTaskQueueToCompletion() { do { using namespace std::placeholders; // Ask the TaskQueue to execute. if (TQ->execute(std::bind(&PerformJobsState::taskBegan, this, _1, _2), std::bind(&PerformJobsState::taskFinished, this, _1, _2, _3, _4, _5, _6), std::bind(&PerformJobsState::taskSignalled, this, _1, _2, _3, _4, _5, _6, _7))) { if (ResultCode == EXIT_SUCCESS) { // FIXME: Error from task queue while Result == EXIT_SUCCESS most // likely means some fork/exec or posix_spawn failed; TaskQueue saw // "an error" at some stage before even calling us with a process // exit / signal (or else a poll failed); unfortunately the task // causing it was dropped on the floor and we have no way to recover // it here, so we report a very poor, generic error. Comp.getDiags().diagnose(SourceLoc(), diag::error_unable_to_execute_command, ""); ResultCode = -2; AnyAbnormalExit = true; return; } } // Returning without error from TaskQueue::execute should mean either an // empty TaskQueue or a failed subprocess. assert(!(ResultCode == 0 && TQ->hasRemainingTasks())); // Task-exit callbacks from TaskQueue::execute may have unblocked jobs, // which means there might be PendingExecution jobs to enqueue here. If // there are, we need to continue trying to make progress on the // TaskQueue before we start marking deferred jobs as skipped, below. if (!PendingExecution.empty() && ResultCode == 0) { formBatchJobsAndAddPendingJobsToTaskQueue(); continue; } // It's possible that by marking some jobs as skipped, we unblocked // some jobs and thus have entries in PendingExecution again; push // those through to the TaskQueue. formBatchJobsAndAddPendingJobsToTaskQueue(); // If we added jobs to the TaskQueue, and we are not in an error state, // we want to give the TaskQueue another run. } while (ResultCode == 0 && TQ->hasRemainingTasks()); } public: Compilation::Result takeResult() && { if (ResultCode == 0) ResultCode = Comp.getDiags().hadAnyError(); const bool hadAbnormalExit = hadAnyAbnormalExit(); const auto resultCode = ResultCode; return Compilation::Result{hadAbnormalExit, resultCode}; } bool hadAnyAbnormalExit() { return AnyAbnormalExit; } }; } // namespace driver } // namespace swift Compilation::~Compilation() = default; Job *Compilation::addJob(std::unique_ptr J) { Job *result = J.get(); Jobs.emplace_back(std::move(J)); return result; } Job *Compilation::addExternalJob(std::unique_ptr J) { Job *result = J.get(); ExternalJobs.emplace_back(std::move(J)); return result; } static void writeInputJobsToFilelist(llvm::raw_fd_ostream &out, const Job *job, const file_types::ID infoType) { // FIXME: Duplicated from ToolChains.cpp. for (const Job *input : job->getInputs()) { const CommandOutput &outputInfo = input->getOutput(); if (outputInfo.getPrimaryOutputType() == infoType) { for (auto &output : outputInfo.getPrimaryOutputFilenames()) out << output << "\n"; } else { auto output = outputInfo.getAnyOutputForType(infoType); if (!output.empty()) out << output << "\n"; } } } static void writeSourceInputActionsToFilelist(llvm::raw_fd_ostream &out, const Job *job, const ArgList &args) { // Ensure that -index-file-path works in conjunction with // -driver-use-filelists. It needs to be the only primary. if (Arg *A = args.getLastArg(options::OPT_index_file_path)) out << A->getValue() << "\n"; else { // The normal case for non-single-compile jobs. for (const Action *A : job->getSource().getInputs()) { // A could be a GeneratePCHJobAction if (!isa(A)) continue; const auto *IA = cast(A); out << IA->getInputArg().getValue() << "\n"; } } } static void writeOutputToFilelist(llvm::raw_fd_ostream &out, const Job *job, const file_types::ID infoType) { const CommandOutput &outputInfo = job->getOutput(); assert(outputInfo.getPrimaryOutputType() == infoType); for (auto &output : outputInfo.getPrimaryOutputFilenames()) out << output << "\n"; } static void writeIndexUnitOutputPathsToFilelist(llvm::raw_fd_ostream &out, const Job *job) { const CommandOutput &outputInfo = job->getOutput(); for (auto &output : outputInfo.getIndexUnitOutputFilenames()) out << output << "\n"; } static void writeSupplementaryOutputToFilelist(llvm::raw_fd_ostream &out, const Job *job) { job->getOutput().writeOutputFileMap(out); } static bool writeFilelistIfNecessary(const Job *job, const ArgList &args, DiagnosticEngine &diags) { bool ok = true; for (const FilelistInfo &filelistInfo : job->getFilelistInfos()) { if (filelistInfo.path.empty()) return true; std::error_code error; llvm::raw_fd_ostream out(filelistInfo.path, error, llvm::sys::fs::OF_None); if (out.has_error()) { out.clear_error(); diags.diagnose(SourceLoc(), diag::error_unable_to_make_temporary_file, error.message()); ok = false; continue; } switch (filelistInfo.whichFiles) { case FilelistInfo::WhichFiles::InputJobs: writeInputJobsToFilelist(out, job, filelistInfo.type); break; case FilelistInfo::WhichFiles::SourceInputActions: writeSourceInputActionsToFilelist(out, job, args); break; case FilelistInfo::WhichFiles::InputJobsAndSourceInputActions: writeInputJobsToFilelist(out, job, filelistInfo.type); writeSourceInputActionsToFilelist(out, job, args); break; case FilelistInfo::WhichFiles::Output: writeOutputToFilelist(out, job, filelistInfo.type); break; case FilelistInfo::WhichFiles::IndexUnitOutputPaths: writeIndexUnitOutputPathsToFilelist(out, job); break; case FilelistInfo::WhichFiles::SupplementaryOutput: writeSupplementaryOutputToFilelist(out, job); break; } } return ok; } Compilation::Result Compilation::performJobsImpl(std::unique_ptr &&TQ) { PerformJobsState State(*this, std::move(TQ)); State.runJobs(); return std::move(State).takeResult(); } Compilation::Result Compilation::performSingleCommand(const Job *Cmd) { assert(Cmd->getInputs().empty() && "This can only be used to run a single command with no inputs"); switch (Cmd->getCondition()) { case Job::Condition::CheckDependencies: return Compilation::Result::code(0); case Job::Condition::RunWithoutCascading: case Job::Condition::Always: case Job::Condition::NewlyAdded: break; } if (!writeFilelistIfNecessary(Cmd, *TranslatedArgs.get(), Diags)) return Compilation::Result::code(1); switch (Level) { case OutputLevel::Normal: case OutputLevel::Parseable: break; case OutputLevel::PrintJobs: Cmd->printCommandLineAndEnvironment(llvm::outs()); return Compilation::Result::code(0); case OutputLevel::Verbose: Cmd->printCommandLine(llvm::errs()); break; } SmallVector Argv; Argv.push_back(Cmd->getExecutable()); Argv.append(Cmd->getArguments().begin(), Cmd->getArguments().end()); Argv.push_back(nullptr); const char *ExecPath = Cmd->getExecutable(); const char **argv = Argv.data(); for (auto &envPair : Cmd->getExtraEnvironment()) { #if defined(_MSC_VER) int envResult =_putenv_s(envPair.first, envPair.second); #else int envResult = setenv(envPair.first, envPair.second, /*replacing=*/true); #endif assert(envResult == 0 && "expected environment variable to be set successfully"); // Bail out early in release builds. if (envResult != 0) { return Compilation::Result::code(envResult); } } const auto returnCode = ExecuteInPlace(ExecPath, argv); return Compilation::Result::code(returnCode); } static bool writeAllSourcesFile(DiagnosticEngine &diags, StringRef path, ArrayRef inputFiles) { std::error_code error; llvm::raw_fd_ostream out(path, error, llvm::sys::fs::OF_None); if (out.has_error()) { out.clear_error(); diags.diagnose(SourceLoc(), diag::error_unable_to_make_temporary_file, error.message()); return false; } for (auto inputPair : inputFiles) { if (!file_types::isPartOfSwiftCompilation(inputPair.first)) continue; out << inputPair.second->getValue() << "\n"; } return true; } Compilation::Result Compilation::performJobs(std::unique_ptr &&TQ) { if (AllSourceFilesPath) if (!writeAllSourcesFile(Diags, AllSourceFilesPath, getInputFiles())) return Compilation::Result::code(EXIT_FAILURE); // If we don't have to do any cleanup work, just exec the subprocess. if (Level < OutputLevel::Parseable && !ShowDriverTimeCompilation && (SaveTemps || TempFilePaths.empty()) && Jobs.size() == 1) { return performSingleCommand(Jobs.front().get()); } if (!TaskQueue::supportsParallelExecution() && TQ->getNumberOfParallelTasks() > 1) { Diags.diagnose(SourceLoc(), diag::warning_parallel_execution_not_supported); } auto result = performJobsImpl(std::move(TQ)); if (!SaveTemps) { for (const auto &pathPair : TempFilePaths) { if (!result.hadAbnormalExit || pathPair.getValue() == PreserveOnSignal::No) (void)llvm::sys::fs::remove(pathPair.getKey()); } } if (Stats) Stats->noteCurrentProcessExitStatus(result.exitCode); return result; } const char *Compilation::getAllSourcesPath() const { if (!AllSourceFilesPath) { SmallString<128> Buffer; std::error_code EC = llvm::sys::fs::createTemporaryFile("sources", "", Buffer); if (EC) { // Use the constructor that prints both the error code and the // description. // FIXME: This should not take down the entire process. auto error = llvm::make_error( EC, "- unable to create list of input sources"); llvm::report_fatal_error(std::move(error)); } auto *mutableThis = const_cast(this); mutableThis->addTemporaryFile(Buffer.str(), PreserveOnSignal::Yes); mutableThis->AllSourceFilesPath = getArgs().MakeArgString(Buffer); } return AllSourceFilesPath; } unsigned Compilation::countSwiftInputs() const { unsigned inputCount = 0; for (const auto &p : InputFilesWithTypes) if (p.first == file_types::TY_Swift) ++inputCount; return inputCount; } void Compilation::addDependencyPathOrCreateDummy( StringRef depPath, function_ref addDependencyPath) { if (!OnlyOneDependencyFile) { addDependencyPath(); return; } if (!HaveAlreadyAddedDependencyPath) { addDependencyPath(); HaveAlreadyAddedDependencyPath = true; } else if (!depPath.empty()) { // Create dummy empty file std::error_code EC; llvm::raw_fd_ostream(depPath, EC, llvm::sys::fs::OF_None); } } template void Compilation::sortJobsToMatchCompilationInputs( const JobCollection &unsortedJobs, SmallVectorImpl &sortedJobs) const { llvm::DenseMap jobsByInput; for (const Job *J : unsortedJobs) { // Only worry about sorting compilation jobs if (const CompileJobAction *CJA = dyn_cast(&J->getSource())) { const InputAction *IA = CJA->findSingleSwiftInput(); jobsByInput.insert(std::make_pair(IA->getInputArg().getValue(), J)); } else sortedJobs.push_back(J); } for (const InputPair &P : getInputFiles()) { auto I = jobsByInput.find(P.second->getValue()); if (I != jobsByInput.end()) { sortedJobs.push_back(I->second); } } } template void Compilation::sortJobsToMatchCompilationInputs>( const ArrayRef &, SmallVectorImpl &sortedJobs) const;