blob: 30ec7ad4ef546d76976ceefe3685b0c5a6063978 [file] [log] [blame]
// Copyright 2018 Google Inc. All Rights Reserved.
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
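// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.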
// See the License for the specific language governing permissions and
// limitations under the License.
#include "thread_pool.h"
#include <assert.h>
#include <atomic>
#include <condition_variable>
#include <thread>
#include "metrics.h"
#include "util.h"
// ThreadPool implementation backed by a fixed set of std::thread workers that
// cooperate on one batch of tasks at a time.
struct ThreadPoolImpl : ThreadPool {
  // Constructs the pool for the requested number of threads.
  explicit ThreadPoolImpl(int num_threads);
  virtual ~ThreadPoolImpl();

  // Runs every task in |tasks|.
  void RunTasks(std::vector<std::function<void()>>&& tasks) override;

  // Entry point executed by each worker thread.
  void WorkerThreadLoop();

  // The state of one RunTasks() call. It is held through std::shared_ptr, so a
  // worker can keep using it after current_batch_ has been reset.
  struct Batch {
    Batch(size_t task_count, std::vector<std::function<void()>>&& tasks)
        : task_count(task_count), tasks(std::move(tasks)) {}

    // Number of tasks in the batch.
    const size_t task_count;

    // Index of the next task to start. Workers claim a task by atomically
    // incrementing this, so it may grow past task_count.
    std::atomic<size_t> next_task_idx { 0 };

    // Number of tasks that have finished running.
    std::atomic<size_t> tasks_completed { 0 };

    std::vector<std::function<void()>> tasks;

    // Set (with ThreadPoolImpl::mutex_ held) once every task has finished; the
    // thread waiting on main_cv_ uses it as its wake-up condition.
    bool completed = false;
  };

  // Held while reading or writing current_batch_, shutting_down_ and
  // Batch::completed.
  std::mutex mutex_;

  // The batch currently being run, or null when there is none.
  std::shared_ptr<Batch> current_batch_;

  // Set by the destructor to tell the worker threads to exit.
  bool shutting_down_ = false;

  // Workers wait on this for a batch with unclaimed tasks or for shutdown.
  std::condition_variable worker_cv_;

  // RunTasks() waits on this for its batch to be marked completed.
  std::condition_variable main_cv_;

  // The worker threads; left empty when the pool runs tasks on the caller.
  std::vector<std::thread> threads_;
};
// Starts |num_threads| worker threads, each running WorkerThreadLoop().
//
// When |num_threads| is 1 or less no thread is started and threads_ stays
// empty.
ThreadPoolImpl::ThreadPoolImpl(int num_threads) {
  if (num_threads <= 1) {
    // On a single-core machine (or with "-d nothreads"), don't start any
    // threads.
    return;
  }

  // Append the threads rather than assigning through operator[], so the vector
  // never has to be indexed before it has been sized.
  threads_.reserve(num_threads);
  for (int i = 0; i < num_threads; ++i) {
    threads_.emplace_back([this] { WorkerThreadLoop(); });
  }
}
// Asks every worker thread to exit and waits for all of them to finish.
ThreadPoolImpl::~ThreadPoolImpl() {
  {
    // shutting_down_ is read by the workers with mutex_ held, so it is written
    // with the mutex held too. The lock is released before joining: a worker
    // has to re-acquire mutex_ to wake up and observe the flag.
    std::lock_guard<std::mutex> lock(mutex_);
    shutting_down_ = true;
  }

  // Wake every worker blocked on worker_cv_ so it can see shutting_down_.
  worker_cv_.notify_all();

  // A std::thread must be joined (or detached) before it is destroyed.
  for (auto& thread : threads_) {
    thread.join();
  }
}
void ThreadPoolImpl::RunTasks(std::vector<std::function<void()>>&& tasks) {
// Sometimes it's better to run the tasks on the caller's thread:
// - When parsing the manifest tree, only one file is parsed at a time, so if
// a manifest tree has many small files, the overhead of dispatching each
// file to a worker thread can be substantial.
// - When ninja runs on a single-core machine, or with "-d nothreads", there
// are no worker threads in the pool.
const size_t task_count = tasks.size();
if (threads_.empty() || task_count <= 1) {
for (auto& task : tasks) {
std::shared_ptr<Batch> batch = std::make_shared<Batch>(task_count,
std::lock_guard<std::mutex> lock(mutex_);
assert(current_batch_.get() == nullptr &&
"the thread pool isn't intended for reentrant or concurrent use");
current_batch_ = batch;
std::unique_lock<std::mutex> lock(mutex_);
main_cv_.wait(lock, [batch]() { return batch->completed; });
current_batch_ = {};
// The client's std::function might do interesting work when it's destructed
// (e.g. destruct a lambda's captured state), so destruct the functions before
// returning. It's safe to modify the batch's tasks vector because there are
// no more tasks to run. The Batch itself is freed at an unpredictable time.
void ThreadPoolImpl::WorkerThreadLoop() {
while (true) {
// A shared_ptr object isn't thread-safe itself, but its control block is
// thread-safe. This worker thread must lock the mutex before checking the
// active batch.
std::shared_ptr<Batch> batch;
// Wait until either:
// - There is an active batch with at least one task remaining.
// - The thread pool is shutting down.
std::unique_lock<std::mutex> lock(mutex_);
worker_cv_.wait(lock, [this, &batch]() {
auto b = current_batch_;
if (b && b->next_task_idx.load() < b->task_count) {
batch = b;
return true;
return shutting_down_;
if (shutting_down_) {
while (true) {
// Try to start another task in this batch. Atomically load and increment
// the next task index.
size_t idx = batch->next_task_idx++;
if (idx >= batch->task_count) {
// The fetched next-task-index is expected to exceed the total number of
// tasks as the threads finish the batch. Return to the main loop. Some
// other thread will finish the batch, if it hasn't already.
// Atomically increment the number of completed tasks. Exactly one worker
// thread should notice that the completed task count equals the total
// number of tasks, and that worker thread signals the main thread.
if (++batch->tasks_completed >= batch->task_count) {
assert(batch->tasks_completed.load() == batch->task_count &&
"BatchThreadPool::Batch completion count exceeded task count");
// Every task is completed, so mark the batch done and wake up the main
// thread.
std::lock_guard<std::mutex> lock(mutex_);
batch->completed = true;
// Thread count passed to each ThreadPoolImpl built by CreateThreadPool().
// Always at least 1.
static int g_num_threads = 1;

// Sets the thread count used for thread pools created afterwards. Values below
// 1 are clamped to 1.
void SetThreadPoolThreadCount(int num_threads) {
  g_num_threads = std::max(num_threads, 1);
}
// Returns how many tasks a caller should split its work into for the thread
// pool: twice the configured thread count, or 1 when that count is 1 or less.
int GetOptimalThreadPoolJobCount() {
  if (g_num_threads <= 1) {
    // If there are no worker threads, then multiple tasks aren't useful.
    // Returning 1 will disable manifest and log file splitting.
    return 1;
  }

  // Magic constant: when splitting work into tasks for the thread pool, try
  // to create a fixed number of tasks per thread in the pool.
  return g_num_threads * 2;
}
// Creates a thread pool using the thread count most recently configured with
// SetThreadPoolThreadCount() (1 if it was never called). The caller owns the
// returned pool.
std::unique_ptr<ThreadPool> CreateThreadPool() {
  return std::unique_ptr<ThreadPool>(new ThreadPoolImpl(g_num_threads));
}