mirror of
https://github.com/pytorch/pytorch.git
synced 2025-10-20 21:14:14 +08:00
Summary: PR https://github.com/pytorch/pytorch/pull/31033 was unlanded due to a macOS build failure: https://app.circleci.com/jobs/github/pytorch/pytorch/3916388 In this PR, `setNumThreads` is available only on Android and has been moved to a separate class, `org.pytorch.PytorchAndroid`, as a static function, which is a better fit because it has a global effect. Pull Request resolved: https://github.com/pytorch/pytorch/pull/31205 Reviewed By: dreiss Differential Revision: D18977250 Pulled By: IvanKobzarev fbshipit-source-id: 4995859808af498c82933c4db52bd7c7dfae90e5
64 lines
1.8 KiB
C++
64 lines
1.8 KiB
C++
#ifndef CAFFE2_UTILS_THREADPOOL_H_
|
|
#define CAFFE2_UTILS_THREADPOOL_H_
|
|
|
|
#include "ThreadPoolCommon.h"
|
|
|
|
#include <functional>
|
|
#include <memory>
|
|
#include <mutex>
|
|
#include <vector>
|
|
#include <atomic>
|
|
|
|
#include "caffe2/core/common.h"
|
|
|
|
//
|
|
// A work-stealing threadpool loosely based off of pthreadpool
|
|
//
|
|
|
|
namespace caffe2 {
|
|
|
|
// Forward declarations. Within this header both types are only used through
// raw pointers and std::shared_ptr, so their full definitions are not needed
// here.
struct Task;
|
|
class WorkersPool;
|
|
|
|
// Alignment value referenced by the (currently commented-out) alignas
// annotation on ThreadPool.
constexpr size_t kCacheLineSize = 64;
|
|
|
|
// A threadpool with the given number of threads.
|
|
// NOTE: the kCacheLineSize alignment is present only for cache
|
|
// performance, and is not strictly enforced (for example, when
|
|
// the object is created on the heap). Thus, in order to avoid
|
|
// misaligned intrinsics, no SSE instructions shall be involved in
|
|
// the ThreadPool implementation.
|
|
// Note: alignas is disabled because some compilers do not deal with
|
|
// CAFFE2_API and alignas annotations at the same time.
|
|
class CAFFE2_API /*alignas(kCacheLineSize)*/ ThreadPool {
|
|
public:
|
|
static std::unique_ptr<ThreadPool> defaultThreadPool();
|
|
ThreadPool(int numThreads);
|
|
~ThreadPool();
|
|
// Returns the number of threads currently in use
|
|
int getNumThreads() const;
|
|
void setNumThreads(size_t numThreads);
|
|
|
|
// Sets the minimum work size (range) for which to invoke the
|
|
// threadpool; work sizes smaller than this will just be run on the
|
|
// main (calling) thread
|
|
void setMinWorkSize(size_t size);
|
|
size_t getMinWorkSize() const { return minWorkSize_; }
|
|
void run(const std::function<void(int, size_t)>& fn, size_t range);
|
|
|
|
// Run an arbitrary function in a thread-safe manner accessing the Workers
|
|
// Pool
|
|
void withPool(const std::function<void(WorkersPool*)>& fn);
|
|
|
|
private:
|
|
mutable std::mutex executionMutex_;
|
|
size_t minWorkSize_;
|
|
std::atomic_size_t numThreads_;
|
|
std::shared_ptr<WorkersPool> workersPool_;
|
|
std::vector<std::shared_ptr<Task>> tasks_;
|
|
};
|
|
|
|
} // namespace caffe2
|
|
|
|
#endif // CAFFE2_UTILS_THREADPOOL_H_
|