mirror of
https://github.com/pytorch/pytorch.git
synced 2025-10-20 21:14:14 +08:00
As the title stated **Changes:** - Add **record**, **query** and **enable_timing** check - Add related tests Pull Request resolved: https://github.com/pytorch/pytorch/pull/151404 Approved by: https://github.com/albanD
148 lines
4.2 KiB
C++
148 lines
4.2 KiB
C++
#pragma once
|
|
|
|
#include <c10/core/DeviceType.h>
|
|
#include <c10/core/Stream.h>
|
|
#include <c10/core/impl/DeviceGuardImplInterface.h>
|
|
#include <c10/util/Exception.h>
|
|
|
|
namespace c10::impl {
|
|
|
|
template <typename T>
|
|
struct InlineEvent final {
|
|
InlineEvent() = delete;
|
|
InlineEvent(
|
|
const DeviceType _device_type,
|
|
const EventFlag _flag = EventFlag::PYTORCH_DEFAULT)
|
|
: backend_{_device_type}, device_type_{_device_type}, flag_{_flag} {}
|
|
|
|
// Copy constructor and copy assignment operator (deleted)
|
|
InlineEvent(const InlineEvent&) = delete;
|
|
InlineEvent& operator=(const InlineEvent&) = delete;
|
|
|
|
// Move constructor and move assignment operator
|
|
InlineEvent(InlineEvent&& other) noexcept
|
|
: event_(other.event_),
|
|
backend_(std::move(other.backend_)),
|
|
device_type_(other.device_type_),
|
|
device_index_(other.device_index_),
|
|
flag_(other.flag_),
|
|
was_marked_for_recording_(other.was_marked_for_recording_) {
|
|
other.event_ = nullptr;
|
|
}
|
|
InlineEvent& operator=(InlineEvent&& other) noexcept {
|
|
swap(other);
|
|
return *this;
|
|
}
|
|
|
|
void swap(InlineEvent& other) noexcept {
|
|
std::swap(event_, other.event_);
|
|
std::swap(backend_, other.backend_);
|
|
std::swap(device_type_, other.device_type_);
|
|
std::swap(device_index_, other.device_index_);
|
|
std::swap(flag_, other.flag_);
|
|
std::swap(was_marked_for_recording_, other.was_marked_for_recording_);
|
|
}
|
|
|
|
~InlineEvent() noexcept {
|
|
if (event_)
|
|
backend_.destroyEvent(event_, device_index_);
|
|
}
|
|
|
|
DeviceType device_type() const noexcept {
|
|
return device_type_;
|
|
}
|
|
DeviceIndex device_index() const noexcept {
|
|
return device_index_;
|
|
}
|
|
EventFlag flag() const noexcept {
|
|
return flag_;
|
|
}
|
|
bool was_marked_for_recording() const noexcept {
|
|
return was_marked_for_recording_;
|
|
}
|
|
|
|
void recordOnce(const Stream& stream) {
|
|
if (!was_marked_for_recording_)
|
|
record(stream);
|
|
}
|
|
|
|
void record(const Stream& stream) {
|
|
TORCH_CHECK(
|
|
stream.device_type() == device_type_,
|
|
"Event device type ",
|
|
DeviceTypeName(device_type_),
|
|
" does not match recording stream's device type ",
|
|
DeviceTypeName(stream.device_type()),
|
|
".");
|
|
|
|
backend_.record(&event_, stream, device_index_, flag_);
|
|
was_marked_for_recording_ = true;
|
|
device_index_ = stream.device_index();
|
|
}
|
|
|
|
void block(const Stream& stream) const {
|
|
if (!was_marked_for_recording_)
|
|
return;
|
|
|
|
TORCH_CHECK(
|
|
stream.device_type() == device_type_,
|
|
"Event device type ",
|
|
DeviceTypeName(device_type_),
|
|
" does not match blocking stream's device type ",
|
|
DeviceTypeName(stream.device_type()),
|
|
".");
|
|
|
|
backend_.block(event_, stream);
|
|
}
|
|
|
|
bool query() const {
|
|
if (!was_marked_for_recording_)
|
|
return true;
|
|
return backend_.queryEvent(event_);
|
|
}
|
|
|
|
void* eventId() const {
|
|
return event_;
|
|
}
|
|
|
|
double elapsedTime(const InlineEvent& other) const {
|
|
TORCH_CHECK(
|
|
other.device_type() == device_type_,
|
|
"Event device type ",
|
|
DeviceTypeName(device_type_),
|
|
" does not match other's device type ",
|
|
DeviceTypeName(other.device_type()),
|
|
".");
|
|
TORCH_CHECK_VALUE(
|
|
(flag_ == EventFlag::BACKEND_DEFAULT) &&
|
|
(other.flag_ == EventFlag::BACKEND_DEFAULT),
|
|
"Both events must be created with argument 'enable_timing=True'.");
|
|
TORCH_CHECK_VALUE(
|
|
was_marked_for_recording() && other.was_marked_for_recording(),
|
|
"Both events must be recorded before calculating elapsed time.");
|
|
// elapsedTime in MPS can wait event to be completed if event is not ready,
|
|
// which is a little differenct from CUDA
|
|
TORCH_CHECK(
|
|
(query() && other.query()) || device_type_ == DeviceType::MPS,
|
|
"Both events must be completed before calculating elapsed time.");
|
|
|
|
return backend_.elapsedTime(event_, other.event_, device_index_);
|
|
}
|
|
|
|
void synchronize() const {
|
|
if (!was_marked_for_recording_)
|
|
return;
|
|
backend_.synchronizeEvent(event_);
|
|
}
|
|
|
|
private:
|
|
void* event_ = nullptr;
|
|
T backend_;
|
|
DeviceType device_type_;
|
|
DeviceIndex device_index_ = -1;
|
|
EventFlag flag_ = EventFlag::PYTORCH_DEFAULT;
|
|
bool was_marked_for_recording_ = false;
|
|
};
|
|
|
|
} // namespace c10::impl
|