mirror of
https://github.com/pytorch/pytorch.git
synced 2025-10-20 21:14:14 +08:00
Summary: Since we increment the counter after performing the callback, it leads to the assertion error when callback raises an error and increment never happens. Let's increment first to avoid it. Test Plan: tba Rollback Plan: Differential Revision: D77475650 Pull Request resolved: https://github.com/pytorch/pytorch/pull/157185 Approved by: https://github.com/xmfan
172 lines
5.5 KiB
Python
172 lines
5.5 KiB
Python
"""
|
|
This module provides callback management functionality for TorchDynamo's compilation process.
|
|
|
|
It implements a thread-safe system for registering, managing and executing callbacks that run
|
|
at the start and end of TorchDynamo compilations. Key features include:
|
|
|
|
- Registration and deregistration of compilation callbacks
|
|
- Thread-safe callback handling with proper locking mechanisms
|
|
- Prevention of duplicate callback execution when configured
|
|
- Decorator utilities for easy callback registration
|
|
- Context manager for controlled callback lifecycle
|
|
|
|
The module centers around the CompilationCallbackHandler class which maintains separate
|
|
lists for start and end callbacks, manages their execution order, and ensures thread-safety.
|
|
Utility decorators @on_compile_start and @on_compile_end provide a convenient way to
|
|
register compilation hooks.
|
|
|
|
Example usage:
|
|
@on_compile_start
|
|
def my_start_callback():
|
|
print("Starting compilation")
|
|
|
|
@on_compile_end
|
|
def my_end_callback():
|
|
print("Compilation complete")
|
|
"""
|
|
|
|
import enum
|
|
import threading
|
|
from collections.abc import Generator
|
|
from contextlib import contextmanager
|
|
from dataclasses import dataclass, field # noqa: F811
|
|
from typing import Any, Callable
|
|
|
|
|
|
class CallbackTrigger(enum.Enum):
|
|
# most common case, dynamo attempts to trace a new frame
|
|
DYNAMO = 1
|
|
# backward compilation can be deferred to runtime
|
|
LAZY_BACKWARD = 2
|
|
# some backends autotune at runtime
|
|
TRITON_AUTOTUNING = 3 # Temporarily disabled due to spam
|
|
# cudagraphs record at runtime
|
|
CUDAGRAPH_RECORDING = 4
|
|
|
|
|
|
@dataclass
|
|
class CallbackArgs:
|
|
callback_trigger: CallbackTrigger
|
|
compile_id: str
|
|
|
|
|
|
@dataclass
|
|
class CompilationCallbackHandler:
|
|
start_callbacks: list[Callable[[CallbackArgs], None]] = field(default_factory=list)
|
|
end_callbacks: list[Callable[[CallbackArgs], None]] = field(default_factory=list)
|
|
|
|
__pending_callbacks_counter: int = field(default=0, init=False, repr=False)
|
|
__pending_callbacks_counter_lock: threading.Lock = field(
|
|
default_factory=threading.Lock, init=False, repr=False
|
|
)
|
|
|
|
def register_start_callback(
|
|
self, callback: Callable[[CallbackArgs], None]
|
|
) -> Callable[[CallbackArgs], None]:
|
|
"""
|
|
Register a callback function to be called when the compilation starts.
|
|
|
|
Args:
|
|
- callback (Callable): The callback function to register.
|
|
"""
|
|
self.start_callbacks.append(callback)
|
|
return callback
|
|
|
|
def register_end_callback(
|
|
self, callback: Callable[[CallbackArgs], None]
|
|
) -> Callable[[CallbackArgs], None]:
|
|
"""
|
|
Register a callback function to be called when the compilation ends.
|
|
|
|
Args:
|
|
- callback (Callable): The callback function to register.
|
|
"""
|
|
self.end_callbacks.append(callback)
|
|
return callback
|
|
|
|
def remove_start_callback(self, callback: Callable[[CallbackArgs], None]) -> None:
|
|
"""
|
|
Remove a registered start callback function.
|
|
|
|
Args:
|
|
- callback (Callable): The callback function to remove.
|
|
"""
|
|
self.start_callbacks.remove(callback)
|
|
|
|
def remove_end_callback(self, callback: Callable[[CallbackArgs], None]) -> None:
|
|
"""
|
|
Remove a registered end callback function.
|
|
|
|
Args:
|
|
- callback (Callable): The callback function to remove.
|
|
"""
|
|
self.end_callbacks.remove(callback)
|
|
|
|
def run_start_callbacks(self, args: CallbackArgs) -> None:
|
|
"""
|
|
Execute all registered start callbacks.
|
|
"""
|
|
for callback in self.start_callbacks:
|
|
callback(args)
|
|
|
|
def run_end_callbacks(self, args: CallbackArgs) -> None:
|
|
"""
|
|
Execute all registered end callbacks.
|
|
"""
|
|
for callback in self.end_callbacks:
|
|
callback(args)
|
|
|
|
@contextmanager
|
|
def install_callbacks(
|
|
self, trigger: CallbackTrigger, compile_id: str
|
|
) -> Generator[None, Any, Any]:
|
|
"""
|
|
Context manager to install the callbacks and run them when the context is exited.
|
|
"""
|
|
args = CallbackArgs(trigger, compile_id)
|
|
try:
|
|
with self.__pending_callbacks_counter_lock:
|
|
self.__pending_callbacks_counter += 1
|
|
if self.__pending_callbacks_counter == 1:
|
|
self.run_start_callbacks(args)
|
|
yield
|
|
finally:
|
|
with self.__pending_callbacks_counter_lock:
|
|
assert self.__pending_callbacks_counter > 0, (
|
|
"Pending callbacks counter cannot become negative."
|
|
)
|
|
if self.__pending_callbacks_counter == 1:
|
|
self.run_end_callbacks(args)
|
|
self.__pending_callbacks_counter -= 1
|
|
|
|
def clear(self) -> None:
|
|
"""
|
|
Clear all registered callbacks.
|
|
"""
|
|
self.start_callbacks.clear()
|
|
self.end_callbacks.clear()
|
|
assert self.__pending_callbacks_counter == 0
|
|
|
|
|
|
callback_handler = CompilationCallbackHandler()
|
|
|
|
|
|
def on_compile_start(
|
|
callback: Callable[[CallbackArgs], None],
|
|
) -> Callable[[CallbackArgs], None]:
|
|
"""
|
|
Decorator to register a callback function for the start of the compilation.
|
|
"""
|
|
callback_handler.register_start_callback(callback)
|
|
return callback
|
|
|
|
|
|
def on_compile_end(
|
|
callback: Callable[[CallbackArgs], None],
|
|
) -> Callable[[CallbackArgs], None]:
|
|
"""
|
|
Decorator to register a callback function for the end of the compilation.
|
|
"""
|
|
callback_handler.register_end_callback(callback)
|
|
return callback
|