|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
"""Profiler to check if there are any bottlenecks in your code.""" |
|
|
|
import cProfile |
|
import io |
|
import logging |
|
import os |
|
import pstats |
|
import tempfile |
|
from pathlib import Path |
|
from typing import Optional, Union |
|
|
|
from typing_extensions import override |
|
|
|
from lightning_fabric.utilities.cloud_io import get_filesystem |
|
from pytorch_lightning.profilers.profiler import Profiler |
|
from pytorch_lightning.utilities.rank_zero import rank_zero_only |
|
|
|
log = logging.getLogger(__name__) |
|
|
|
|
|
class AdvancedProfiler(Profiler): |
|
"""This profiler uses Python's cProfiler to record more detailed information about time spent in each function call |
|
recorded during a given action. |
|
|
|
The output is quite verbose and you should only use this if you want very detailed reports. |
|
|
|
""" |
|
|
|
def __init__( |
|
self, |
|
dirpath: Optional[Union[str, Path]] = None, |
|
filename: Optional[str] = None, |
|
line_count_restriction: float = 1.0, |
|
dump_stats: bool = False, |
|
) -> None: |
|
""" |
|
Args: |
|
dirpath: Directory path for the ``filename``. If ``dirpath`` is ``None`` but ``filename`` is present, the |
|
``trainer.log_dir`` (from :class:`~pytorch_lightning.loggers.tensorboard.TensorBoardLogger`) |
|
will be used. |
|
|
|
filename: If present, filename where the profiler results will be saved instead of printing to stdout. |
|
The ``.txt`` extension will be used automatically. |
|
|
|
line_count_restriction: this can be used to limit the number of functions |
|
reported for each action. either an integer (to select a count of lines), |
|
or a decimal fraction between 0.0 and 1.0 inclusive (to select a percentage of lines) |
|
|
|
dump_stats: Whether to save raw profiler results. When ``True`` then ``dirpath`` must be provided. |
|
|
|
Raises: |
|
ValueError: |
|
If you attempt to stop recording an action which was never started. |
|
""" |
|
super().__init__(dirpath=dirpath, filename=filename) |
|
self.profiled_actions: dict[str, cProfile.Profile] = {} |
|
self.line_count_restriction = line_count_restriction |
|
self.dump_stats = dump_stats |
|
|
|
@override |
|
def start(self, action_name: str) -> None: |
|
if action_name not in self.profiled_actions: |
|
self.profiled_actions[action_name] = cProfile.Profile() |
|
self.profiled_actions[action_name].enable() |
|
|
|
@override |
|
def stop(self, action_name: str) -> None: |
|
pr = self.profiled_actions.get(action_name) |
|
if pr is None: |
|
raise ValueError(f"Attempting to stop recording an action ({action_name}) which was never started.") |
|
pr.disable() |
|
|
|
def _dump_stats(self, action_name: str, profile: cProfile.Profile) -> None: |
|
assert self.dirpath |
|
dst_filepath = os.path.join(self.dirpath, self._prepare_filename(action_name=action_name, extension=".prof")) |
|
dst_fs = get_filesystem(dst_filepath) |
|
dst_fs.mkdirs(self.dirpath, exist_ok=True) |
|
|
|
with ( |
|
tempfile.TemporaryDirectory(prefix="test", suffix=str(rank_zero_only.rank), dir=os.getcwd()) as tmp_dir, |
|
dst_fs.open(dst_filepath, "wb") as dst_file, |
|
): |
|
src_filepath = os.path.join(tmp_dir, "tmp.prof") |
|
profile.dump_stats(src_filepath) |
|
src_fs = get_filesystem(src_filepath) |
|
with src_fs.open(src_filepath, "rb") as src_file: |
|
dst_file.write(src_file.read()) |
|
|
|
@override |
|
def summary(self) -> str: |
|
recorded_stats = {} |
|
for action_name, pr in self.profiled_actions.items(): |
|
if self.dump_stats: |
|
self._dump_stats(action_name, pr) |
|
s = io.StringIO() |
|
ps = pstats.Stats(pr, stream=s).strip_dirs().sort_stats("cumulative") |
|
ps.print_stats(self.line_count_restriction) |
|
recorded_stats[action_name] = s.getvalue() |
|
return self._stats_to_str(recorded_stats) |
|
|
|
@override |
|
def teardown(self, stage: Optional[str]) -> None: |
|
super().teardown(stage=stage) |
|
self.profiled_actions = {} |
|
|
|
def __reduce__(self) -> tuple: |
|
|
|
return ( |
|
self.__class__, |
|
(), |
|
{"dirpath": self.dirpath, "filename": self.filename, "line_count_restriction": self.line_count_restriction}, |
|
) |
|
|