Skip to content

common

zeus.optimizer.pipeline_frequency.common

Shared constants and models between the server and the client (optimizer).

PFOServerSettings

Bases: BaseSettings

PFO server settings, configurable via environment variables.

For instance, setting ZEUS_PFO_LOG_LEVEL=INFO will automatically set the log_level variable to "INFO".

Attributes:

Name Type Description
scheduler PyObject

Name of the FrequencyScheduler to use.

scheduler_args dict[str, Any]

Any extra arguments required by scheduler.__init__.

log_level str

Log level, e.g. "debug", "info".

dump_data bool

Whether the scheduler should dump internal state to the filesystem (for future inspection purposes).

dump_dir str

Directory to dump state in (if enabled).

max_job_idle_time int

Maximum time in seconds that a job can be idle for before its states are automatically deleted from the server.

Source code in zeus/optimizer/pipeline_frequency/common.py
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
class PFOServerSettings(BaseSettings):
    """PFO server settings, configurable via environment variables.

    For instance, setting `ZEUS_PFO_LOG_LEVEL=INFO` will automatically set
    the `log_level` variable to `"INFO"`.

    Attributes:
        scheduler: Name of the `FrequencyScheduler` to use.
        scheduler_args: Any extra arguments required by `scheduler.__init__`.
        log_level: Log level, e.g. "debug", "info".
        dump_data: Whether the scheduler should dump internal state to the filesystem
            (for future inspection purposes).
        dump_dir: Directory to dump state in (if enabled).
        max_job_idle_time: Maximum time in seconds that a job can be idle for before
            its states are automatically deleted from the server.
    """

    scheduler: PyObject = "PointSolution"  # type: ignore
    scheduler_args: dict[str, Any] = {}
    log_level: str = "DEBUG"
    dump_data: bool = True
    dump_dir: str = "./dump"
    max_job_idle_time: int = 60 * 60 * 24 * 7  # 1 week

    @validator("scheduler", pre=True)
    def _fix_scheduler_import_path(cls, value):
        """Prepend `zeus.optimizer.pipeline_frequency.server.scheduler.` to the scheduler type name."""
        return f"zeus.optimizer.pipeline_frequency.server.scheduler.{value}"

    @validator("scheduler_args")
    def _validate_scheduler_args(cls, args, values):
        """Check whether args are as expected by the scheduler's constructor."""
        # If the `scheduler` field itself failed validation, pydantic omits it
        # from `values`; indexing would raise an opaque KeyError here, so skip
        # this check and let pydantic report the original `scheduler` error.
        scheduler = values.get("scheduler")
        if scheduler is None:
            return args
        # The server always injects these three arguments, so bind them along
        # with the user-provided args to validate the full constructor call.
        full_args = args | dict(job_info=None, rank_infos=None, pfo_settings=None)
        constructor_args = inspect.signature(scheduler)
        try:
            constructor_args.bind(**full_args)
        except TypeError as e:
            raise ValueError(f"Invalid scheduler args: {e}") from None
        return args

    @validator("log_level")
    def _make_upper_case(cls, value):
        """Normalize the log level to upper case (e.g. "info" -> "INFO")."""
        return value.upper()

    class Config:  # type: ignore
        """Configuration class read by pydantic."""

        # Environment variables prefixed with `ZEUS_PFO_` map onto fields.
        env_prefix = "zeus_pfo_"

Config

Configuration class read by pydantic.

Source code in zeus/optimizer/pipeline_frequency/common.py
81
82
83
84
class Config:  # type: ignore
    """Configuration class read by pydantic."""

    # Environment variables prefixed with `ZEUS_PFO_` populate the settings
    # fields (e.g. `ZEUS_PFO_LOG_LEVEL` sets `log_level`).
    env_prefix = "zeus_pfo_"

_fix_scheduler_import_path

_fix_scheduler_import_path(value)

Prepend zeus.optimizer.pipeline_frequency.server.scheduler. to the scheduler type name.

Source code in zeus/optimizer/pipeline_frequency/common.py
60
61
62
63
@validator("scheduler", pre=True)
def _fix_scheduler_import_path(cls, value):
    """Prepend `zeus.optimizer.pipeline_frequency.server.scheduler.` to the scheduler type name."""
    # Schedulers all live in one module, so users only supply the class name.
    scheduler_module = "zeus.optimizer.pipeline_frequency.server.scheduler"
    return f"{scheduler_module}.{value}"

_validate_scheduler_args

_validate_scheduler_args(args, values)

Check whether args are as expected by the scheduler's constructor.

Source code in zeus/optimizer/pipeline_frequency/common.py
65
66
67
68
69
70
71
72
73
74
75
@validator("scheduler_args")
def _validate_scheduler_args(cls, args, values):
    """Check whether args are as expected by the scheduler's constructor."""
    # If the `scheduler` field itself failed validation, pydantic omits it
    # from `values`; indexing would raise an opaque KeyError here, so skip
    # this check and let pydantic report the original `scheduler` error.
    scheduler = values.get("scheduler")
    if scheduler is None:
        return args
    # The server always injects these three arguments, so bind them along
    # with the user-provided args to validate the full constructor call.
    full_args = args | dict(job_info=None, rank_infos=None, pfo_settings=None)
    constructor_args = inspect.signature(scheduler)
    try:
        constructor_args.bind(**full_args)
    except TypeError as e:
        raise ValueError(f"Invalid scheduler args: {e}") from None
    return args

JobInfo

Bases: BaseModel

Training job information reported to the server.

Attributes:

Name Type Description
job_id str

Globally unique ID of the training job, generated by the server. This field should be an empty string when sent to the server.

pp_degree int

Pipeline parallel degree.

dp_degree int

Data parallel degree.

tp_degree int

Tensor parallel degree.

world_size int

World size of the training job.

job_metadata Optional[str]

An optional arbitrary string that describes the job. This will be appended to the job ID if given. Typically for logging purposes.

Source code in zeus/optimizer/pipeline_frequency/common.py
 87
 88
 89
 90
 91
 92
 93
 94
 95
 96
 97
 98
 99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
class JobInfo(BaseModel):
    """Training job information reported to the server.

    Attributes:
        job_id: Globally unique ID of the training job, generated by the server.
            This field should be an empty string when sent to the server.
        pp_degree: Pipeline parallel degree.
        dp_degree: Data parallel degree.
        tp_degree: Tensor parallel degree.
        world_size: World size of the training job.
        job_metadata: An optional arbitrary string that describes the job. This will
            be appended to the job ID if given. Typically for logging purposes.
    """

    job_id: str = ""
    pp_degree: int = Field(ge=1)
    dp_degree: int = Field(ge=1)
    tp_degree: int = Field(ge=1)
    world_size: int = Field(ge=1)
    job_metadata: Optional[str] = None

    @validator("job_id")
    def _check_empty_job_id(cls, job_id):
        """The job ID is generated by the server, so clients must send it empty."""
        assert not job_id, "job_id must be empty; it is generated by the server"
        return job_id

    @validator("world_size")
    def _check_world_size(cls, world_size, values):
        """Product of PP, DP, and TP degree would be identical to the world size."""
        # Degrees that failed their own validation are absent from `values`
        # (pydantic v1 behavior); skip the cross-field check in that case so
        # the original error is reported instead of a KeyError.
        if not all(k in values for k in ("pp_degree", "dp_degree", "tp_degree")):
            return world_size
        assert (
            values["pp_degree"] * values["dp_degree"] * values["tp_degree"]
            == world_size
        ), "world_size must equal pp_degree * dp_degree * tp_degree"
        return world_size

    def set_job_id(self, scheduler_name: str):
        """Generate and set the job ID."""
        # "%Y-%m-%d" is equivalent to the glibc-only "%F" but also works on
        # platforms (e.g. Windows) whose strftime does not support "%F".
        self.job_id = "+".join(
            [
                datetime.now().strftime("%Y-%m-%d-%H-%M-%S"),
                f"dp{self.dp_degree}",
                f"pp{self.pp_degree}",
                f"tp{self.tp_degree}",
                scheduler_name,
            ]
        )
        if self.job_metadata:
            self.job_id += f"+{self.job_metadata}"

_check_world_size

_check_world_size(world_size, values)

Product of PP, DP, and TP degree would be identical to the world size.

Source code in zeus/optimizer/pipeline_frequency/common.py
113
114
115
116
117
118
119
120
@validator("world_size")
def _check_world_size(cls, world_size, values):
    """Product of PP, DP, and TP degree would be identical to the world size."""
    # Degrees that failed their own validation are absent from `values`
    # (pydantic v1 behavior); skip the cross-field check in that case so
    # the original error is reported instead of a KeyError.
    if not all(k in values for k in ("pp_degree", "dp_degree", "tp_degree")):
        return world_size
    assert (
        values["pp_degree"] * values["dp_degree"] * values["tp_degree"]
        == world_size
    ), "world_size must equal pp_degree * dp_degree * tp_degree"
    return world_size

set_job_id

set_job_id(scheduler_name)

Generate and set the job ID.

Source code in zeus/optimizer/pipeline_frequency/common.py
122
123
124
125
126
127
128
129
130
131
132
133
134
def set_job_id(self, scheduler_name: str):
    """Generate and set the job ID.

    The ID is `<timestamp>+dp<D>+pp<P>+tp<T>+<scheduler_name>`, with
    `+<job_metadata>` appended when metadata was provided.
    """
    # "%Y-%m-%d" is equivalent to the glibc-only "%F" but also works on
    # platforms (e.g. Windows) whose strftime does not support "%F".
    self.job_id = "+".join(
        [
            datetime.now().strftime("%Y-%m-%d-%H-%M-%S"),
            f"dp{self.dp_degree}",
            f"pp{self.pp_degree}",
            f"tp{self.tp_degree}",
            scheduler_name,
        ]
    )
    if self.job_metadata:
        self.job_id += f"+{self.job_metadata}"

RankInfo

Bases: BaseModel

Information passed to the server from each rank.

Attributes:

Name Type Description
rank int

Global rank of the reporting process.

dp_rank int

Data parallel rank of the reporting process.

pp_rank int

Pipeline parallel rank of the reporting process.

tp_rank int

Tensor parallel rank of the reporting process.

available_frequencies list[int]

List of available frequencies for the rank's GPU.

Source code in zeus/optimizer/pipeline_frequency/common.py
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
class RankInfo(BaseModel):
    """Information passed to the server from each rank.

    Attributes:
        rank: Global rank of the reporting process.
        dp_rank: Data parallel rank of the reporting process.
        pp_rank: Pipeline parallel rank of the reporting process.
        tp_rank: Tensor parallel rank of the reporting process.
        available_frequencies: List of available frequencies for the rank's GPU.
    """

    rank: int = Field(ge=0)
    dp_rank: int = Field(ge=0)
    pp_rank: int = Field(ge=0)
    tp_rank: int = Field(ge=0)
    available_frequencies: list[int]

FrequencySchedule

Bases: BaseModel

Frequency schedule for one iteration.

frequencies is a list of tuples, where the first element is the name of the instruction and the second element is the frequency to use for that instruction.

Source code in zeus/optimizer/pipeline_frequency/common.py
155
156
157
158
159
160
161
162
163
class FrequencySchedule(BaseModel):
    """Frequency schedule for one iteration.

    `frequencies` is a list of tuples, where the first element is the name of the
    instruction and the second element is the frequency to use for that instruction.

    Attributes:
        rank: Rank (>= 0) of the process this schedule is for.
        frequencies: (instruction name, frequency) pairs for this iteration.
    """

    rank: int = Field(ge=0)
    frequencies: list[tuple[str, int]]

ProfilingResult

Bases: BaseModel

Profiling results for a FrequencySchedule of a rank.

Attributes:

Name Type Description
rank int

Global rank of the reporting client.

iter_time list[float]

List of latency of all iterations within the profiling window in seconds.

iter_energy list[float]

List of energy consumption of all iterations within the profiling window in Joules.

time_breakdown dict[str, list[list[float]]]

Duration of each operation across multiple iterations. e.g. time_breakdown["forward"][i] is the list of latencies of all forward computations in the ith iteration.

energy_breakdown dict[str, list[list[float]]]

Energy consumption of each operation across multiple iterations. Value has the same structure as time_breakdown.

Source code in zeus/optimizer/pipeline_frequency/common.py
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
class ProfilingResult(BaseModel):
    """Profiling results for a `FrequencySchedule` of a rank.

    Attributes:
        rank: Global rank of the reporting client.
        iter_time: List of latency of all iterations within the profiling window in seconds.
        iter_energy: List of energy consumption of all iterations within the profiling window in Joules.
        time_breakdown: Duration of each operation across multiple iterations.
            e.g. `time_breakdown["forward"][i]` is the list of latencies of all forward computations
            in the `i`th iteration.
        energy_breakdown: Energy consumption of each operation across multiple iterations.
            Value has the same structure as `time_breakdown`.
    """

    rank: int = Field(ge=0)
    iter_time: list[float]
    iter_energy: list[float]
    time_breakdown: dict[str, list[list[float]]] = {}
    energy_breakdown: dict[str, list[list[float]]] = {}

OfflineProfilingResult

Bases: BaseModel

Profiling results generated from offline profiling each instruction.

Attributes:

Name Type Description
rank int

Global rank of the reporting client.

dp_rank int

Data parallel rank of the reporting process.

pp_rank int

Pipeline parallel rank of the reporting process.

tp_rank int

Tensor parallel rank of the reporting process.

forward_time dict[int, float]

Dict that maps frequency to average forward computation time.

forward_energy dict[int, float]

Dict that maps frequency to average forward computation energy.

backward_time dict[int, float]

Dict that maps frequency to average backward computation time.

backward_energy dict[int, float]

Dict that maps frequency to average backward computation energy.

Source code in zeus/optimizer/pipeline_frequency/common.py
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
class OfflineProfilingResult(BaseModel):
    """Profiling results generated from offline profiling each instruction.

    Attributes:
        rank: Global rank of the reporting client.
        dp_rank: Data parallel rank of the reporting process.
        pp_rank: Pipeline parallel rank of the reporting process.
        tp_rank: Tensor parallel rank of the reporting process.
        forward_time: Dict that maps frequency to average forward computation time.
        forward_energy: Dict that maps frequency to average forward computation energy.
        backward_time: Dict that maps frequency to average backward computation time.
        backward_energy: Dict that maps frequency to average backward computation energy.
    """

    rank: int = Field(ge=0)
    dp_rank: int = Field(ge=0)
    pp_rank: int = Field(ge=0)
    tp_rank: int = Field(ge=0)
    forward_time: dict[int, float]
    forward_energy: dict[int, float]
    backward_time: dict[int, float]
    backward_energy: dict[int, float]

InstructionProfilingResult

Bases: BaseModel

Time and energy profiling results for each instruction in each stage.

Source code in zeus/optimizer/pipeline_frequency/common.py
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
class InstructionProfilingResult(BaseModel):
    """Time and energy profiling results for each instruction in each stage."""

    __root__: list[OfflineProfilingResult]

    def to_csv(self, filepath: str) -> None:
        """Serialize and save this object into a CSV file.

        Columns: rank, dp_rank, pp_rank, tp_rank, stage, instruction, frequency, time, energy
        Notes
            - `rank` is the global rank of the process.
            - `pp_rank` and `stage` are always the same, for backwards compatibility.
            - All ranks and `stage` are zero-indexed.
            - `instruction` is either "forward" or "backward".
            - `time` and `energy` are already averaged over profiling iterations.
        """
        if not filepath.endswith(".csv"):
            raise ValueError("Filepath does not end with '.csv'")

        # fmt: off
        headers = ["rank", "dp_rank", "pp_rank", "tp_rank", "stage", "instruction", "frequency", "time", "energy"]
        records: list[tuple[int, int, int, int, int, str, int, float, float]] = []
        for result in self.__root__:
            # `stage` (last element) duplicates `pp_rank` for backwards compatibility.
            ranks = (result.rank, result.dp_rank, result.pp_rank, result.tp_rank, result.pp_rank)
            for freq, fwd_time in result.forward_time.items():
                records.append((*ranks, "forward", freq, fwd_time, result.forward_energy[freq]))
            for freq, bwd_time in result.backward_time.items():
                records.append((*ranks, "backward", freq, bwd_time, result.backward_energy[freq]))
        # fmt: on

        pd.DataFrame.from_records(records, columns=headers).to_csv(filepath, index=False)

to_csv

to_csv(filepath)

Serialize and save this object into a CSV file.

Columns: rank, dp_rank, pp_rank, tp_rank, stage, instruction, frequency, time, energy. Notes: rank is the global rank of the process; pp_rank and stage are always the same, for backwards compatibility; all ranks and stage are zero-indexed; instruction is either "forward" or "backward"; time and energy are already averaged over profiling iterations.

Source code in zeus/optimizer/pipeline_frequency/common.py
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
def to_csv(self, filepath: str) -> None:
    """Serialize and save this object into a CSV file.

    Columns: rank, dp_rank, pp_rank, tp_rank, stage, instruction, frequency, time, energy
    Notes
        - `rank` is the global rank of the process.
        - `pp_rank` and `stage` are always the same, for backwards compatibility.
        - All ranks and `stage` are zero-indexed.
        - `instruction` is either "forward" or "backward".
        - `time` and `energy` are already averaged over profiling iterations.
    """
    if not filepath.endswith(".csv"):
        raise ValueError("Filepath does not end with '.csv'")

    # fmt: off
    headers = ["rank", "dp_rank", "pp_rank", "tp_rank", "stage", "instruction", "frequency", "time", "energy"]
    records: list[tuple[int, int, int, int, int, str, int, float, float]] = []
    for result in self.__root__:
        # `stage` (last element) duplicates `pp_rank` for backwards compatibility.
        ranks = (result.rank, result.dp_rank, result.pp_rank, result.tp_rank, result.pp_rank)
        for freq, fwd_time in result.forward_time.items():
            records.append((*ranks, "forward", freq, fwd_time, result.forward_energy[freq]))
        for freq, bwd_time in result.backward_time.items():
            records.append((*ranks, "backward", freq, bwd_time, result.backward_energy[freq]))
    # fmt: on

    pd.DataFrame.from_records(records, columns=headers).to_csv(filepath, index=False)

save_prof async

save_prof(data, directory, schedule_num)

Save a list of ProfilingResults in the designated directory.

Source code in zeus/optimizer/pipeline_frequency/common.py
245
246
247
248
249
250
251
252
253
254
async def save_prof(
    data: list[ProfilingResult],
    directory: str,
    schedule_num: int,
) -> None:
    """Save a list of `ProfilingResult`s in the designated directory."""
    # Create the directory on first use; subsequent calls are no-ops.
    os.makedirs(directory, exist_ok=True)
    serialized = _ProfilingResultList(__root__=data).json()
    async with aiofiles.open(f"{directory}/{schedule_num}.prof.json", "w") as f:
        await f.write(serialized)

load_prof

load_prof(directory, schedule_num)

Load a list of ProfilingResults saved in the designated directory.

Source code in zeus/optimizer/pipeline_frequency/common.py
257
258
259
260
def load_prof(directory: str, schedule_num: int) -> list[ProfilingResult]:
    """Load a list of `ProfilingResult`s saved in the designated directory."""
    # Counterpart of `save_prof`: parse the JSON dump back into models.
    return _ProfilingResultList.parse_file(
        f"{directory}/{schedule_num}.prof.json"
    ).__root__

save_sched async

save_sched(data, directory, schedule_num)

Save a list of FrequencySchedules in the designated directory.

Source code in zeus/optimizer/pipeline_frequency/common.py
263
264
265
266
267
268
269
270
271
272
async def save_sched(
    data: list[FrequencySchedule],
    directory: str,
    schedule_num: int,
) -> None:
    """Save a list of `FrequencySchedule`s in the designated directory."""
    # Create the directory on first use; subsequent calls are no-ops.
    os.makedirs(directory, exist_ok=True)
    serialized = _FrequencyScheduleList(__root__=data).json()
    async with aiofiles.open(f"{directory}/{schedule_num}.sched.json", "w") as f:
        await f.write(serialized)

load_sched

load_sched(directory, schedule_num)

Load a list of FrequencySchedules saved in the designated directory.

Source code in zeus/optimizer/pipeline_frequency/common.py
275
276
277
278
def load_sched(directory: str, schedule_num: int) -> list[FrequencySchedule]:
    """Load a list of `FrequencySchedule`s saved in the designated directory."""
    # Counterpart of `save_sched`: parse the JSON dump back into models.
    return _FrequencyScheduleList.parse_file(
        f"{directory}/{schedule_num}.sched.json"
    ).__root__

save_ranks async

save_ranks(data, directory)

Save a list of RankInfos in the designated directory.

Source code in zeus/optimizer/pipeline_frequency/common.py
281
282
283
284
285
286
async def save_ranks(data: list[RankInfo], directory: str) -> None:
    """Save a list of `RankInfo`s in the designated directory."""
    # Create the directory on first use; subsequent calls are no-ops.
    os.makedirs(directory, exist_ok=True)
    serialized = _RankInfoList(__root__=data).json()
    async with aiofiles.open(f"{directory}/ranks.json", "w") as f:
        await f.write(serialized)

load_ranks

load_ranks(directory)

Load a list of RankInfos saved in the designated directory.

Source code in zeus/optimizer/pipeline_frequency/common.py
289
290
291
292
def load_ranks(directory: str) -> list[RankInfo]:
    """Load a list of `RankInfo`s saved in the designated directory."""
    # Counterpart of `save_ranks`: parse the JSON dump back into models.
    return _RankInfoList.parse_file(f"{directory}/ranks.json").__root__