llmcompressor.pytorch.model_load.helpers

Functions:

  • get_completed_stages – Get the list of stages completed in a prior staged run
  • get_session_model – Get the model stored by the active CompressionSession
  • load_safetensors_state_dict – Load a safetensors file from disk
  • parse_dtype – Parse a torch.dtype from a string or dtype
  • save_checkpoint – Save a model, processor, and recipe
  • save_completed_stages – Save a list of completed stages to a checkpoint directory

get_completed_stages

get_completed_stages(checkpoint_dir: Any) -> List[str]

Given a checkpoint directory for a staged run, return the list of stages that completed in a prior run. An empty list is returned if checkpoint_dir is not a string or no stage file exists.

Parameters:

  • checkpoint_dir (Any) – path to staged checkpoint

Returns:

  • List[str] – list of completed stage names

Source code in llmcompressor/pytorch/model_load/helpers.py
def get_completed_stages(checkpoint_dir: Any) -> List[str]:
    """
    Given a checkpoint directory for a staged run, get the list of stages that
    have completed in a prior run if the checkpoint_dir is a string

    :param checkpoint_dir: path to staged checkpoint
    :return: list of completed stage names
    """
    if isinstance(checkpoint_dir, str):
        stage_path = os.path.join(checkpoint_dir, COMPLETED_STAGES_FILENAME)
        if os.path.exists(stage_path):
            with open(stage_path) as stage_file:
                stage_data = json.load(stage_file)
                return stage_data["completed"]

    return []
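
Example usage (a minimal sketch; the paths are illustrative): a missing stage file and a non-string input both yield an empty list.

from llmcompressor.pytorch.model_load.helpers import get_completed_stages

# A directory without a stage-tracking file yields an empty list,
# as does any non-string input such as None.
assert get_completed_stages("/tmp/nonexistent_ckpt") == []
assert get_completed_stages(None) == []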

get_session_model

get_session_model() -> Optional[Module]

Returns:

  • Optional[Module] – PyTorch module stored by the active CompressionSession, or None if no session is active

Source code in llmcompressor/pytorch/model_load/helpers.py
def get_session_model() -> Optional[Module]:
    """
    :return: pytorch module stored by the active CompressionSession,
        or None if no session is active
    """
    session = active_session()
    if not session:
        return None

    active_model = session.state.model
    return active_model
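
Example usage (a minimal sketch): check the return value for None before using it, since no session may be active.

from llmcompressor.pytorch.model_load.helpers import get_session_model

model = get_session_model()
if model is None:
    print("no active CompressionSession")
else:
    print(f"session model has {sum(p.numel() for p in model.parameters())} parameters")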

load_safetensors_state_dict

load_safetensors_state_dict(
    file_path: str,
) -> Dict[str, torch.Tensor]

Load a safetensors file from disk

Parameters:

  • file_path (str) – path to the safetensors file

Returns:

  • Dict[str, Tensor] – dictionary mapping tensor names to tensors loaded on CPU

Source code in llmcompressor/pytorch/model_load/helpers.py
def load_safetensors_state_dict(file_path: str) -> Dict[str, torch.Tensor]:
    """
    Load a safetensors file from disk

    :param file_path: path to the safetensors file
    :return: dictionary of safetensors data
    """
    with safe_open(file_path, framework="pt", device="cpu") as f:
        return {key: f.get_tensor(key) for key in f.keys()}
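
Example usage (a hedged sketch; the file name and tensor contents are illustrative, and save_file comes from the safetensors library rather than from this module):

import torch
from safetensors.torch import save_file

from llmcompressor.pytorch.model_load.helpers import load_safetensors_state_dict

# Write a tiny tensor dict to disk, then load it back onto CPU.
save_file({"layer.weight": torch.ones(2, 2)}, "tiny.safetensors")
state_dict = load_safetensors_state_dict("tiny.safetensors")
assert torch.equal(state_dict["layer.weight"], torch.ones(2, 2))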

parse_dtype

parse_dtype(dtype_arg: Union[str, dtype]) -> torch.dtype

Parameters:

  • dtype_arg (Union[str, dtype]) – dtype or string to parse

Returns:

  • dtype – torch.dtype parsed from the input, or the string "auto" (defer to the model's own precision) if the value is not recognized

Source code in llmcompressor/pytorch/model_load/helpers.py
def parse_dtype(dtype_arg: Union[str, torch.dtype]) -> torch.dtype:
    """
    :param dtype_arg: dtype or string to parse
    :return: torch.dtype parsed from input string
    """
    dtype_arg = str(dtype_arg)
    dtype = "auto"  # get precision from model by default
    if dtype_arg in ("half", "float16", "torch.float16"):
        dtype = torch.float16
    elif dtype_arg in ("torch.bfloat16", "bfloat16"):
        dtype = torch.bfloat16
    elif dtype_arg in ("full", "float32", "torch.float32"):
        dtype = torch.float32

    return dtype
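
Example usage (a minimal sketch of the accepted spellings, based on the source above):

import torch

from llmcompressor.pytorch.model_load.helpers import parse_dtype

assert parse_dtype("half") is torch.float16
assert parse_dtype("bfloat16") is torch.bfloat16
assert parse_dtype(torch.float32) is torch.float32  # str(torch.float32) == "torch.float32"
assert parse_dtype("anything_else") == "auto"       # fallback: use the model's own precision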

save_checkpoint

save_checkpoint(
    save_path: str,
    model: PreTrainedModel,
    processor: Optional[Processor] = None,
    save_safetensors: bool = True,
    save_compressed: bool = True,
    skip_sparsity_compression_stats: bool = False,
)

Save a model, processor, and recipe

Parameters:

  • save_path (str) – Path used to save model and processor

  • model (PreTrainedModel) – model to save

  • processor (Optional[Processor], default: None) – processor to save

  • save_safetensors (bool, default: True) – save model checkpoint using safetensors file type

  • save_compressed (bool, default: True) – save model checkpoint using compressed-tensors format

  • skip_sparsity_compression_stats (bool, default: False) – skip computing sparsity statistics when compressing the model

Source code in llmcompressor/pytorch/model_load/helpers.py
def save_checkpoint(
    save_path: str,
    model: PreTrainedModel,
    processor: Optional[Processor] = None,
    save_safetensors: bool = True,
    save_compressed: bool = True,
    skip_sparsity_compression_stats: bool = False,
):
    """
    Save a model, processor, and recipe

    :param save_path: Path used to save model and processor
    :param model: model to save
    :param processor: processor to save
    :param save_safetensors: save model checkpoint using safetensors file type
    :param save_compressed: save model checkpoint using compressed-tensors format
    """
    from llmcompressor.transformers.sparsification.compressed_tensors_utils import (
        get_model_compressor,  # avoid circular import
    )

    # used for decompression
    # unfortunately, if skip_sparsity_compression_stats==False, sparsity stats
    # are computed twice. In the future, track sparsity from recipe or
    # share recipe between compression and decompression
    compressor = get_model_compressor(
        model=model,
        save_compressed=save_compressed,
        skip_sparsity_compression_stats=skip_sparsity_compression_stats,
    )

    # saving the model also saves the recipe
    model.save_pretrained(
        save_path,
        save_safetensors=save_safetensors,
        save_compressed=save_compressed,
        skip_sparsity_compression_stats=skip_sparsity_compression_stats,
    )
    if processor is not None:
        processor.save_pretrained(save_path)

    # decompression: saving the model modifies the model structure
    # as this is only a checkpoint, decompress model to enable future training/oneshot
    if compressor is not None:
        compressor.decompress_model(model)
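
Example usage (a hedged sketch; the model name and save path are illustrative, and passing a tokenizer as the processor assumes tokenizers satisfy the Processor type):

from transformers import AutoModelForCausalLM, AutoTokenizer

from llmcompressor.pytorch.model_load.helpers import save_checkpoint

model = AutoModelForCausalLM.from_pretrained("facebook/opt-125m")
tokenizer = AutoTokenizer.from_pretrained("facebook/opt-125m")

# Write an intermediate checkpoint; per the source above, the model is
# decompressed again afterwards so future training/oneshot can continue.
save_checkpoint(
    save_path="./staged_ckpt",
    model=model,
    processor=tokenizer,
    save_safetensors=True,
    save_compressed=True,
)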

save_completed_stages

save_completed_stages(
    checkpoint_dir: str, completed_stages: List[str]
)

Save a list of completed stages to a checkpoint directory

Parameters:

  • checkpoint_dir (str) – model checkpoint directory to save stages to

  • completed_stages (List[str]) – list of stage names that have been run

Source code in llmcompressor/pytorch/model_load/helpers.py
def save_completed_stages(checkpoint_dir: str, completed_stages: List[str]):
    """
    Save a list of completed stages to a checkpoint directory

    :param checkpoint_dir: model checkpoint directory to save stages to
    :param completed_stages: list of stage names that have been run
    """
    stage_path = os.path.join(checkpoint_dir, COMPLETED_STAGES_FILENAME)
    with open(stage_path, "w") as out_file:
        json.dump({"completed": completed_stages}, out_file)
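
Example usage (a minimal sketch; the stage names are illustrative, and the directory must already exist since the helper only writes the JSON file):

import os

from llmcompressor.pytorch.model_load.helpers import (
    get_completed_stages,
    save_completed_stages,
)

os.makedirs("./staged_ckpt", exist_ok=True)
save_completed_stages("./staged_ckpt", ["sparsity_stage", "quantization_stage"])

# A resumed run can read these back and skip the finished stages.
assert get_completed_stages("./staged_ckpt") == ["sparsity_stage", "quantization_stage"]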