Source code for oumi.quantize.base

# Copyright 2025 - Oumi
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

"""Base quantization class and common utilities."""

from abc import ABC, abstractmethod
from dataclasses import dataclass, field
from typing import Any

from oumi.core.configs import QuantizationConfig


@dataclass
class QuantizationResult:
    """Outcome of a model quantization run.

    Attributes:
        quantized_size_bytes: Size of the quantized model in bytes.
        output_path: Path to the quantized model.
        quantization_method: Quantization method used.
        format_type: Format type of the quantized model.
        additional_info: Additional information about the quantization process.
    """

    quantized_size_bytes: int
    output_path: str
    quantization_method: str
    format_type: str
    additional_info: dict[str, Any] = field(default_factory=dict)
class BaseQuantization(ABC):
    """Abstract base class for all quantization methods.

    This class defines the common interface that all quantization
    implementations must follow, ensuring consistency across different
    quantization approaches.
    """

    # Subclasses should override these class attributes with the
    # methods/formats they actually support.
    supported_methods: list[str] = []
    supported_formats: list[str] = []

    @abstractmethod
    def quantize(self, config: QuantizationConfig) -> QuantizationResult:
        """Main quantization method - must be implemented by subclasses.

        Args:
            config: Quantization configuration containing model parameters,
                method, output path, and other settings.

        Returns:
            QuantizationResult containing:
            - quantized_size_bytes: Size of the quantized model in bytes
            - output_path: Path to the quantized model
            - quantization_method: Quantization method used
            - format_type: Format type of the quantized model
            - additional_info: Additional method-specific information

        Raises:
            RuntimeError: If quantization fails for any reason
            ValueError: If configuration is invalid for this quantizer
        """
        raise NotImplementedError("Subclasses must implement quantize method")

    @abstractmethod
    def raise_if_requirements_not_met(self) -> None:
        """Raise an error if the requirements are not met."""
        raise NotImplementedError(
            "Subclasses must implement raise_if_requirements_not_met method"
        )

    def get_supported_methods(self) -> list[str]:
        """Return list of quantization methods supported by this quantizer.

        Returns:
            List of method names (e.g., ["awq_q4_0", "awq_q8_0"])
        """
        # Copy so callers cannot mutate the class-level list.
        return self.supported_methods.copy()

    def get_supported_formats(self) -> list[str]:
        """Return list of output formats supported by this quantizer.

        Returns:
            List of format names (e.g., ["gguf", "pytorch"])
        """
        # Copy so callers cannot mutate the class-level list.
        return self.supported_formats.copy()

    def supports_method(self, method: str) -> bool:
        """Check if this quantizer supports the given method.

        Args:
            method: Quantization method name to check

        Returns:
            True if method is supported, False otherwise
        """
        return method in self.supported_methods

    def supports_format(self, format_name: str) -> bool:
        """Check if this quantizer supports the given output format.

        Args:
            format_name: Output format name to check

        Returns:
            True if format is supported, False otherwise
        """
        return format_name in self.supported_formats

    def validate_config(self, config: QuantizationConfig) -> None:
        """Validate configuration for this quantizer.

        Args:
            config: Quantization configuration to validate

        Raises:
            ValueError: If configuration is invalid for this quantizer
        """
        if not self.supports_method(config.method):
            # Fixed: original message was missing the space after the period
            # ("...not supported by ClassName.Supported methods: ..."); now
            # formatted consistently with the unsupported-format message below.
            raise ValueError(
                f"Method '{config.method}' not supported by "
                f"{self.__class__.__name__}. "
                f"Supported methods: {self.supported_methods}"
            )
        if not self.supports_format(config.output_format):
            raise ValueError(
                f"Format '{config.output_format}' not supported by "
                f"{self.__class__.__name__}. "
                f"Supported formats: {self.supported_formats}"
            )

    def validate_requirements(self) -> bool:
        """Check if all required dependencies are available.

        Returns:
            True if all dependencies are available and quantization can
            proceed, False otherwise.
        """
        try:
            self.raise_if_requirements_not_met()
            return True
        except Exception:
            # Best-effort probe: any failure simply means "not available".
            return False