config

`birdnet_stm32.training.config` ¶

Model configuration dataclass with JSON serialization and validation.

Replaces the raw dict config previously saved alongside checkpoints. Backward-compatible: legacy JSON files still load, because fields missing from the file fall back to their defaults and unknown keys are ignored.

`ModelConfig` `dataclass` ¶

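Model configuration for training, conversion, and deployment. Values are validated when an instance is created; the dataclass is not frozen, so reassigning a field afterwards is not re-validated.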

Attributes:

Name	Type	Description
`sample_rate`	`int`	Audio sample rate in Hz.
`num_mels`	`int`	Number of mel frequency bins.
`spec_width`	`int`	Spectrogram width in frames.
`fft_length`	`int`	FFT window size.
`chunk_duration`	`float`	Audio chunk duration in seconds.
`hop_length`	`int`	STFT hop length in samples.
`audio_frontend`	`str`	Frontend mode ('librosa', 'hybrid', 'raw', 'mfcc', 'log_mel').
`mag_scale`	`str`	Magnitude scaling ('pwl', 'pcen', 'db', 'none').
`embeddings_size`	`int`	Dense embedding dimension before classifier.
`alpha`	`float`	Width multiplier for channel counts.
`depth_multiplier`	`int`	Block repeat count per stage.
`num_classes`	`int`	Number of output classes.
`class_names`	`list[str]`	Ordered list of class label strings.
`frontend_trainable`	`bool`	Whether frontend weights are trainable.
`n_mfcc`	`int`	Number of MFCC coefficients (mfcc frontend only).
`use_se`	`bool`	Whether SE channel attention is enabled.
`se_reduction`	`int`	SE reduction factor.
`use_inverted_residual`	`bool`	Whether inverted residual blocks are used.
`expansion_factor`	`int`	Inverted residual expansion factor.
`use_attention_pooling`	`bool`	Whether attention pooling replaces GAP.
`dropout_rate`	`float`	Dropout rate before classifier head.

Source code in birdnet_stm32/training/config.py

@dataclass
class ModelConfig:
    """Model configuration for training, conversion, and deployment.

    Field values are validated once, in ``__post_init__``. The dataclass is
    not frozen, so reassigning a field afterwards bypasses validation; treat
    instances as read-only.

    Attributes:
        sample_rate: Audio sample rate in Hz.
        num_mels: Number of mel frequency bins.
        spec_width: Spectrogram width in frames.
        fft_length: FFT window size.
        chunk_duration: Audio chunk duration in seconds.
        hop_length: STFT hop length in samples.
        audio_frontend: Frontend mode ('librosa', 'hybrid', 'raw', 'mfcc', 'log_mel').
        mag_scale: Magnitude scaling ('pwl', 'pcen', 'db', 'none').
        embeddings_size: Dense embedding dimension before classifier.
        alpha: Width multiplier for channel counts.
        depth_multiplier: Block repeat count per stage.
        num_classes: Number of output classes.
        class_names: Ordered list of class label strings.
        frontend_trainable: Whether frontend weights are trainable.
        n_mfcc: Number of MFCC coefficients (mfcc frontend only).
        use_se: Whether SE channel attention is enabled.
        se_reduction: SE reduction factor.
        use_inverted_residual: Whether inverted residual blocks are used.
        expansion_factor: Inverted residual expansion factor.
        use_attention_pooling: Whether attention pooling replaces GAP.
        dropout_rate: Dropout rate before classifier head.
    """

    # Audio
    sample_rate: int = 24000
    num_mels: int = 64
    spec_width: int = 256
    fft_length: int = 512
    chunk_duration: float = 3.0
    hop_length: int = 281
    audio_frontend: str = "hybrid"
    mag_scale: str = "pwl"
    n_mfcc: int = 20

    # Model architecture
    embeddings_size: int = 256
    alpha: float = 1.0
    depth_multiplier: int = 1
    use_se: bool = True
    se_reduction: int = 8
    use_inverted_residual: bool = True
    expansion_factor: int = 2
    use_attention_pooling: bool = False
    dropout_rate: float = 0.5
    frontend_trainable: bool = False

    # Classes
    num_classes: int = 0
    class_names: list[str] = field(default_factory=list)

    # -- Validation ----------------------------------------------------------

    # Unannotated on purpose: without an annotation these stay plain class
    # attributes and are not turned into dataclass fields (so they are neither
    # constructor arguments nor part of ``asdict`` output).
    _VALID_FRONTENDS = frozenset({"librosa", "hybrid", "raw", "mfcc", "log_mel"})
    _VALID_MAG_SCALES = frozenset({"pwl", "pcen", "db", "none"})

    def __post_init__(self) -> None:
        """Validate field values after initialization.

        Checks run in the order written below and stop at the first failure.
        Fields without a check here (for example ``hop_length`` or
        ``n_mfcc``) are accepted as given.

        Raises:
            ValueError: If a checked field is out of range, names an unknown
                frontend or magnitude scale, or if a non-empty
                ``class_names`` has a length different from ``num_classes``.
        """
        if self.sample_rate <= 0:
            raise ValueError(f"sample_rate must be positive, got {self.sample_rate}")
        if self.num_mels <= 0:
            raise ValueError(f"num_mels must be positive, got {self.num_mels}")
        if self.spec_width <= 0:
            raise ValueError(f"spec_width must be positive, got {self.spec_width}")
        if self.fft_length <= 0:
            raise ValueError(f"fft_length must be positive, got {self.fft_length}")
        if self.chunk_duration <= 0:
            raise ValueError(f"chunk_duration must be positive, got {self.chunk_duration}")
        if self.audio_frontend not in self._VALID_FRONTENDS:
            raise ValueError(f"audio_frontend '{self.audio_frontend}' not in {sorted(self._VALID_FRONTENDS)}")
        if self.mag_scale not in self._VALID_MAG_SCALES:
            raise ValueError(f"mag_scale '{self.mag_scale}' not in {sorted(self._VALID_MAG_SCALES)}")
        if self.alpha <= 0:
            raise ValueError(f"alpha must be positive, got {self.alpha}")
        if self.depth_multiplier < 1:
            raise ValueError(f"depth_multiplier must be >= 1, got {self.depth_multiplier}")
        if not 0 <= self.dropout_rate < 1:
            raise ValueError(f"dropout_rate must be in [0, 1), got {self.dropout_rate}")
        if self.num_classes < 0:
            raise ValueError(f"num_classes must be >= 0, got {self.num_classes}")
        # An empty class_names list is allowed with any num_classes; the
        # lengths are only compared once names are actually supplied.
        if self.class_names and len(self.class_names) != self.num_classes:
            raise ValueError(f"class_names length ({len(self.class_names)}) != num_classes ({self.num_classes})")

    # -- Serialization -------------------------------------------------------

    def to_dict(self) -> dict:
        """Convert to a plain dict suitable for JSON serialization.

        Returns:
            A new dict with one entry per dataclass field.
        """
        return asdict(self)

    def save(self, path: str | Path) -> None:
        """Write config to a JSON file.

        Missing parent directories are created. The file is written as UTF-8
        regardless of the platform's default encoding.

        Args:
            path: Destination file path.
        """
        path = Path(path)
        path.parent.mkdir(parents=True, exist_ok=True)
        # Explicit encoding keeps save/load symmetric and locale-independent.
        path.write_text(json.dumps(self.to_dict(), indent=2) + "\n", encoding="utf-8")

    @classmethod
    def from_dict(cls, data: dict) -> ModelConfig:
        """Create a ModelConfig from a dict, ignoring unknown keys.

        Unknown keys are silently dropped so legacy configs still load.
        Keys that are absent fall back to the field defaults.

        Args:
            data: Dictionary of config values.

        Returns:
            Validated ModelConfig instance.

        Raises:
            ValueError: If the resulting values fail validation.
        """
        valid_keys = {f.name for f in cls.__dataclass_fields__.values()}
        filtered = {k: v for k, v in data.items() if k in valid_keys}
        return cls(**filtered)

    @classmethod
    def load(cls, path: str | Path) -> ModelConfig:
        """Load config from a JSON file.

        The file is decoded as UTF-8 regardless of the platform's default
        encoding, so configs containing non-ASCII class names load the same
        way everywhere.

        Args:
            path: Path to JSON config file.

        Returns:
            Validated ModelConfig instance.

        Raises:
            FileNotFoundError: If path does not exist.
            ValueError: If the file is not valid JSON
                (``json.JSONDecodeError``) or its values fail validation.
        """
        path = Path(path)
        data = json.loads(path.read_text(encoding="utf-8"))
        return cls.from_dict(data)

`__post_init__()` ¶

Validate field values after initialization.

Source code in birdnet_stm32/training/config.py

def __post_init__(self) -> None:
    """Reject out-of-range or unrecognised field values.

    Checks run in a fixed order; the first one that fails raises
    ``ValueError`` and later checks are not evaluated.
    """
    # The strictly-positive audio parameters share one message template.
    for attr in ("sample_rate", "num_mels", "spec_width", "fft_length", "chunk_duration"):
        current = getattr(self, attr)
        if current <= 0:
            raise ValueError(f"{attr} must be positive, got {current}")

    # Enumerated string options.
    frontend = self.audio_frontend
    if frontend not in self._VALID_FRONTENDS:
        allowed_frontends = sorted(self._VALID_FRONTENDS)
        raise ValueError(f"audio_frontend '{frontend}' not in {allowed_frontends}")
    scale = self.mag_scale
    if scale not in self._VALID_MAG_SCALES:
        allowed_scales = sorted(self._VALID_MAG_SCALES)
        raise ValueError(f"mag_scale '{scale}' not in {allowed_scales}")

    # Architecture hyper-parameters.
    width = self.alpha
    if width <= 0:
        raise ValueError(f"alpha must be positive, got {width}")
    repeats = self.depth_multiplier
    if repeats < 1:
        raise ValueError(f"depth_multiplier must be >= 1, got {repeats}")
    rate = self.dropout_rate
    in_unit_interval = 0 <= rate < 1
    if not in_unit_interval:
        raise ValueError(f"dropout_rate must be in [0, 1), got {rate}")

    # Class bookkeeping: lengths are compared only when names are supplied.
    expected = self.num_classes
    if expected < 0:
        raise ValueError(f"num_classes must be >= 0, got {expected}")
    names = self.class_names
    if names:
        supplied = len(names)
        if supplied != expected:
            raise ValueError(f"class_names length ({supplied}) != num_classes ({expected})")

`to_dict()` ¶

Convert to a plain dict suitable for JSON serialization.

Source code in birdnet_stm32/training/config.py

def to_dict(self) -> dict:
    """Return the configuration as a plain, JSON-serializable dict.

    Returns:
        A freshly built dict with one entry per dataclass field.
    """
    payload = asdict(self)
    return payload

`save(path)` ¶

Write config to a JSON file.

Parameters:

Name	Type	Description	Default
`path`	`str \| Path`	Destination file path.	required

Source code in birdnet_stm32/training/config.py

def save(self, path: str | Path) -> None:
    """Write config to a JSON file.

    Missing parent directories are created. The file is written as UTF-8
    regardless of the platform's default encoding, and ends with a newline.

    Args:
        path: Destination file path.
    """
    path = Path(path)
    path.parent.mkdir(parents=True, exist_ok=True)
    # Explicit encoding: without it the bytes on disk depend on the locale.
    path.write_text(json.dumps(self.to_dict(), indent=2) + "\n", encoding="utf-8")

`from_dict(data)` `classmethod` ¶

Create a ModelConfig from a dict, ignoring unknown keys.

Unknown keys are silently dropped so legacy configs still load.

Parameters:

Name	Type	Description	Default
`data`	`dict`	Dictionary of config values.	required

Returns:

Type	Description
`ModelConfig`	Validated ModelConfig instance.

Source code in birdnet_stm32/training/config.py

@classmethod
def from_dict(cls, data: dict) -> ModelConfig:
    """Build a ModelConfig from a mapping, keeping only recognised keys.

    Keys that do not name a dataclass field are discarded without warning,
    which lets configs written by older or newer versions still load.

    Args:
        data: Dictionary of config values.

    Returns:
        Validated ModelConfig instance.
    """
    # Collect the names the dataclass machinery registered for this class.
    known = set()
    for spec in cls.__dataclass_fields__.values():
        known.add(spec.name)

    # Forward only the recognised entries to the constructor.
    kwargs = {}
    for key, value in data.items():
        if key in known:
            kwargs[key] = value
    return cls(**kwargs)

`load(path)` `classmethod` ¶

Load config from a JSON file.

Parameters:

Name	Type	Description	Default
`path`	`str \| Path`	Path to JSON config file.	required

Returns:

Type	Description
`ModelConfig`	Validated ModelConfig instance.

Raises:

Type	Description
`FileNotFoundError`	If path does not exist.

Source code in birdnet_stm32/training/config.py

@classmethod
def load(cls, path: str | Path) -> ModelConfig:
    """Load config from a JSON file.

    The file is decoded as UTF-8 regardless of the platform's default
    encoding, so configs containing non-ASCII text load the same way
    everywhere.

    Args:
        path: Path to JSON config file.

    Returns:
        Validated ModelConfig instance.

    Raises:
        FileNotFoundError: If path does not exist.
        ValueError: If the file is not valid JSON (``json.JSONDecodeError``).
    """
    path = Path(path)
    # Explicit encoding: without it decoding depends on the locale.
    data = json.loads(path.read_text(encoding="utf-8"))
    return cls.from_dict(data)

config

birdnet_stm32.training.config ¶

ModelConfig dataclass ¶

__post_init__() ¶

to_dict() ¶

save(path) ¶

from_dict(data) classmethod ¶

load(path) classmethod ¶

`birdnet_stm32.training.config` ¶

`ModelConfig` `dataclass` ¶

`__post_init__()` ¶

`to_dict()` ¶

`save(path)` ¶

`from_dict(data)` `classmethod` ¶

`load(path)` `classmethod` ¶