Source code for sequifier.io.yaml

import numpy
import yaml

from sequifier.config.train_config import (
    DotDict,
    ModelSpecModel,
    TrainingSpecModel,
    TrainModel,
)



[docs]
def represent_sequifier_object(dumper, data):
    """
    Represents objects from 'sequifier.config.train_config' (like TrainModel,
    ModelSpecModel, TrainingSpecModel) as a simple YAML mapping,
    using the object's __dict__. This effectively removes the
    !!python/object tag and the explicit '__dict__:', '__fields_set__:' keys.
    """
    # We assume the object's __dict__ contains the attributes to be serialized.
    # If these objects are Pydantic models, using data.model_dump(mode='python')
    # would be more robust if available.
    return dumper.represent_dict(data.__dict__)




[docs]
def represent_dot_dict(dumper, data):
    """
    Represents DotDict objects as a simple YAML mapping.
    The original output showed a 'dictitems' attribute. If your DotDict
    is essentially a dictionary, this will work.
    """
    # If DotDict has a specific attribute like 'dictitems' that holds the actual dict:
    # return dumper.represent_dict(data.dictitems)
    # If DotDict is a subclass of dict or dict-like:
    return dumper.represent_dict(dict(data))




[docs]
def represent_numpy_float(dumper, data):
    """
    Represents numpy.float64 (and similar numpy floats) as standard YAML floats.
    """
    return dumper.represent_float(float(data))




[docs]
def represent_numpy_int(dumper, data):
    """
    Represents numpy.int64 (and similar numpy integers) as standard YAML integers.
    """
    return dumper.represent_int(int(data))




[docs]
class TrainModelDumper(yaml.Dumper):
    """A custom YAML dumper for TrainModel objects.

    This dumper extends the base yaml.Dumper to provide custom serialization
    for TrainModel and related objects, ensuring a clean and readable YAML
    output. It also modifies the indentation behavior for better formatting.
    """

    # You can add more customizations here if needed, like indent width.

[docs]
    def increase_indent(self, flow=False, indentless=False):
        """Increase the indentation level for the YAML output.

        This method overrides the default behavior to force indentation for all
        block-style collections, improving the readability of the output YAML.

        Args:
            flow: Whether the context is a flow-style collection.
            indentless: Whether the context is an indentless sequence.

        Returns:
            The result of the parent class's increase_indent method, with flow
            forced to False.
        """
        return super(TrainModelDumper, self).increase_indent(flow, False)




TrainModelDumper.add_representer(TrainModel, represent_sequifier_object)
TrainModelDumper.add_representer(ModelSpecModel, represent_sequifier_object)
TrainModelDumper.add_representer(TrainingSpecModel, represent_sequifier_object)
TrainModelDumper.add_representer(DotDict, represent_dot_dict)
TrainModelDumper.add_representer(numpy.float64, represent_numpy_float)
TrainModelDumper.add_representer(
    numpy.float32, represent_numpy_float
)  # Add for other numpy float types if necessary
TrainModelDumper.add_representer(numpy.int64, represent_numpy_int)
TrainModelDumper.add_representer(
    numpy.int32, represent_numpy_int
)  # Add for other numpy int types if necessary