
AutoDataset

AutoDataset #

Source code in focoos/data/auto_dataset.py
class AutoDataset:
    def __init__(
        self,
        dataset_name: str,
        task: Task,
        layout: DatasetLayout,
        datasets_dir: str = DATASETS_DIR,
    ):
        self.task = task
        self.layout = layout
        self.datasets_dir = datasets_dir
        self.dataset_name = dataset_name

        if self.layout is not DatasetLayout.CATALOG:
            dataset_path = os.path.join(self.datasets_dir, dataset_name)
        else:
            dataset_path = self.datasets_dir

        if dataset_path.endswith(".zip") or dataset_path.endswith(".gz"):
            # compressed path: datasets_root_dir/dataset_compressed/{dataset_name}.zip
            # _dest_path = os.path.join(self.datasets_root_dir, dataset_name.split(".")[0])
            assert not (self.layout == DatasetLayout.CATALOG and not is_inside_sagemaker()), (
                "Catalog layout does not support compressed datasets externally to Sagemaker."
            )
            if self.layout == DatasetLayout.CATALOG:
                dataset_path = extract_archive(dataset_path)
                logger.info(f"Extracted archive: {dataset_path}, {os.listdir(dataset_path)}")
            else:
                dataset_name = dataset_name.split(".")[0]
                _dest_path = os.path.join(self.datasets_dir, dataset_name)
                dataset_path = extract_archive(dataset_path, _dest_path)
                logger.info(f"Extracted archive: {dataset_path}, {os.listdir(dataset_path)}")

        self.dataset_path = str(dataset_path)
        self.dataset_name = dataset_name
        logger.info(
            f"🔄 Loading dataset {self.dataset_name}, 📁 Dataset Path: {self.dataset_path}, 🗂️ Dataset Layout: {self.layout}"
        )

    def _load_split(self, dataset_name: str, split: DatasetSplitType) -> DictDataset:
        if self.layout == DatasetLayout.CATALOG:
            return DictDataset.from_catalog(ds_name=dataset_name, split_type=split, root=self.dataset_path)
        else:
            ds_root = self.dataset_path
            if not check_folder_exists(ds_root):
                raise FileNotFoundError(f"Dataset {ds_root} not found")
            split_path = self._get_split_path(dataset_root=ds_root, split_type=split)
            if self.layout == DatasetLayout.ROBOFLOW_SEG:
                return DictDataset.from_roboflow_seg(ds_dir=split_path, task=self.task, split_type=split)
            elif self.layout == DatasetLayout.CLS_FOLDER:
                return DictDataset.from_folder(root_dir=split_path, split_type=split)
            elif self.layout == DatasetLayout.ROBOFLOW_COCO:
                return DictDataset.from_roboflow_coco(ds_dir=split_path, task=self.task, split_type=split)
            else:  # Focoos
                raise NotImplementedError(f"Dataset layout {self.layout} not implemented")

    def _load_mapper(
        self,
        augs: List[Union[A.Augmentation, T.Transform]],
        is_validation_split: bool,
        resolution: Optional[Union[int, Tuple[int, int]]] = None,
    ) -> DatasetMapper:
        if self.task == Task.SEMSEG:
            return SemanticDatasetMapper(
                image_format="RGB",
                ignore_label=255,
                augmentations=augs,
                is_train=not is_validation_split,
                resolution=resolution,
            )
        elif self.task == Task.DETECTION:
            return DetectionDatasetMapper(
                image_format="RGB",
                is_train=not is_validation_split,
                augmentations=augs,
                resolution=resolution,
            )
        elif self.task == Task.INSTANCE_SEGMENTATION:
            return DetectionDatasetMapper(
                image_format="RGB",
                is_train=not is_validation_split,
                augmentations=augs,
                use_instance_mask=True,
                resolution=resolution,
            )
        elif self.task == Task.CLASSIFICATION:
            return ClassificationDatasetMapper(
                image_format="RGB",
                is_train=not is_validation_split,
                augmentations=augs,
                resolution=resolution,
            )
        elif self.task == Task.KEYPOINT:
            return KeypointDatasetMapper(
                image_format="RGB",
                augmentations=augs,
                is_train=not is_validation_split,
                resolution=resolution,
                # keypoint_hflip_indices=np.array(keypoint_hflip_indices),
            )
        else:
            raise NotImplementedError(f"Task {self.task} not found in autodataset _load_mapper()")

    def _get_split_path(self, dataset_root: str, split_type: DatasetSplitType) -> str:
        if split_type == DatasetSplitType.TRAIN:
            possible_names = ["train", "training"]
            for name in possible_names:
                split_path = os.path.join(dataset_root, name)
                if check_folder_exists(split_path):
                    return split_path
            raise FileNotFoundError(f"Train split not found in {dataset_root}")
        elif split_type == DatasetSplitType.VAL:
            possible_names = ["valid", "val", "validation"]
            for name in possible_names:
                split_path = os.path.join(dataset_root, name)
                if check_folder_exists(split_path):
                    return split_path
            raise FileNotFoundError(f"Validation split not found in {dataset_root}")
        else:
            raise ValueError(f"Invalid split type: {split_type}")

    def get_split(
        self,
        augs: DatasetAugmentations,
        split: DatasetSplitType = DatasetSplitType.TRAIN,
    ) -> MapDataset:
        """
        Generate a dataset for a given dataset name with optional augmentations.

        Parameters:
            augs (DatasetAugmentations): Augmentations configuration.
                Resolution will be automatically extracted from this object.
            split (DatasetSplitType): Dataset split type (TRAIN or VAL).

        Returns:
            MapDataset: A DictDataset with DatasetMapper for training.
        """
        dict_split = self._load_split(dataset_name=self.dataset_name, split=split)
        assert dict_split.metadata.num_classes > 0, "Number of dataset classes must be greater than 0"

        # Extract resolution and augmentations from DatasetAugmentations
        resolution = augs.resolution
        augs_list = augs.get_augmentations()

        return MapDataset(
            dataset=dict_split,
            mapper=self._load_mapper(
                augs=augs_list,
                is_validation_split=(split == DatasetSplitType.VAL),
                resolution=resolution,
            ),
        )  # type: ignore
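
A minimal usage sketch (the dataset name is hypothetical, and the import paths for the Task, DatasetLayout and DatasetSplitType enums are assumptions; adjust them to your focoos installation):

from focoos.data.auto_dataset import AutoDataset
from focoos.data.default_aug import DatasetAugmentations
from focoos.ports import Task, DatasetLayout, DatasetSplitType  # assumed import location

# Hypothetical dataset folder: <DATASETS_DIR>/my-cars-detection/{train,valid}
auto_dataset = AutoDataset(
    dataset_name="my-cars-detection",
    task=Task.DETECTION,
    layout=DatasetLayout.ROBOFLOW_COCO,
)

train_augs = DatasetAugmentations(resolution=640, horizontal_flip=0.5, color_augmentation=0.3)
train_split = auto_dataset.get_split(augs=train_augs, split=DatasetSplitType.TRAIN)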

get_split(augs, split=DatasetSplitType.TRAIN) #

Generate a dataset for a given dataset name with optional augmentations.

Parameters:

augs (DatasetAugmentations): Augmentations configuration. Resolution will be automatically extracted from this object. Required.

split (DatasetSplitType): Dataset split type (TRAIN or VAL). Default: TRAIN.

Returns:

MapDataset: A DictDataset with DatasetMapper for training.

Source code in focoos/data/auto_dataset.py
def get_split(
    self,
    augs: DatasetAugmentations,
    split: DatasetSplitType = DatasetSplitType.TRAIN,
) -> MapDataset:
    """
    Generate a dataset for a given dataset name with optional augmentations.

    Parameters:
        augs (DatasetAugmentations): Augmentations configuration.
            Resolution will be automatically extracted from this object.
        split (DatasetSplitType): Dataset split type (TRAIN or VAL).

    Returns:
        MapDataset: A DictDataset with DatasetMapper for training.
    """
    dict_split = self._load_split(dataset_name=self.dataset_name, split=split)
    assert dict_split.metadata.num_classes > 0, "Number of dataset classes must be greater than 0"

    # Extract resolution and augmentations from DatasetAugmentations
    resolution = augs.resolution
    augs_list = augs.get_augmentations()

    return MapDataset(
        dataset=dict_split,
        mapper=self._load_mapper(
            augs=augs_list,
            is_validation_split=(split == DatasetSplitType.VAL),
            resolution=resolution,
        ),
    )  # type: ignore
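
For validation, the same call is typically made with split=DatasetSplitType.VAL and an augmentation configuration that only resizes (a sketch, reusing the auto_dataset object from the example above):

val_augs = DatasetAugmentations(resolution=640)  # deterministic resize, no random augmentations
valid_split = auto_dataset.get_split(augs=val_augs, split=DatasetSplitType.VAL)
# valid_split is a MapDataset; each item is a mapped sample ready for a DataLoader.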

DatasetAugmentations dataclass #

Configuration class for dataset augmentations.

This class defines parameters for various image transformations used in training and validation pipelines for computer vision tasks. It provides a comprehensive set of options for both color and geometric augmentations.

Attributes:

resolution (Union[int, Tuple[int, int]]): Target image size for resizing operations. If int, treated as square (size, size). If tuple, treated as (height, width). Range [256, 1024] for int. Default: 640.

color_augmentation (float): Strength of color augmentations. Range [0, 1]. Default: 0.0.

horizontal_flip (float): Probability of applying horizontal flip. Range [0, 1]. Default: 0.0.

vertical_flip (float): Probability of applying vertical flip. Range [0, 1]. Default: 0.0.

zoom_out (float): Probability of applying RandomZoomOut. Range [0, 1]. Default: 0.0.

zoom_out_side (float): Upper bound of the zoom-out side range. Range [1, 5]. Default: 4.0.

rotation (float): Rotation strength for RandomRotation; the angle is sampled in (-rotation * 180, rotation * 180) degrees. Range [0, 1]. Default: 0.0.

square (float): Probability of resizing the image to a square of the target resolution. Range [0, 1]. Default: 0.0.

aspect_ratio (float): Strength of RandomAspectRatio (only applied when square is 0). Range [0, 1]. Default: 0.0.

scale_ratio (float): Scale factor for resizing (the actual scale range is (2 ** -scale_ratio, 2 ** scale_ratio)). Range [0, 1]. Default: 0.0.

max_size (int): Maximum allowed dimension after resizing. Range [256, sys.maxsize]. Default: 4096.

crop (bool): Whether to apply RandomCrop. Default: False.

crop_size (Optional[int]): Crop size for RandomCrop; if None, the target resolution is used. Default: None.
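
For example, a typical split between training-time and validation-time configurations might look like this (values are illustrative):

train_augs = DatasetAugmentations(
    resolution=640,
    color_augmentation=0.5,   # moderate photometric jitter
    horizontal_flip=0.5,
    zoom_out=0.3,
    scale_ratio=0.25,         # shortest edge sampled in roughly [538, 761] for resolution 640
    crop=True,                # random 640x640 crops (crop_size defaults to the resolution)
)
val_augs = DatasetAugmentations(resolution=640)  # resize only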

Source code in focoos/data/default_aug.py
@dataclass
class DatasetAugmentations:
    """
    Configuration class for dataset augmentations.

    This class defines parameters for various image transformations used in training and validation
    pipelines for computer vision tasks. It provides a comprehensive set of options for both
    color and geometric augmentations.

    Attributes:
        resolution (Union[int, Tuple[int, int]]): Target image size for resizing operations.
            If int, treated as square (size, size). If tuple, treated as (height, width).
            Range [256, 1024] for int. Default: 640.
        ==
        color_augmentation (float): Strength of color augmentations.
            Range [0,1]. Default: 0.0.
        ==
        horizontal_flip (float): Probability of applying horizontal flip.
            Range [0,1]. Default: 0.0.
        vertical_flip (float): Probability of applying vertical flip.
            Range [0,1]. Default: 0.0.
        zoom_out (float): Probability of applying RandomZoomOut.
            Range [0,1]. Default: 0.0.
        zoom_out_side (float): Zoom out side range.
            Range [1,5]. Default: 4.0.
        rotation (float): Rotation strength for RandomRotation; the angle is sampled in
            (-rotation * 180, rotation * 180) degrees. Range [0,1]. Default: 0.0.
        ==
        square (float): Probability of resizing the image to a square of the target resolution.
            Range [0,1]. Default: 0.0.
        aspect_ratio (float): Strength of RandomAspectRatio (only applied when square is 0).
            Range [0,1]. Default: 0.0.
        scale_ratio (float): Scale factor for resizing (actual scale range is (2 ** -scale_ratio, 2 ** scale_ratio)).
            Range [0,1]. Default: 0.0.
        max_size (int): Maximum allowed dimension after resizing.
            Range [256, sys.maxsize]. Default: 4096.
        ==
        crop (bool): Whether to apply RandomCrop.
            Default: False.
        crop_size (Optional[int]): Crop size for RandomCrop; if None, the target resolution is used.
            Default: None.
    """

    # Resolution for resizing
    resolution: Union[int, Tuple[int, int]] = 640

    # Color augmentation parameters
    color_augmentation: float = 0.0
    color_base_brightness: int = 32
    color_base_saturation: float = 0.5
    color_base_contrast: float = 0.5
    color_base_hue: float = 18
    # blur: float = 0.0
    # noise: float = 0.0

    # Geometric augmentation
    horizontal_flip: float = 0.0
    vertical_flip: float = 0.0
    zoom_out: float = 0.0
    zoom_out_side: float = 4.0
    rotation: float = 0.0
    aspect_ratio: float = 0.0

    ## Rescaling
    square: float = 0.0
    scale_ratio: float = 0.0
    max_size: int = 4096

    # Cropping
    crop: bool = False
    crop_size: Optional[int] = None

    # TODO: Add more augmentations like:
    # - GaussianBlur
    # - RandomNoise
    # - RandomResizedCrop

    def override(self, args):
        if not isinstance(args, dict):
            args = vars(args)
        for key, value in args.items():
            if hasattr(self, key) and value is not None:
                setattr(self, key, value)
        return self

    def get_augmentations(self, img_format="RGB", task: Optional[Task] = None) -> List[T.Transform]:
        """Generate augmentation pipeline based on configuration."""
        augs = []
        self.max_size = self.max_size if self.max_size else sys.maxsize

        # Normalize resolution to tuple format for easier handling
        if isinstance(self.resolution, int):
            resolution_tuple = (self.resolution, self.resolution)
            resolution_value = self.resolution  # For scalar operations
        else:
            resolution_tuple = self.resolution
            resolution_value = min(self.resolution)  # Use min for scalar operations (shortest edge)

        ### Add color augmentation if configured
        if self.color_augmentation > 0:
            brightness_delta = int(self.color_base_brightness * self.color_augmentation)
            contrast_delta = self.color_base_contrast * self.color_augmentation
            saturation_delta = self.color_base_saturation * self.color_augmentation
            hue_delta = int(self.color_base_hue * self.color_augmentation)
            augs.append(
                T.ColorAugSSDTransform(
                    img_format=img_format,
                    brightness_delta=brightness_delta,
                    contrast_low=(1 - contrast_delta),
                    contrast_high=(1 + contrast_delta),
                    saturation_low=(1 - saturation_delta),
                    saturation_high=(1 + saturation_delta),
                    hue_delta=hue_delta,
                ),
            )

        ### Add geometric augmentations
        # Add flipping augmentations if configured
        if self.horizontal_flip > 0:
            augs.append(A.RandomFlip(prob=self.horizontal_flip, horizontal=True))
        if self.vertical_flip > 0:
            augs.append(A.RandomFlip(prob=self.vertical_flip, horizontal=False, vertical=True))

        # Add zoom out augmentations if configured
        if self.zoom_out > 0.0:
            seg_pad_value = 255 if task == Task.SEMSEG else 0
            augs.append(
                A.RandomApply(
                    A.RandomZoomOut(side_range=(1.0, self.zoom_out_side), pad_value=0, seg_pad_value=seg_pad_value),
                    prob=self.zoom_out,
                )
            )

        ### Add AspectRatio augmentations based on configuration
        if self.square > 0.0:
            augs.append(A.RandomApply(A.Resize(shape=resolution_tuple), prob=self.square))
        elif self.aspect_ratio > 0.0:
            augs.append(A.RandomAspectRatio(aspect_ratio=self.aspect_ratio))

        ### Add Resizing augmentations based on configuration
        # For non-square resolutions, use Resize directly to get exact dimensions
        # For square resolutions, use ResizeShortestEdge with scale augmentation
        is_non_square = isinstance(self.resolution, tuple) and self.resolution[0] != self.resolution[1]

        if is_non_square:
            # Non-square resolution: use direct Resize to get exact (height, width)
            # Note: scale_ratio is ignored for non-square resolutions
            augs.append(A.Resize(shape=resolution_tuple))
        else:
            # Square resolution: use ResizeShortestEdge with scale augmentation
            min_scale, max_scale = 2 ** (-self.scale_ratio), 2**self.scale_ratio
            augs.append(
                A.ResizeShortestEdge(
                    short_edge_length=[int(x * resolution_value) for x in [min_scale, max_scale]],
                    sample_style="range",
                    max_size=self.max_size,
                )
            )

        ### Add rotation augmentations if configured
        if self.rotation > 0:
            angle = self.rotation * 180
            augs.append(A.RandomRotation(angle=(-angle, angle), expand=False))

        # Add cropping if configured
        if self.crop:
            if self.crop_size:
                crop_range = (self.crop_size, self.crop_size)
            else:
                crop_range = resolution_tuple
            augs.append(A.RandomCrop(crop_type="absolute", crop_size=crop_range))

        return augs
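
A short sketch of how the dataclass is typically used together with override() and get_augmentations() (the override dict and the Task import location are illustrative):

from focoos.data.default_aug import DatasetAugmentations
from focoos.ports import Task  # assumed import location

augs = DatasetAugmentations(resolution=(512, 768), horizontal_flip=0.5, zoom_out=0.2)
# override() accepts a dict (or an argparse-style namespace) and applies only non-None values
augs = augs.override({"rotation": 0.1, "crop": None})  # crop stays False because the value is None
pipeline = augs.get_augmentations(img_format="RGB", task=Task.DETECTION)
# pipeline: horizontal flip, zoom-out, exact (512, 768) resize, then random rotation up to +/-18 degrees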

get_augmentations(img_format='RGB', task=None) #

Generate augmentation pipeline based on configuration.

Source code in focoos/data/default_aug.py
def get_augmentations(self, img_format="RGB", task: Optional[Task] = None) -> List[T.Transform]:
    """Generate augmentation pipeline based on configuration."""
    augs = []
    self.max_size = self.max_size if self.max_size else sys.maxsize

    # Normalize resolution to tuple format for easier handling
    if isinstance(self.resolution, int):
        resolution_tuple = (self.resolution, self.resolution)
        resolution_value = self.resolution  # For scalar operations
    else:
        resolution_tuple = self.resolution
        resolution_value = min(self.resolution)  # Use min for scalar operations (shortest edge)

    ### Add color augmentation if configured
    if self.color_augmentation > 0:
        brightness_delta = int(self.color_base_brightness * self.color_augmentation)
        contrast_delta = self.color_base_contrast * self.color_augmentation
        saturation_delta = self.color_base_saturation * self.color_augmentation
        hue_delta = int(self.color_base_hue * self.color_augmentation)
        augs.append(
            T.ColorAugSSDTransform(
                img_format=img_format,
                brightness_delta=brightness_delta,
                contrast_low=(1 - contrast_delta),
                contrast_high=(1 + contrast_delta),
                saturation_low=(1 - saturation_delta),
                saturation_high=(1 + saturation_delta),
                hue_delta=hue_delta,
            ),
        )

    ### Add geometric augmentations
    # Add flipping augmentations if configured
    if self.horizontal_flip > 0:
        augs.append(A.RandomFlip(prob=self.horizontal_flip, horizontal=True))
    if self.vertical_flip > 0:
        augs.append(A.RandomFlip(prob=self.vertical_flip, horizontal=False, vertical=True))

    # Add zoom out augmentations if configured
    if self.zoom_out > 0.0:
        seg_pad_value = 255 if task == Task.SEMSEG else 0
        augs.append(
            A.RandomApply(
                A.RandomZoomOut(side_range=(1.0, self.zoom_out_side), pad_value=0, seg_pad_value=seg_pad_value),
                prob=self.zoom_out,
            )
        )

    ### Add AspectRatio augmentations based on configuration
    if self.square > 0.0:
        augs.append(A.RandomApply(A.Resize(shape=resolution_tuple), prob=self.square))
    elif self.aspect_ratio > 0.0:
        augs.append(A.RandomAspectRatio(aspect_ratio=self.aspect_ratio))

    ### Add Resizing augmentations based on configuration
    # For non-square resolutions, use Resize directly to get exact dimensions
    # For square resolutions, use ResizeShortestEdge with scale augmentation
    is_non_square = isinstance(self.resolution, tuple) and self.resolution[0] != self.resolution[1]

    if is_non_square:
        # Non-square resolution: use direct Resize to get exact (height, width)
        # Note: scale_ratio is ignored for non-square resolutions
        augs.append(A.Resize(shape=resolution_tuple))
    else:
        # Square resolution: use ResizeShortestEdge with scale augmentation
        min_scale, max_scale = 2 ** (-self.scale_ratio), 2**self.scale_ratio
        augs.append(
            A.ResizeShortestEdge(
                short_edge_length=[int(x * resolution_value) for x in [min_scale, max_scale]],
                sample_style="range",
                max_size=self.max_size,
            )
        )

    ### Add rotation augmentations if configured
    if self.rotation > 0:
        angle = self.rotation * 180
        augs.append(A.RandomRotation(angle=(-angle, angle), expand=False))

    # Add cropping if configured
    if self.crop:
        if self.crop_size:
            crop_range = (self.crop_size, self.crop_size)
        else:
            crop_range = resolution_tuple
        augs.append(A.RandomCrop(crop_type="absolute", crop_size=crop_range))

    return augs
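
To make the ResizeShortestEdge branch concrete, here is the arithmetic for a square resolution with scale jitter (a sketch; the numbers are illustrative):

resolution = 640
scale_ratio = 0.5
min_scale, max_scale = 2 ** (-scale_ratio), 2 ** scale_ratio              # ~0.707, ~1.414
short_edge_length = [int(x * resolution) for x in (min_scale, max_scale)]  # [452, 905]
# ResizeShortestEdge samples a shortest-edge length uniformly in [452, 905]
# and rescales the image, capping the longer side at max_size.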