Source code for opr.datasets.base

"""Base dataset implementation."""
from pathlib import Path
from typing import Any, Dict, List, Literal, Optional, Tuple, Union

import numpy as np
import pandas as pd
import torch
from loguru import logger
from pandas import DataFrame
from torch import Tensor
from torch.utils.data import Dataset

from opr.datasets.augmentations import (
    DefaultCloudSetTransform,
    DefaultCloudTransform,
    DefaultImageTransform,
    DefaultSemanticTransform,
)



[docs]
class BasePlaceRecognitionDataset(Dataset):
    """Base class for track-based Place Recognition dataset.

    The constructor reads ``<subset>.csv`` from ``dataset_root`` into ``dataset_df`` and
    precomputes, from the ``northing`` / ``easting`` columns, which elements are positives,
    negatives and non-negatives of each other. Subclasses are expected to implement
    ``__getitem__`` and ``collate_fn``.
    """

    # Root directory of the dataset (contains the per-subset csv files).
    dataset_root: Path
    # Name of the requested subset.
    subset: Literal["train", "val", "test"]
    # Content of the subset csv file (first csv column is used as the index).
    dataset_df: DataFrame
    # Names of the data sources to load, always stored as a tuple.
    data_to_load: Tuple[str, ...]

    def __init__(
        self,
        dataset_root: Union[str, Path],
        subset: Literal["train", "val", "test"],
        data_to_load: Union[str, Tuple[str, ...]],
        positive_threshold: float = 10.0,
        negative_threshold: float = 50.0,
        image_transform: Optional[Any] = None,
        semantic_transform: Optional[Any] = None,
        pointcloud_transform: Optional[Any] = None,
        pointcloud_set_transform: Optional[Any] = None,
    ) -> None:
        """Base class for track-based Place Recognition dataset.

        Args:
            dataset_root (Union[str, Path]): The path to the root directory of the dataset.
            subset (Literal["train", "val", "test"]): The subset of the dataset to load.
                If "test" is requested but there is no test.csv, val.csv is loaded instead.
            data_to_load (Union[str, Tuple[str, ...]]): The list of data sources to load.
                A single string is wrapped into a one-element tuple.
            positive_threshold (float): The maximum distance between two elements
                for them to be considered positive. Defaults to 10.0.
            negative_threshold (float): The maximum distance between two elements
                for them to be considered non-negative. Defaults to 50.0.
            image_transform (Any, optional): Images transform. If None, DefaultImageTransform
                is used. Defaults to None.
            semantic_transform (Any, optional): Semantic masks transform. If None,
                DefaultSemanticTransform is used. Defaults to None.
            pointcloud_transform (Any, optional): Point clouds transform. If None,
                DefaultCloudTransform is used. Defaults to None.
            pointcloud_set_transform (Any, optional): Point clouds set transform. If None,
                DefaultCloudSetTransform is used. Defaults to None.

        Raises:
            FileNotFoundError: If the dataset_root directory does not exist.
            ValueError: If an invalid subset is given.
            FileNotFoundError: If the csv file for the given subset does not exist.
            ValueError: If positive_threshold or negative_threshold is a negative number.
        """
        self.dataset_root = Path(dataset_root)
        if not self.dataset_root.exists():
            raise FileNotFoundError(f"Given dataset_root={self.dataset_root!r} doesn't exist")

        valid_subsets = ("train", "val", "test")
        if subset not in valid_subsets:
            raise ValueError(f"Invalid subset argument: {subset!r} not in {valid_subsets!r}")
        self.subset = subset

        subset_csv_path = self.dataset_root / f"{subset}.csv"
        if not subset_csv_path.exists() and subset == "test":
            # Only the "test" subset has a fallback: reuse the validation split.
            logger.warning(
                f"There is no test.csv file in given dataset_root={self.dataset_root!r}. "
                "Trying to load val.csv instead."
            )
            subset_csv_path = self.dataset_root / "val.csv"
        if not subset_csv_path.exists():
            raise FileNotFoundError(
                f"There is no {subset}.csv file in given dataset_root={self.dataset_root!r}. "
                "Consider checking documentation on how to preprocess the dataset."
            )
        self.dataset_df = pd.read_csv(subset_csv_path, index_col=0)

        # A bare string must not be split into characters by tuple().
        self.data_to_load = (data_to_load,) if isinstance(data_to_load, str) else tuple(data_to_load)

        if positive_threshold < 0.0:
            raise ValueError(f"positive_threshold must be non-negative, but {positive_threshold!r} given.")
        if negative_threshold < 0.0:
            raise ValueError(f"negative_threshold must be non-negative, but {negative_threshold!r} given.")

        # NOTE: each of the two builders computes the full pairwise distance matrix on its own.
        self._positives_mask, self._negatives_mask = self._build_masks(positive_threshold, negative_threshold)
        self._positives_index, self._nonnegative_index = self._build_indexes(
            positive_threshold, negative_threshold
        )

        # TODO: images and masks transforms should be performed simultaneously via Albumentations
        # Compare against None explicitly: a user-supplied transform may be falsy
        # (e.g. an empty container defining __len__) and must not be silently replaced.
        is_train = self.subset == "train"
        if image_transform is None:
            image_transform = DefaultImageTransform(train=is_train)
        if semantic_transform is None:
            semantic_transform = DefaultSemanticTransform(train=is_train)
        if pointcloud_transform is None:
            pointcloud_transform = DefaultCloudTransform(train=is_train)
        if pointcloud_set_transform is None:
            pointcloud_set_transform = DefaultCloudSetTransform(train=is_train)
        self.image_transform = image_transform
        self.semantic_transform = semantic_transform
        self.pointcloud_transform = pointcloud_transform
        self.pointcloud_set_transform = pointcloud_set_transform

    def __len__(self) -> int:
        """Return the number of rows in the subset dataframe."""
        return len(self.dataset_df)

    def __getitem__(self, idx: int) -> Dict[str, Tensor]:
        """Return the dataset element at ``idx``; must be implemented by subclasses."""
        raise NotImplementedError()

    def _pairwise_utm_distances(self) -> Tensor:
        """Compute the matrix of pairwise distances between all dataset elements.

        Returns:
            Tensor: Square float64 tensor where entry ``[i, j]`` is the Euclidean distance between
                the (northing, easting) coordinates of rows ``i`` and ``j`` of ``dataset_df``.
        """
        northing_easting = torch.tensor(
            self.dataset_df[["northing", "easting"]].to_numpy(dtype=np.float64), dtype=torch.float64
        )
        # The matmul-based shortcut of cdist loses precision for large coordinate values and may
        # report a non-zero distance from an element to itself, so the exact mode is requested.
        return torch.cdist(northing_easting, northing_easting, compute_mode="donot_use_mm_for_euclid_dist")

    @staticmethod
    def _positives_from_distances(distances: Tensor, positive_threshold: float) -> Tensor:
        """Return the boolean positives mask for a square pairwise distance matrix."""
        # The diagonal is masked out explicitly so an element is never its own positive,
        # regardless of floating point noise in the distance computation.
        off_diagonal = ~torch.eye(distances.shape[0], dtype=torch.bool, device=distances.device)
        return (distances > 0) & (distances < positive_threshold) & off_diagonal

    def _build_masks(self, positive_threshold: float, negative_threshold: float) -> Tuple[Tensor, Tensor]:
        """Build boolean masks for dataset elements that satisfy a UTM distance threshold condition.

        Args:
            positive_threshold (float): The maximum UTM distance between two elements
                for them to be considered positive.
            negative_threshold (float): The maximum UTM distance between two elements
                for them to be considered non-negative.

        Returns:
            Tuple[Tensor, Tensor]: Tuple (positives_mask, negatives_mask) of two square boolean masks.
                ``positives_mask[i, j]`` is True when ``j`` is another element whose distance to ``i``
                is strictly between 0 and ``positive_threshold``. ``negatives_mask[i, j]`` is True
                when the distance between ``i`` and ``j`` is strictly greater than
                ``negative_threshold``.
        """
        distances = self._pairwise_utm_distances()

        positives_mask = self._positives_from_distances(distances, positive_threshold)
        negatives_mask = distances > negative_threshold

        return positives_mask, negatives_mask

    def _build_indexes(
        self, positive_threshold: float, negative_threshold: float
    ) -> Tuple[List[Tensor], List[Tensor]]:
        """Build index of elements that satisfy a UTM distance threshold condition.

        Args:
            positive_threshold (float): The maximum UTM distance between two elements
                for them to be considered positive.
            negative_threshold (float): The maximum UTM distance between two elements
                for them to be considered non-negative.

        Returns:
            Tuple[List[Tensor], List[Tensor]]: Tuple (positive_indices, nonnegative_indices)
                of two lists with one 1-D index tensor per dataset element. Positive indices
                follow the same rule as the positives mask; non-negative indices are the elements
                whose distance is strictly less than ``negative_threshold``.
        """
        distances = self._pairwise_utm_distances()

        positives_mask = self._positives_from_distances(distances, positive_threshold)
        nonnegatives_mask = distances < negative_threshold

        # Convert the boolean masks to index tensors
        positive_indices = [torch.nonzero(row).squeeze(dim=-1) for row in positives_mask]
        nonnegative_indices = [torch.nonzero(row).squeeze(dim=-1) for row in nonnegatives_mask]

        return positive_indices, nonnegative_indices

    @property
    def positives_index(self) -> List[Tensor]:
        """List of indexes of positive samples for each element in the dataset."""
        return self._positives_index

    @property
    def nonnegative_index(self) -> List[Tensor]:
        """List of indexes of non-negatives samples for each element in the dataset."""
        return self._nonnegative_index

    @property
    def positives_mask(self) -> Tensor:
        """Boolean mask of positive samples for each element in the dataset."""
        return self._positives_mask

    @property
    def negatives_mask(self) -> Tensor:
        """Boolean mask of negative samples for each element in the dataset."""
        return self._negatives_mask

    def collate_fn(self, data_list: List[Dict[str, Tensor]]) -> Dict[str, Tensor]:
        """Collate function for torch.utils.data.DataLoader; must be implemented by subclasses."""
        raise NotImplementedError()