Source code for cleanvision.utils.base_issue_manager

from abc import ABC, abstractmethod
from typing import Dict, Any

import pandas as pd

from cleanvision.dataset.base_dataset import Dataset


[docs]class IssueManager(ABC): """Base class for managing data issues of a particular type in Imagelab.""" visualization: str issue_name: str def __init__(self) -> None: self.info: Dict[str, Dict[str, Any]] = {"statistics": {}} self.issues: pd.DataFrame = pd.DataFrame() self.summary: pd.DataFrame = pd.DataFrame(columns=["issue_type"]) def __repr__(self) -> str: class_name = self.__class__.__name__ return class_name def __str__(self) -> str: class_name = self.__class__.__name__ return class_name
[docs] @staticmethod def check_params(**kwargs: Any) -> None: allowed_kwargs: Dict[str, Any] = { "params": Dict[str, Any], "dataset": Dataset, "imagelab_info": Dict[str, Any], "n_jobs": int, } for name, value in kwargs.items(): if name not in allowed_kwargs: raise ValueError(f"{name} is not a valid keyword argument.") if value is not None and not isinstance(value, allowed_kwargs[name]): raise ValueError( f"Valid type for keyword argument {name} can only be {allowed_kwargs[name]}. {name} cannot be type {type(name)}. " )
[docs] @abstractmethod def find_issues(self, **kwargs: Any) -> None: """Finds occurrences of this particular issue in the dataset.""" self.check_params(**kwargs) return
[docs] @abstractmethod def get_default_params(self) -> Dict[str, Any]: """Returns default params to be used by the issue_manager""" raise NotImplementedError
[docs] @abstractmethod def update_params(self, params: Dict[str, Any]) -> None: """Sets params for an issue manager. Default params will be overridden by user provided params""" raise NotImplementedError
@staticmethod def _compute_summary(issues_boolean: "pd.Series[bool]") -> Dict[str, int]: return {"num_images": issues_boolean.sum()}