
Commit bf8c4fd

Don't use type[T]; use Callable[..., T] (#1073)
It's much more type-safe.
2 parents ce8cedd + bbbf23f
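To illustrate the type-safety claim, here is a minimal sketch (not part of this commit; Base, Sub, and BaseFactory are made-up names). A type[T] annotation lets a checker approve constructor calls that subclasses can break, while Callable[..., T] or a Protocol states the real requirement: "something I can call to get a T".

from typing import Protocol


class Base:
    def __init__(self, scale: float = 1.0) -> None:
        self.scale = scale


class Sub(Base):
    # A subclass may change its __init__ freely; type[Base] says nothing about that.
    def __init__(self, scale: float, shift: float) -> None:
        super().__init__(scale)
        self.shift = shift


def build_from_type(cls: type[Base]) -> Base:
    return cls()  # checkers accept this for any subclass, but Sub() crashes


class BaseFactory(Protocol):
    # The actual requirement: a zero-argument callable that yields a Base.
    def __call__(self) -> Base: ...


def build_from_factory(factory: BaseFactory) -> Base:
    return factory()  # checkers verify this call against the protocol


try:
    build_from_type(Sub)  # passes the type checker, fails at runtime
except TypeError as err:
    print(f"type[Base] over-promised: {err}")

build_from_factory(Base)                   # the class itself qualifies
build_from_factory(lambda: Sub(1.0, 0.0))  # so does any adapter or partial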

File tree: 7 files changed, +46 -28 lines

ethicml/implementations/dro_modules/dro_loss.py (+6 -2)

@@ -1,6 +1,6 @@
 """DRO Loss."""
 
-from typing import Type
+from typing import Protocol
 from typing_extensions import override
 
 from torch import Tensor, nn
@@ -9,10 +9,14 @@
 __all__ = ["DROLoss"]
 
 
+class LossFactory(Protocol):
+    def __call__(self, *, reduction: str = "mean") -> _Loss: ...
+
+
 class DROLoss(nn.Module):
     """Fairness Without Demographics Loss."""
 
-    def __init__(self, loss_module: Type[_Loss] | None = None, eta: float = 0.5):
+    def __init__(self, loss_module: LossFactory | None = None, eta: float = 0.5):
         super().__init__()
         if loss_module is None:
             loss_module = NLLLoss

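What the new LossFactory protocol buys, sketched below. This is illustrative, not code from the commit: build_loss is hypothetical, and the import path is inferred from the file location. The keyword-only reduction call is checked against whatever is passed in, and plain loss classes as well as functools.partial objects satisfy it.

from functools import partial

from torch import nn
from torch.nn.modules.loss import _Loss

from ethicml.implementations.dro_modules.dro_loss import LossFactory


def build_loss(factory: LossFactory) -> _Loss:
    return factory(reduction="none")  # the protocol guarantees this keyword exists


build_loss(nn.NLLLoss)                                     # a loss class qualifies
build_loss(partial(nn.CrossEntropyLoss, ignore_index=-1))  # so does a configured partial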
ethicml/implementations/hgr_modules/facl/facl_hgr.py (+11 -7)

@@ -1,6 +1,6 @@
 """Independence of 2 variables."""
 
-from typing import Type
+from collections.abc import Callable
 
 import numpy as np
 import torch
@@ -9,7 +9,9 @@
 from .density_estimation import Kde
 
 
-def _joint_2(x: Tensor, y: Tensor, density: Type[Kde], damping: float = 1e-10) -> Tensor:
+def _joint_2(
+    x: Tensor, y: Tensor, density: Callable[[Tensor], Kde], damping: float = 1e-10
+) -> Tensor:
     x = (x - x.mean()) / x.std()
     y = (y - y.mean()) / y.std()
     data = torch.cat([x.unsqueeze(-1), y.unsqueeze(-1)], -1)
@@ -27,7 +29,7 @@ def _joint_2(x: Tensor, y: Tensor, density: Type[Kde], damping: float = 1e-10) -
     return h2d
 
 
-def hgr(x: Tensor, y: Tensor, density: Type[Kde], damping: float = 1e-10) -> Tensor:
+def hgr(x: Tensor, y: Tensor, density: Callable[[Tensor], Kde], damping: float = 1e-10) -> Tensor:
     """An estimator of the Hirschfeld-Gebelein-Renyi maximum correlation coefficient.
 
     This function is using Witsenhausen’s Characterization.
@@ -48,7 +50,7 @@ def hgr(x: Tensor, y: Tensor, density: Type[Kde], damping: float = 1e-10) -> Ten
     return torch.svd(Q)[1][1]
 
 
-def chi_2(x: Tensor, y: Tensor, density: Type[Kde], damping: float = 0) -> Tensor:
+def chi_2(x: Tensor, y: Tensor, density: Callable[[Tensor], Kde], damping: float = 0) -> Tensor:
     r"""The :math:`\chi^2` divergence between the joint distribution and the product of marginals.
 
     This is know to be the square of an upper-bound on the Hirschfeld-Gebelein-Renyi maximum
@@ -71,7 +73,9 @@ def chi_2(x: Tensor, y: Tensor, density: Type[Kde], damping: float = 0) -> Tenso
 # Independence of conditional variables
 
 
-def _joint_3(x: Tensor, y: Tensor, z: Tensor, density: Type[Kde], damping: float = 1e-10) -> Tensor:
+def _joint_3(
+    x: Tensor, y: Tensor, z: Tensor, density: Callable[[Tensor], Kde], damping: float = 1e-10
+) -> Tensor:
     x = (x - x.mean()) / x.std()
     y = (y - y.mean()) / y.std()
     z = (z - z.mean()) / z.std()
@@ -90,7 +94,7 @@ def _joint_3(x: Tensor, y: Tensor, z: Tensor, density: Type[Kde], damping: float
     return h3d
 
 
-def hgr_cond(x: Tensor, y: Tensor, z: Tensor, density: Type[Kde]) -> np.ndarray:
+def hgr_cond(x: Tensor, y: Tensor, z: Tensor, density: Callable[[Tensor], Kde]) -> np.ndarray:
    r"""An estimator of the function :math:`z\to HGR(x|z, y|z)`.
 
     Where HGR is the Hirschfeld-Gebelein-Renyi maximum correlation
@@ -113,7 +117,7 @@ def hgr_cond(x: Tensor, y: Tensor, z: Tensor, density: Type[Kde]) -> np.ndarray:
     return np.array([torch.svd(Q[:, :, i])[1][1] for i in range(Q.shape[2])])
 
 
-def chi_2_cond(x: Tensor, y: Tensor, z: Tensor, density: Type[Kde]) -> Tensor:
+def chi_2_cond(x: Tensor, y: Tensor, z: Tensor, density: Callable[[Tensor], Kde]) -> Tensor:
     r"""An estimator of the function :math:`z\to chi^2(x|z, y|z)`.
 
     Where :math:`\chi^2` is the :math:`\chi^2` divergence between the joint distribution on (x,y)

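A hedged sketch of a call site under the new signature, assuming (as the annotation suggests) that Kde is constructed from the data tensor; the clamped_kde adapter is hypothetical and the import paths are inferred from the file locations. Anything that maps a Tensor to a Kde now fits, not only the Kde class itself.

import torch

from ethicml.implementations.hgr_modules.density_estimation import Kde
from ethicml.implementations.hgr_modules.facl_hgr import hgr

x = torch.randn(256)
y = 0.8 * x + 0.2 * torch.randn(256)

# The Kde class itself is a valid Callable[[Tensor], Kde]:
score = hgr(x, y, density=Kde)


# A hypothetical adapter that preprocesses the data before estimation
# also satisfies the annotation, which Type[Kde] could not express:
def clamped_kde(data: torch.Tensor) -> Kde:
    return Kde(data.clamp(-3.0, 3.0))


score_clamped = hgr(x, y, density=clamped_kde)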
ethicml/implementations/hgr_modules/facl_hgr.py (+11 -7)

@@ -1,6 +1,6 @@
 """Independence of 2 variables."""
 
-from typing import Type
+from collections.abc import Callable
 
 import numpy as np
 import torch
@@ -9,7 +9,9 @@
 from .density_estimation import Kde
 
 
-def _joint_2(x: Tensor, y: Tensor, density: Type[Kde], damping: float = 1e-10) -> Tensor:
+def _joint_2(
+    x: Tensor, y: Tensor, density: Callable[[Tensor], Kde], damping: float = 1e-10
+) -> Tensor:
     x = (x - x.mean()) / x.std()
     y = (y - y.mean()) / y.std()
     data = torch.cat([x.unsqueeze(-1), y.unsqueeze(-1)], -1)
@@ -27,7 +29,7 @@ def _joint_2(x: Tensor, y: Tensor, density: Type[Kde], damping: float = 1e-10) -
     return h2d
 
 
-def hgr(x: Tensor, y: Tensor, density: Type[Kde], damping: float = 1e-10) -> Tensor:
+def hgr(x: Tensor, y: Tensor, density: Callable[[Tensor], Kde], damping: float = 1e-10) -> Tensor:
     """An estimator of the Hirschfeld-Gebelein-Renyi maximum correlation coefficient.
 
     This function is using Witsenhausen’s Characterization.
@@ -48,7 +50,7 @@ def hgr(x: Tensor, y: Tensor, density: Type[Kde], damping: float = 1e-10) -> Ten
     return torch.svd(Q)[1][1]
 
 
-def chi_2(x: Tensor, y: Tensor, density: Type[Kde], damping: float = 0) -> Tensor:
+def chi_2(x: Tensor, y: Tensor, density: Callable[[Tensor], Kde], damping: float = 0) -> Tensor:
     r"""The :math:`\chi^2` divergence between the joint distribution and the product of marginals.
 
     This is know to be the square of an upper-bound on the Hirschfeld-Gebelein-Renyi maximum
@@ -71,7 +73,9 @@ def chi_2(x: Tensor, y: Tensor, density: Type[Kde], damping: float = 0) -> Tenso
 # Independence of conditional variables
 
 
-def _joint_3(x: Tensor, y: Tensor, z: Tensor, density: Type[Kde], damping: float = 1e-10) -> Tensor:
+def _joint_3(
+    x: Tensor, y: Tensor, z: Tensor, density: Callable[[Tensor], Kde], damping: float = 1e-10
+) -> Tensor:
     x = (x - x.mean()) / x.std()
     y = (y - y.mean()) / y.std()
     z = (z - z.mean()) / z.std()
@@ -90,7 +94,7 @@ def _joint_3(x: Tensor, y: Tensor, z: Tensor, density: Type[Kde], damping: float
     return h3d
 
 
-def hgr_cond(x: Tensor, y: Tensor, z: Tensor, density: Type[Kde]) -> np.ndarray:
+def hgr_cond(x: Tensor, y: Tensor, z: Tensor, density: Callable[[Tensor], Kde]) -> np.ndarray:
     r"""An estimator of the function :math:`z\to HGR(x|z, y|z)`.
 
     Where HGR is the Hirschfeld-Gebelein-Renyi maximum correlation
@@ -113,7 +117,7 @@ def hgr_cond(x: Tensor, y: Tensor, z: Tensor, density: Type[Kde]) -> np.ndarray:
     return np.array([torch.svd(Q[:, :, i])[1][1] for i in range(Q.shape[2])])
 
 
-def chi_2_cond(x: Tensor, y: Tensor, z: Tensor, density: Type[Kde]) -> Tensor:
+def chi_2_cond(x: Tensor, y: Tensor, z: Tensor, density: Callable[[Tensor], Kde]) -> Tensor:
     r"""An estimator of the function :math:`z\to chi^2(x|z, y|z)`.
 
     Where :math:`\chi^2` is the :math:`\chi^2` divergence between the joint distribution on (x,y)

ethicml/run/cross_validator.py (+4 -3)

@@ -1,9 +1,10 @@
 """Cross Validation for any in process (at the moment) Algorithm."""
 
 from collections import defaultdict
+from collections.abc import Callable
 from itertools import product
 from statistics import mean
-from typing import Any, Mapping, NamedTuple, Sequence, Type
+from typing import Any, Mapping, NamedTuple, Sequence
 
 from ethicml.metrics.accuracy import Accuracy
 from ethicml.metrics.cv import AbsCV
@@ -55,7 +56,7 @@ class CVResults:
 
     """
 
-    def __init__(self, results: list[ResultTuple], model: type[InAlgorithm]):
+    def __init__(self, results: list[ResultTuple], model: Callable[..., InAlgorithm]):
        self.raw_storage = results
        self.model = model
        self.mean_storage = self._organize_and_compute_means()
@@ -195,7 +196,7 @@ class CrossValidator:
 
     def __init__(
         self,
-        model: Type[InAlgorithm],
+        model: Callable[..., InAlgorithm],
         hyperparams: Mapping[str, Sequence[Any]],
         folds: int = 3,
         max_parallel: int = 0,

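The practical effect for CrossValidator users, sketched under the assumption that EthicML re-exports LR, InAlgorithm, and CrossValidator at the top level (treat those names as assumptions): any callable that produces an InAlgorithm is now accepted, not just a bare class.

import ethicml as em

# A model class is one kind of Callable[..., InAlgorithm]:
cv = em.CrossValidator(em.LR, {"C": [0.01, 0.1, 1.0]}, folds=3)


# ...but a plain function works too, which type[InAlgorithm] forbade:
def lr_factory(**hyperparams: float) -> em.InAlgorithm:
    return em.LR(**hyperparams)


cv_wrapped = em.CrossValidator(lr_factory, {"C": [0.01, 0.1]}, folds=3)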
tests/data/dataset_modification_test.py (+6 -3)

@@ -1,6 +1,7 @@
 """Test modifications to a dataset."""
 
-from typing import Type, Union
+from collections.abc import Callable
+from typing import Union
 
 import pandas as pd
 import pytest
@@ -14,7 +15,8 @@
 @pytest.mark.parametrize("dataset_name", available_tabular())
 @pytest.mark.parametrize("scaler_type", [StandardScaler, MinMaxScaler])
 def test_scaling(
-    dataset_name: str, scaler_type: Union[Type[StandardScaler], Type[MinMaxScaler]]
+    dataset_name: str,
+    scaler_type: Union[Callable[[], StandardScaler], Callable[[], MinMaxScaler]],
 ) -> None:
     """Test that scaling works."""
     scaler = scaler_type()
@@ -42,7 +44,8 @@ def test_scaling(
 @pytest.mark.parametrize("dataset_name", available_tabular())
 @pytest.mark.parametrize("scaler_type", [StandardScaler, MinMaxScaler])
 def test_scaling_separate_test(
-    dataset_name: str, scaler_type: Union[Type[StandardScaler], Type[MinMaxScaler]]
+    dataset_name: str,
+    scaler_type: Union[Callable[[], StandardScaler], Callable[[], MinMaxScaler]],
 ) -> None:
     """Test that scaling works."""
     scaler = scaler_type()

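The same idea in miniature, as a standalone sketch (fit_fresh is hypothetical, not part of the test suite): sklearn's scaler classes already satisfy a zero-argument Callable, and so does a factory that pins configuration, which is exactly the flexibility Type[...] denied.

from collections.abc import Callable
from typing import Union

from sklearn.preprocessing import MinMaxScaler, StandardScaler

ScalerFactory = Union[Callable[[], StandardScaler], Callable[[], MinMaxScaler]]


def fit_fresh(
    factory: ScalerFactory, data: list[list[float]]
) -> Union[StandardScaler, MinMaxScaler]:
    scaler = factory()  # the only capability the tests rely on: a zero-arg call
    scaler.fit(data)
    return scaler


fit_fresh(StandardScaler, [[0.0], [1.0]])                               # class as factory
fit_fresh(lambda: MinMaxScaler(feature_range=(-1, 1)), [[0.0], [1.0]])  # configured factory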
tests/models_test/inprocess_test/cv_test.py (+5 -4)

@@ -1,6 +1,7 @@
 """Tests for cross validation."""
 
-from typing import Dict, List, NamedTuple, Sequence, Type, Union
+from collections.abc import Callable
+from typing import Dict, List, NamedTuple, Sequence, Union
 
 import numpy as np
 import pytest
@@ -14,7 +15,7 @@
 class CvParam(NamedTuple):
     """Specification of a unit test for cross validation."""
 
-    model: Type[InAlgorithm]
+    model: Callable[..., InAlgorithm]
     hyperparams: Dict[str, Union[Sequence[float], List[str], Sequence[KernelType]]]
     num_pos: int
 
@@ -32,7 +33,7 @@ class CvParam(NamedTuple):
 @pytest.mark.parametrize(("model", "hyperparams", "num_pos"), CV_PARAMS)
 def test_cv(
     toy_train_test: TrainTestPair,
-    model: Type[InAlgorithm],
+    model: Callable[..., InAlgorithm],
     hyperparams: Dict[str, Union[Sequence[float], List[str]]],
     num_pos: int,
 ) -> None:
@@ -53,7 +54,7 @@ def test_cv(
 @pytest.mark.parametrize(("model", "hyperparams", "num_pos"), CV_PARAMS)
 def test_parallel_cv(
     toy_train_test: TrainTestPair,
-    model: Type[InAlgorithm],
+    model: Callable[..., InAlgorithm],
     hyperparams: Dict[str, Union[Sequence[float], List[str]]],
     num_pos: int,
 ) -> None:

tests/models_test/inprocess_test/zafar_test.py (+3 -2)

@@ -3,7 +3,8 @@
 They are kept separate because they're very slow.
 """
 
-from typing import Dict, Generator, List, Type
+from collections.abc import Callable
+from typing import Dict, Generator, List
 
 import numpy as np
 import pytest
@@ -61,7 +62,7 @@ def test_zafar(toy_train_test: TrainTestPair) -> None:  # noqa: PLR0915
 
     hyperparams: Dict[str, List[float]] = {"gamma": [1, 1e-1, 1e-2]}
 
-    model_class: Type[InAlgorithm] = ZafarAccuracy
+    model_class: Callable[..., InAlgorithm] = ZafarAccuracy
     zafar_cv = CrossValidator(model_class, hyperparams, folds=3)
 
     assert zafar_cv is not None
