Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Fix auc calculation and add tests #197

Merged
merged 10 commits into from
Apr 26, 2021
Merged
Show file tree
Hide file tree
Changes from 4 commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
35 changes: 24 additions & 11 deletions tests/classification/test_auc.py
Original file line number Diff line number Diff line change
Expand Up @@ -32,19 +32,29 @@ def sk_auc(x, y):
return _sk_auc(x, y)


def sk_auc_reorder(x, y, reorder=True):
    """Reference AUC computed by ``_sk_auc`` on flattened inputs.

    Args:
        x: array of x-coordinates; flattened to 1d before use.
        y: array of y-coordinates; flattened to 1d before use.
        reorder: when ``True`` (the default, matching the previous behaviour)
            ``x`` is stably sorted in ascending order and the same permutation
            is applied to ``y`` before the area is computed. When ``False``
            the points are used in the order given.

    Returns:
        Whatever ``_sk_auc`` returns for the (optionally reordered) points.
    """
    x = x.flatten()
    y = y.flatten()
    if reorder:
        # a stable sort keeps the relative order of points sharing the same x
        idx = np.argsort(x, kind='stable')
        x = x[idx]
        y = y[idx]
    return _sk_auc(x, y)
Borda marked this conversation as resolved.
Show resolved Hide resolved
Borda marked this conversation as resolved.
Show resolved Hide resolved


Input = namedtuple('Input', ["x", "y"])

_examples = []
# generate already ordered samples, sorted in both directions
for i in range(4):
    x = np.random.randint(0, 5, (NUM_BATCHES * 8))
    y = np.random.randint(0, 5, (NUM_BATCHES * 8))
    idx = np.argsort(x, kind='stable')
    if i % 2 != 0:
        # odd iterations: descending order in x
        idx = idx[::-1]
    # apply the SAME permutation to x and y so the (x, y) pairs stay together;
    # previously the descending branch overwrote y with the reversed x values
    x = x[idx].reshape(NUM_BATCHES, 8)
    y = y[idx].reshape(NUM_BATCHES, 8)
    _examples.append(Input(x=tensor(x), y=tensor(y)))
# one small and one large batch size
# NOTE(review): 4049 presumably exercises the sort path for inputs above 2048 elements - confirm
for batch_size in (8, 4049):
    for i in range(4):
        x = np.random.rand(NUM_BATCHES * batch_size)
        y = np.random.rand(NUM_BATCHES * batch_size)
        idx = np.argsort(x, kind='stable')
        if i % 2 != 0:
            # odd iterations: descending order in x
            idx = idx[::-1]
        # apply the SAME permutation to x and y so the (x, y) pairs stay together;
        # previously the descending branch overwrote y with the reversed x values
        x = x[idx].reshape(NUM_BATCHES, batch_size)
        y = y[idx].reshape(NUM_BATCHES, batch_size)
        _examples.append(Input(x=tensor(x), y=tensor(y)))


@pytest.mark.parametrize("x, y", _examples)
Expand All @@ -62,8 +72,11 @@ def test_auc(self, x, y, ddp, dist_sync_on_step):
dist_sync_on_step=dist_sync_on_step,
)

def test_auc_functional(self, x, y):
    """Check the functional ``auc`` (called with ``reorder=False``) against ``sk_auc``."""
    functional_args = {"reorder": False}
    self.run_functional_metric_test(
        x,
        y,
        metric_functional=auc,
        sk_metric=sk_auc,
        metric_args=functional_args,
    )
@pytest.mark.parametrize("reorder", [True, False])
def test_auc_functional(self, x, y, reorder):
    """Check the functional ``auc`` against the reference for both ``reorder`` settings.

    The same ``reorder`` flag is forwarded to the metric under test (through
    ``metric_args``) and bound onto the ``sk_auc_reorder`` reference.
    """
    reference_metric = partial(sk_auc_reorder, reorder=reorder)
    functional_args = {"reorder": reorder}
    self.run_functional_metric_test(
        x,
        y,
        metric_functional=auc,
        sk_metric=reference_metric,
        metric_args=functional_args,
    )


@pytest.mark.parametrize(['x', 'y', 'expected'], [
Expand Down
4 changes: 1 addition & 3 deletions torchmetrics/functional/classification/auc.py
Original file line number Diff line number Diff line change
Expand Up @@ -16,8 +16,6 @@
import torch
from torch import Tensor

from torchmetrics.utilities.data import _stable_1d_sort


def _auc_update(x: Tensor, y: Tensor) -> Tuple[Tensor, Tensor]:
if x.ndim > 1 or y.ndim > 1:
Expand All @@ -35,7 +33,7 @@ def _auc_update(x: Tensor, y: Tensor) -> Tuple[Tensor, Tensor]:

def _auc_compute(x: Tensor, y: Tensor, reorder: bool = False) -> Tensor:
if reorder:
x, x_idx = _stable_1d_sort(x)
x, x_idx = torch.sort(x)
SkafteNicki marked this conversation as resolved.
Show resolved Hide resolved
SkafteNicki marked this conversation as resolved.
Show resolved Hide resolved
y = y[x_idx]

dx = x[1:] - x[:-1]
Expand Down
29 changes: 0 additions & 29 deletions torchmetrics/utilities/data.py
Original file line number Diff line number Diff line change
Expand Up @@ -151,35 +151,6 @@ def get_num_classes(
return num_classes


SkafteNicki marked this conversation as resolved.
Show resolved Hide resolved
def _stable_1d_sort(x: torch, nb: int = 2049):
"""
Stable sort of 1d tensors. Pytorch defaults to a stable sorting algorithm
if number of elements are larger than 2048. This function pads the tensors,
makes the sort and returns the sorted array (with the padding removed)
See this discussion: https://discuss.pytorch.org/t/is-torch-sort-stable/20714

Raises:
ValueError:
If dim of ``x`` is greater than 1 since stable sort works with only 1d tensors.

Example:
>>> data = torch.tensor([8, 7, 2, 6, 4, 5, 3, 1, 9, 0])
>>> _stable_1d_sort(data)
(tensor([0, 1, 2, 3, 4, 5, 6, 7, 8, 9]), tensor([9, 7, 2, 6, 4, 5, 3, 1, 0, 8]))
>>> _stable_1d_sort(data, nb=5)
(tensor([0, 1, 2, 3, 4]), tensor([9, 7, 2, 6, 4]))
"""
if x.ndim > 1:
raise ValueError('Stable sort only works on 1d tensors')
n = x.numel()
if n < nb:
x_max = x.max()
x = torch.cat([x, (x_max + 1) * torch.ones(nb - n, dtype=x.dtype, device=x.device)], 0)
x_sort = x.sort()
i = min(nb, n)
return x_sort.values[:i], x_sort.indices[:i]


def apply_to_collection(
data: Any,
dtype: Union[type, tuple],
Expand Down