| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170 |
- # LICENSE HEADER MANAGED BY add-license-header
- #
- # Copyright 2018 Kornia Team
- #
- # Licensed under the Apache License, Version 2.0 (the "License");
- # you may not use this file except in compliance with the License.
- # You may obtain a copy of the License at
- #
- # http://www.apache.org/licenses/LICENSE-2.0
- #
- # Unless required by applicable law or agreed to in writing, software
- # distributed under the License is distributed on an "AS IS" BASIS,
- # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- # See the License for the specific language governing permissions and
- # limitations under the License.
- #
- from __future__ import annotations
- from typing import Optional
- import torch
- import torch.nn.functional as F
- from torch import nn
- from kornia.losses._utils import mask_ignore_pixels
- # based on:
- # https://github.com/kevinzakka/pytorch-goodies/blob/master/losses.py
- def tversky_loss(
- pred: torch.Tensor,
- target: torch.Tensor,
- alpha: float,
- beta: float,
- eps: float = 1e-8,
- ignore_index: Optional[int] = -100,
- ) -> torch.Tensor:
- r"""Criterion that computes Tversky Coefficient loss.
- According to :cite:`salehi2017tversky`, we compute the Tversky Coefficient as follows:
- .. math::
- \text{S}(P, G, \alpha; \beta) =
- \frac{|PG|}{|PG| + \alpha |P \setminus G| + \beta |G \setminus P|}
- Where:
- - :math:`P` and :math:`G` are the predicted and ground truth binary
- labels.
- - :math:`\alpha` and :math:`\beta` control the magnitude of the
- penalties for FPs and FNs, respectively.
- Note:
- - :math:`\alpha = \beta = 0.5` => dice coeff
- - :math:`\alpha = \beta = 1` => tanimoto coeff
- - :math:`\alpha + \beta = 1` => F beta coeff
- Args:
- pred: logits tensor with shape :math:`(N, C, H, W)` where C = number of classes.
- target: labels tensor with shape :math:`(N, H, W)` where each value
- is :math:`0 ≤ targets[i] ≤ C-1`.
- alpha: the first coefficient in the denominator.
- beta: the second coefficient in the denominator.
- eps: scalar for numerical stability.
- ignore_index: labels with this value are ignored in the loss computation.
- Return:
- the computed loss.
- Example:
- >>> N = 5 # num_classes
- >>> pred = torch.randn(1, N, 3, 5, requires_grad=True)
- >>> target = torch.empty(1, 3, 5, dtype=torch.long).random_(N)
- >>> output = tversky_loss(pred, target, alpha=0.5, beta=0.5)
- >>> output.backward()
- """
- if not isinstance(pred, torch.Tensor):
- raise TypeError(f"pred type is not a torch.Tensor. Got {type(pred)}")
- if not len(pred.shape) == 4:
- raise ValueError(f"Invalid pred shape, we expect BxNxHxW. Got: {pred.shape}")
- if not pred.shape[-2:] == target.shape[-2:]:
- raise ValueError(f"pred and target shapes must be the same. Got: {pred.shape} and {target.shape}")
- if not pred.device == target.device:
- raise ValueError(f"pred and target must be in the same device. Got: {pred.device} and {target.device}")
- # compute softmax over the classes axis
- pred_soft = F.softmax(pred, dim=1)
- target, target_mask = mask_ignore_pixels(target, ignore_index)
- p_true = pred_soft.gather(1, target.unsqueeze(1)) # (B,1,H,W)
- if target_mask is not None:
- m = target_mask.unsqueeze(1).to(dtype=pred.dtype)
- p_true = p_true * m
- total = m.sum((1, 2, 3))
- else:
- B, _, H, W = pred.shape
- total = torch.full((B,), H * W, dtype=pred.dtype, device=pred.device)
- intersection = p_true.sum((1, 2, 3))
- # denominator = intersection + (alpha + beta) * (total - intersection) + eps
- # instead of multiple ops, do it in one fused step:
- denominator = torch.addcmul(
- intersection, # base
- total - intersection, # tensor1
- torch.full_like(total, alpha + beta), # tensor2 (scalar as tensor)
- value=1.0, # (intersection) + 1 * (tensor1*tensor2)
- ).add_(eps) # in-place add eps
- score = intersection.div(denominator)
- return 1.0 - score.mean()
- class TverskyLoss(nn.Module):
- r"""Criterion that computes Tversky Coefficient loss.
- According to :cite:`salehi2017tversky`, we compute the Tversky Coefficient as follows:
- .. math::
- \text{S}(P, G, \alpha; \beta) =
- \frac{|PG|}{|PG| + \alpha |P \setminus G| + \beta |G \setminus P|}
- Where:
- - :math:`P` and :math:`G` are the predicted and ground truth binary
- labels.
- - :math:`\alpha` and :math:`\beta` control the magnitude of the
- penalties for FPs and FNs, respectively.
- Note:
- - :math:`\alpha = \beta = 0.5` => dice coeff
- - :math:`\alpha = \beta = 1` => tanimoto coeff
- - :math:`\alpha + \beta = 1` => F beta coeff
- Args:
- alpha: the first coefficient in the denominator.
- beta: the second coefficient in the denominator.
- eps: scalar for numerical stability.
- ignore_index: labels with this value are ignored in the loss computation.
- Shape:
- - Pred: :math:`(N, C, H, W)` where C = number of classes.
- - Target: :math:`(N, H, W)` where each value is
- :math:`0 ≤ targets[i] ≤ C-1`.
- Examples:
- >>> N = 5 # num_classes
- >>> criterion = TverskyLoss(alpha=0.5, beta=0.5)
- >>> pred = torch.randn(1, N, 3, 5, requires_grad=True)
- >>> target = torch.empty(1, 3, 5, dtype=torch.long).random_(N)
- >>> output = criterion(pred, target)
- >>> output.backward()
- """
- def __init__(self, alpha: float, beta: float, eps: float = 1e-8, ignore_index: Optional[int] = -100) -> None:
- super().__init__()
- self.alpha: float = alpha
- self.beta: float = beta
- self.eps: float = eps
- self.ignore_index: Optional[int] = ignore_index
- def forward(self, pred: torch.Tensor, target: torch.Tensor) -> torch.Tensor:
- return tversky_loss(pred, target, self.alpha, self.beta, self.eps, self.ignore_index)
|