| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152 |
- # Copyright The Lightning team.
- #
- # Licensed under the Apache License, Version 2.0 (the "License");
- # you may not use this file except in compliance with the License.
- # You may obtain a copy of the License at
- #
- # http://www.apache.org/licenses/LICENSE-2.0
- #
- # Unless required by applicable law or agreed to in writing, software
- # distributed under the License is distributed on an "AS IS" BASIS,
- # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- # See the License for the specific language governing permissions and
- # limitations under the License.
- import torch
- from torch import Tensor
- from typing_extensions import Literal
- from torchmetrics.functional.image.uqi import universal_image_quality_index
- from torchmetrics.utilities.distributed import reduce
- def _spectral_distortion_index_update(preds: Tensor, target: Tensor) -> tuple[Tensor, Tensor]:
- """Update and returns variables required to compute Spectral Distortion Index.
- Args:
- preds: Low resolution multispectral image
- target: High resolution fused image
- """
- if preds.dtype != target.dtype:
- raise TypeError(
- f"Expected `ms` and `fused` to have the same data type. Got ms: {preds.dtype} and fused: {target.dtype}."
- )
- if len(preds.shape) != 4:
- raise ValueError(
- f"Expected `preds` and `target` to have BxCxHxW shape. Got preds: {preds.shape} and target: {target.shape}."
- )
- if preds.shape[:2] != target.shape[:2]:
- raise ValueError(
- "Expected `preds` and `target` to have same batch and channel sizes."
- f"Got preds: {preds.shape} and target: {target.shape}."
- )
- return preds, target
- def _spectral_distortion_index_compute(
- preds: Tensor,
- target: Tensor,
- p: int = 1,
- reduction: Literal["elementwise_mean", "sum", "none"] = "elementwise_mean",
- ) -> Tensor:
- """Compute Spectral Distortion Index (SpectralDistortionIndex_).
- Args:
- preds: Low resolution multispectral image
- target: High resolution fused image
- p: a parameter to emphasize large spectral difference
- reduction: a method to reduce metric score over labels.
- - ``'elementwise_mean'``: takes the mean (default)
- - ``'sum'``: takes the sum
- - ``'none'``: no reduction will be applied
- Example:
- >>> from torch import rand
- >>> preds = rand([16, 3, 16, 16])
- >>> target = rand([16, 3, 16, 16])
- >>> preds, target = _spectral_distortion_index_update(preds, target)
- >>> _spectral_distortion_index_compute(preds, target)
- tensor(0.0234)
- """
- length = preds.shape[1]
- m1 = torch.zeros((length, length), device=preds.device)
- m2 = torch.zeros((length, length), device=preds.device)
- for k in range(length):
- num = length - (k + 1)
- if num == 0:
- continue
- stack1 = target[:, k : k + 1, :, :].repeat(num, 1, 1, 1)
- stack2 = torch.cat([target[:, r : r + 1, :, :] for r in range(k + 1, length)], dim=0)
- score = [
- s.mean() for s in universal_image_quality_index(stack1, stack2, reduction="none").split(preds.shape[0])
- ]
- m1[k, k + 1 :] = torch.stack(score, 0)
- stack1 = preds[:, k : k + 1, :, :].repeat(num, 1, 1, 1)
- stack2 = torch.cat([preds[:, r : r + 1, :, :] for r in range(k + 1, length)], dim=0)
- score = [
- s.mean() for s in universal_image_quality_index(stack1, stack2, reduction="none").split(preds.shape[0])
- ]
- m2[k, k + 1 :] = torch.stack(score, 0)
- m1 = m1 + m1.T
- m2 = m2 + m2.T
- diff = torch.pow(torch.abs(m1 - m2), p)
- # Special case: when number of channels (L) is 1, there will be only one element in M1 and M2. Hence no need to sum.
- if length == 1:
- output = torch.pow(diff, (1.0 / p))
- else:
- output = torch.pow(1.0 / (length * (length - 1)) * torch.sum(diff), (1.0 / p))
- return reduce(output, reduction)
- def spectral_distortion_index(
- preds: Tensor,
- target: Tensor,
- p: int = 1,
- reduction: Literal["elementwise_mean", "sum", "none"] = "elementwise_mean",
- ) -> Tensor:
- """Calculate `Spectral Distortion Index`_ (SpectralDistortionIndex_) also known as D_lambda.
- Metric is used to compare the spectral distortion between two images.
- Args:
- preds: Low resolution multispectral image
- target: High resolution fused image
- p: Large spectral differences
- reduction: a method to reduce metric score over labels.
- - ``'elementwise_mean'``: takes the mean (default)
- - ``'sum'``: takes the sum
- - ``'none'``: no reduction will be applied
- Return:
- Tensor with SpectralDistortionIndex score
- Raises:
- TypeError:
- If ``preds`` and ``target`` don't have the same data type.
- ValueError:
- If ``preds`` and ``target`` don't have ``BxCxHxW shape``.
- ValueError:
- If ``p`` is not a positive integer.
- Example:
- >>> from torch import rand
- >>> from torchmetrics.functional.image import spectral_distortion_index
- >>> preds = rand([16, 3, 16, 16])
- >>> target = rand([16, 3, 16, 16])
- >>> spectral_distortion_index(preds, target)
- tensor(0.0234)
- """
- if not isinstance(p, int) or p <= 0:
- raise ValueError(f"Expected `p` to be a positive integer. Got p: {p}.")
- preds, target = _spectral_distortion_index_update(preds, target)
- return _spectral_distortion_index_compute(preds, target, p, reduction)
|