| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123 |
- # LICENSE HEADER MANAGED BY add-license-header
- #
- # Copyright 2018 Kornia Team
- #
- # Licensed under the Apache License, Version 2.0 (the "License");
- # you may not use this file except in compliance with the License.
- # You may obtain a copy of the License at
- #
- # http://www.apache.org/licenses/LICENSE-2.0
- #
- # Unless required by applicable law or agreed to in writing, software
- # distributed under the License is distributed on an "AS IS" BASIS,
- # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- # See the License for the specific language governing permissions and
- # limitations under the License.
- #
- from __future__ import annotations
- from typing import Optional, Union
- from kornia.color.gray import grayscale_to_rgb
- from kornia.core import Tensor, tensor
- from kornia.core.external import PILImage as Image
- from kornia.models._hf_models import HFONNXComunnityModel
- __all__ = ["DepthEstimation"]
- class DepthEstimation(HFONNXComunnityModel):
- name: str = "depth_estimation"
- def __call__(self, images: Union[Tensor, list[Tensor]]) -> Union[Tensor, list[Tensor]]: # type: ignore[override]
- """Detect objects in a given list of images.
- Args:
- images: If list of RGB images. Each image is a Tensor with shape :math:`(3, H, W)`.
- If Tensor, a Tensor with shape :math:`(B, 3, H, W)`.
- Returns:
- list of detections found in each image. For item in a batch, shape is :math:`(D, 6)`, where :math:`D` is the
- number of detections in the given image, :math:`6` represents class id, score, and `xywh` bounding box.
- """
- if isinstance(
- images,
- (
- list,
- tuple,
- ),
- ):
- results = [super(DepthEstimation, self).__call__(image[None].cpu().numpy())[0] for image in images]
- results = [
- self.resize_back(tensor(result, device=image.device, dtype=image.dtype), image)
- for result, image in zip(results, images)
- ]
- return results
- result = super().__call__(images.cpu().numpy())[0]
- result = tensor(result, device=images.device, dtype=images.dtype)
- return self.resize_back(result, images)
- def visualize(
- self,
- images: Tensor,
- depth_maps: Optional[Union[Tensor, list[Tensor]]] = None,
- output_type: str = "torch",
- depth_type: str = "relative",
- max_depth: int = 80,
- ) -> Union[Tensor, list[Tensor], list[Image.Image]]: # type: ignore
- """Draw the segmentation results.
- Args:
- images: input tensor.
- depth_maps: estimated depths.
- output_type: type of the output.
- depth_type: 'metric' or 'relative' depth.
- max_depth: maximum depth value. Only valid for metric depth.
- Returns:
- output tensor.
- """
- if depth_maps is None:
- depth_maps = self(images)
- output = []
- for depth_map in depth_maps:
- if depth_type == "metric":
- depth_map = depth_map / max_depth
- elif depth_type == "relative":
- depth_map = depth_map / depth_map.max()
- else:
- raise ValueError(f"Unsupported depth type `{depth_type}`.")
- output.append(grayscale_to_rgb(depth_map))
- return self._tensor_to_type(output, output_type, is_batch=isinstance(images, Tensor))
- def save(
- self,
- images: Tensor,
- depth_maps: Optional[Union[Tensor, list[Tensor]]] = None,
- directory: Optional[str] = None,
- output_type: str = "torch",
- depth_type: str = "relative",
- max_depth: int = 80,
- ) -> None:
- """Save the segmentation results.
- Args:
- images: input tensor.
- depth_maps: estimated depths.
- output_type: type of the output.
- depth_type: 'metric' or 'relative' depth.
- max_depth: maximum depth value. Only valid for metric depth.
- directory: where to store outputs.
- Returns:
- output tensor.
- """
- outputs = self.visualize(images, depth_maps, output_type, depth_type=depth_type, max_depth=max_depth)
- self._save_outputs(images, directory, suffix="_src")
- self._save_outputs(outputs, directory, suffix="_depth")
|