| 1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162636465666768697071727374757677787980818283848586878889 |
- # LICENSE HEADER MANAGED BY add-license-header
- #
- # Copyright 2018 Kornia Team
- #
- # Licensed under the Apache License, Version 2.0 (the "License");
- # you may not use this file except in compliance with the License.
- # You may obtain a copy of the License at
- #
- # http://www.apache.org/licenses/LICENSE-2.0
- #
- # Unless required by applicable law or agreed to in writing, software
- # distributed under the License is distributed on an "AS IS" BASIS,
- # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- # See the License for the specific language governing permissions and
- # limitations under the License.
- #
- from typing import Dict
- import torch
- from torch import nn
- from kornia.core.check import KORNIA_CHECK_SHAPE
- urls: Dict[str, str] = {}
- urls["lib"] = "https://github.com/yuruntian/SOSNet/raw/master/sosnet-weights/sosnet_32x32_liberty.pth"
- urls["hp_a"] = "https://github.com/yuruntian/SOSNet/raw/master/sosnet-weights/sosnet_32x32_hpatches_a.pth"
- class SOSNet(nn.Module):
- r"""128-dimensional SOSNet model definition for 32x32 patches.
- This is based on the original code from paper
- "SOSNet:Second Order Similarity Regularization for Local Descriptor Learning".
- Args:
- pretrained: Download and set pretrained weights to the model.
- Shape:
- - Input: :math:`(B, 1, 32, 32)`
- - Output: :math:`(B, 128)`
- Examples:
- >>> input = torch.rand(8, 1, 32, 32)
- >>> sosnet = SOSNet()
- >>> descs = sosnet(input) # 8x128
- """
- patch_size = 32
- def __init__(self, pretrained: bool = False) -> None:
- super().__init__()
- self.layers = nn.Sequential(
- nn.InstanceNorm2d(1, affine=False),
- nn.Conv2d(1, 32, kernel_size=3, padding=1, bias=False),
- nn.BatchNorm2d(32, affine=False),
- nn.ReLU(),
- nn.Conv2d(32, 32, kernel_size=3, padding=1, bias=False),
- nn.BatchNorm2d(32, affine=False),
- nn.ReLU(),
- nn.Conv2d(32, 64, kernel_size=3, stride=2, padding=1, bias=False),
- nn.BatchNorm2d(64, affine=False),
- nn.ReLU(),
- nn.Conv2d(64, 64, kernel_size=3, padding=1, bias=False),
- nn.BatchNorm2d(64, affine=False),
- nn.ReLU(),
- nn.Conv2d(64, 128, kernel_size=3, stride=2, padding=1, bias=False),
- nn.BatchNorm2d(128, affine=False),
- nn.ReLU(),
- nn.Conv2d(128, 128, kernel_size=3, padding=1, bias=False),
- nn.BatchNorm2d(128, affine=False),
- nn.ReLU(),
- nn.Dropout(0.1),
- nn.Conv2d(128, 128, kernel_size=8, bias=False),
- nn.BatchNorm2d(128, affine=False),
- )
- self.desc_norm = nn.Sequential(nn.LocalResponseNorm(256, alpha=256.0, beta=0.5, k=0.0))
- # load pretrained model
- if pretrained:
- pretrained_dict = torch.hub.load_state_dict_from_url(urls["lib"], map_location=torch.device("cpu"))
- self.load_state_dict(pretrained_dict, strict=True)
- self.eval()
- def forward(self, input: torch.Tensor, eps: float = 1e-10) -> torch.Tensor:
- KORNIA_CHECK_SHAPE(input, ["B", "1", "32", "32"])
- descr = self.desc_norm(self.layers(input) + eps)
- descr = descr.view(descr.size(0), -1)
- return descr
|