ameerazam08
/

VOODOO3D-unofficial

Model card Files Files and versions Community

VOODOO3D-unofficial / additional_modules /deeplabv3 /encoder.py

ameerazam08

Upload folder using huggingface_hub

03da825 verified 9 months ago

raw

history blame contribute delete

9.49 kB

	from functools import partial
	from typing import Any, Callable, List, Optional, Type, Union

	import torch
	import torch.nn as nn
	from torch import Tensor


	def conv3x3(in_planes: int, out_planes: int, stride: int = 1, groups: int = 1, dilation: int = 1) -> nn.Conv2d:
	"""3x3 convolution with padding"""
	return nn.Conv2d(
	in_planes,
	out_planes,
	kernel_size=3,
	stride=stride,
	padding=dilation,
	groups=groups,
	bias=True,
	dilation=dilation,
	)


	def conv1x1(in_planes: int, out_planes: int, stride: int = 1) -> nn.Conv2d:
	"""1x1 convolution"""
	return nn.Conv2d(in_planes, out_planes, kernel_size=1, stride=stride, bias=True)


	class BasicBlock(nn.Module):
	expansion: int = 1

	def __init__(
	self,
	inplanes: int,
	planes: int,
	stride: int = 1,
	downsample: Optional[nn.Module] = None,
	groups: int = 1,
	base_width: int = 64,
	dilation: int = 1,
	norm_layer: Optional[Callable[..., nn.Module]] = None,
	) -> None:
	super().__init__()
	if norm_layer is None:
	norm_layer = nn.Identity
	if groups != 1 or base_width != 64:
	raise ValueError("BasicBlock only supports groups=1 and base_width=64")
	if dilation > 1:
	raise NotImplementedError("Dilation > 1 not supported in BasicBlock")
	# Both self.conv1 and self.downsample layers downsample the input when stride != 1
	self.conv1 = conv3x3(inplanes, planes, stride)
	self.bn1 = norm_layer(planes)
	self.relu = nn.ReLU(inplace=True)
	self.conv2 = conv3x3(planes, planes)
	self.bn2 = norm_layer(planes)
	self.downsample = downsample
	self.stride = stride

	def forward(self, x: Tensor) -> Tensor:
	identity = x

	out = self.conv1(x)
	out = self.bn1(out)
	out = self.relu(out)

	out = self.conv2(out)
	out = self.bn2(out)

	if self.downsample is not None:
	identity = self.downsample(x)

	out += identity
	out = self.relu(out)

	return out


	class Bottleneck(nn.Module):
	# Bottleneck in torchvision places the stride for downsampling at 3x3 convolution(self.conv2)
	# while original implementation places the stride at the first 1x1 convolution(self.conv1)
	# according to "Deep residual learning for image recognition" https://arxiv.org/abs/1512.03385.
	# This variant is also known as ResNet V1.5 and improves accuracy according to
	# https://ngc.nvidia.com/catalog/model-scripts/nvidia:resnet_50_v1_5_for_pytorch.

	expansion: int = 4

	def __init__(
	self,
	inplanes: int,
	planes: int,
	stride: int = 1,
	downsample: Optional[nn.Module] = None,
	groups: int = 1,
	base_width: int = 64,
	dilation: int = 1,
	norm_layer: Optional[Callable[..., nn.Module]] = None,
	) -> None:
	super().__init__()
	if norm_layer is None:
	norm_layer = nn.Identity()
	width = int(planes * (base_width / 64.0)) * groups
	# Both self.conv2 and self.downsample layers downsample the input when stride != 1
	self.conv1 = conv1x1(inplanes, width)
	self.bn1 = norm_layer(width)
	self.conv2 = conv3x3(width, width, stride, groups, dilation)
	self.bn2 = norm_layer(width)
	self.conv3 = conv1x1(width, planes * self.expansion)
	self.bn3 = norm_layer(planes * self.expansion)
	self.relu = nn.ReLU(inplace=True)
	self.downsample = downsample
	self.stride = stride

	def forward(self, x: Tensor) -> Tensor:
	identity = x

	out = self.conv1(x)
	out = self.bn1(out)
	out = self.relu(out)

	out = self.conv2(out)
	out = self.bn2(out)
	out = self.relu(out)

	out = self.conv3(out)
	out = self.bn3(out)

	if self.downsample is not None:
	identity = self.downsample(x)

	out += identity
	out = self.relu(out)

	return out


	class ResNet(nn.Module):
	def __init__(
	self,
	block: Type[Union[BasicBlock, Bottleneck]],
	layers: List[int],
	input_channels: int = 5,
	num_classes: int = 1000,
	zero_init_residual: bool = False,
	groups: int = 1,
	width_per_group: int = 64,
	replace_stride_with_dilation: Optional[List[bool]] = None,
	norm_layer: Optional[Callable[..., nn.Module]] = None,
	) -> None:
	super().__init__()
	if norm_layer is None:
	norm_layer = nn.Identity
	self._norm_layer = norm_layer

	self.inplanes = 64
	self.dilation = 1
	if replace_stride_with_dilation is None:
	# each element in the tuple indicates if we should replace
	# the 2x2 stride with a dilated convolution instead
	replace_stride_with_dilation = [False, False, False]
	if len(replace_stride_with_dilation) != 3:
	raise ValueError(
	"replace_stride_with_dilation should be None "
	f"or a 3-element tuple, got {replace_stride_with_dilation}"
	)
	self.groups = groups
	self.base_width = width_per_group
	self.conv1 = nn.Conv2d(input_channels, self.inplanes, kernel_size=7, stride=2, padding=3, bias=False)
	self.bn1 = norm_layer(self.inplanes)
	self.relu = nn.ReLU(inplace=True)
	self.maxpool = nn.MaxPool2d(kernel_size=3, stride=2, padding=1)
	self.layer1 = self._make_layer(block, 64, layers[0])
	self.layer2 = self._make_layer(block, 128, layers[1], stride=2, dilate=replace_stride_with_dilation[0])
	self.layer3 = self._make_layer(block, 256, layers[2], stride=2, dilate=replace_stride_with_dilation[1])
	self.layer4 = self._make_layer(block, 512, layers[3], stride=2, dilate=replace_stride_with_dilation[2])

	for m in self.modules():
	if isinstance(m, nn.Conv2d):
	nn.init.kaiming_normal_(m.weight, mode="fan_out", nonlinearity="relu")
	elif isinstance(m, (nn.BatchNorm2d, nn.GroupNorm)):
	nn.init.constant_(m.weight, 1)
	nn.init.constant_(m.bias, 0)

	def _make_layer(
	self,
	block: Type[Union[BasicBlock, Bottleneck]],
	planes: int,
	blocks: int,
	stride: int = 1,
	dilate: bool = False,
	) -> nn.Sequential:
	norm_layer = self._norm_layer
	downsample = None
	previous_dilation = self.dilation
	if dilate:
	self.dilation *= stride
	stride = 1
	if stride != 1 or self.inplanes != planes * block.expansion:
	downsample = nn.Sequential(
	conv1x1(self.inplanes, planes * block.expansion, stride),
	norm_layer(planes * block.expansion),
	)

	layers = []
	layers.append(
	block(
	self.inplanes, planes, stride, downsample, self.groups, self.base_width, previous_dilation, norm_layer
	)
	)
	self.inplanes = planes * block.expansion
	for _ in range(1, blocks):
	layers.append(
	block(
	self.inplanes,
	planes,
	groups=self.groups,
	base_width=self.base_width,
	dilation=self.dilation,
	norm_layer=norm_layer,
	)
	)

	return nn.Sequential(*layers)

	def _forward_impl(self, x: Tensor) -> Tensor:
	# See note [TorchScript super()]
	features = []

	# Stage 1
	features.append(x)

	# Stage 2
	x = self.conv1(x)
	x = self.bn1(x)
	x = self.relu(x)
	features.append(x)

	# Stage 3
	x = self.maxpool(x)
	x = self.layer1(x)
	features.append(x)

	# Stage 4
	x = self.layer2(x)
	features.append(x)

	# Stage 5
	x = self.layer3(x)
	features.append(x)

	# Stage 6
	x = self.layer4(x)
	features.append(x)

	return features[:4]

	def forward(self, x: Tensor) -> Tensor:
	return self._forward_impl(x)


	def _resnet(
	block: Type[Union[BasicBlock, Bottleneck]],
	layers: List[int],
	progress: bool,
	**kwargs: Any,
	) -> ResNet:

	model = ResNet(block, layers, **kwargs)

	return model


	def resnet34(, progress: bool = True, *kwargs: Any) -> ResNet:
	"""ResNet-34 from `Deep Residual Learning for Image Recognition <https://arxiv.org/abs/1512.03385>`__.

	Args:
	weights (:class:`~torchvision.models.ResNet34_Weights`, optional): The
	pretrained weights to use. See
	:class:`~torchvision.models.ResNet34_Weights` below for
	more details, and possible values. By default, no pre-trained
	weights are used.
	progress (bool, optional): If True, displays a progress bar of the
	download to stderr. Default is True.
	**kwargs: parameters passed to the ``torchvision.models.resnet.ResNet``
	base class. Please refer to the `source code
	<https://github.com/pytorch/vision/blob/main/torchvision/models/resnet.py>`_
	for more details about this class.

	.. autoclass:: torchvision.models.ResNet34_Weights
	:members:
	"""

	return _resnet(BasicBlock, [3, 4, 6, 3], progress, **kwargs)