""" Normalization layers and wrappers

Norm layer definitions that support fast norm and consistent channel arg order (always first arg).

Hacked together by / Copyright 2022 Ross Wightman
"""
import numbers
from typing import Tuple

import torch
import torch.nn as nn
import torch.nn.functional as F

from .fast_norm import is_fast_norm, fast_group_norm, fast_layer_norm, fast_rms_norm


class GroupNorm(nn.GroupNorm):
    def __init__(self, num_channels, num_groups=32, eps=1e-5, affine=True):
        # num_channels comes first (unlike nn.GroupNorm) to keep the consistent channel-first arg order
        super().__init__(num_groups, num_channels, eps=eps, affine=affine)
        self.fast_norm = is_fast_norm()

    def forward(self, x):
        if self.fast_norm:
            return fast_group_norm(x, self.num_groups, self.weight, self.bias, self.eps)
        else:
            return F.group_norm(x, self.num_groups, self.weight, self.bias, self.eps)
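

# Example (illustrative, not part of the module): because num_channels is the first positional
# arg, GroupNorm can be constructed from a channel count alone, the same way a BatchNorm-style
# layer would be.
#
#   norm = GroupNorm(64)                    # 64 channels, default 32 groups
#   y = norm(torch.randn(2, 64, 8, 8))      # y.shape == (2, 64, 8, 8)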


class GroupNorm1(nn.GroupNorm):
    """ Group Normalization with 1 group.
    Input: tensor in shape [B, C, *]
    """

    def __init__(self, num_channels, **kwargs):
        super().__init__(1, num_channels, **kwargs)
        self.fast_norm = is_fast_norm()

    def forward(self, x: torch.Tensor) -> torch.Tensor:
        if self.fast_norm:
            return fast_group_norm(x, self.num_groups, self.weight, self.bias, self.eps)
        else:
            return F.group_norm(x, self.num_groups, self.weight, self.bias, self.eps)
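

# Note (illustrative): with a single group the normalization statistics are computed over C and
# all spatial dims jointly for each sample, e.g.
#
#   y = GroupNorm1(32)(torch.randn(2, 32, 4, 4))   # stats reduced over dims (1, 2, 3)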


class LayerNorm(nn.LayerNorm):
    """ LayerNorm w/ fast norm option
    """
    def __init__(self, num_channels, eps=1e-6, affine=True):
        super().__init__(num_channels, eps=eps, elementwise_affine=affine)
        self._fast_norm = is_fast_norm()

    def forward(self, x: torch.Tensor) -> torch.Tensor:
        if self._fast_norm:
            x = fast_layer_norm(x, self.normalized_shape, self.weight, self.bias, self.eps)
        else:
            x = F.layer_norm(x, self.normalized_shape, self.weight, self.bias, self.eps)
        return x


class LayerNorm2d(nn.LayerNorm):
    """ LayerNorm for channels of '2D' spatial NCHW tensors """
    def __init__(self, num_channels, eps=1e-6, affine=True):
        super().__init__(num_channels, eps=eps, elementwise_affine=affine)
        self._fast_norm = is_fast_norm()

    def forward(self, x: torch.Tensor) -> torch.Tensor:
        # permute to NHWC so normalization runs over the channel dim, then permute back
        x = x.permute(0, 2, 3, 1)
        if self._fast_norm:
            x = fast_layer_norm(x, self.normalized_shape, self.weight, self.bias, self.eps)
        else:
            x = F.layer_norm(x, self.normalized_shape, self.weight, self.bias, self.eps)
        x = x.permute(0, 3, 1, 2)
        return x
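

# Example (illustrative, not part of the module): LayerNorm2d accepts NCHW input directly and
# normalizes each spatial position over its C channels.
#
#   norm = LayerNorm2d(64)
#   y = norm(torch.randn(2, 64, 7, 7))   # same shape out, per-position channel norm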


def _is_contiguous(tensor: torch.Tensor) -> bool:
    # the memory_format kwarg isn't usable under torchscript, so fall back to the default check
    if torch.jit.is_scripting():
        return tensor.is_contiguous()
    else:
        return tensor.is_contiguous(memory_format=torch.contiguous_format)


@torch.jit.script
def _layer_norm_cf(x: torch.Tensor, weight: torch.Tensor, bias: torch.Tensor, eps: float):
    # channels-first layer norm for NCHW tensors: normalize over dim 1 (C) w/ biased variance
    s, u = torch.var_mean(x, dim=1, unbiased=False, keepdim=True)
    x = (x - u) * torch.rsqrt(s + eps)
    x = x * weight[:, None, None] + bias[:, None, None]
    return x


def _layer_norm_cf_sqm(x: torch.Tensor, weight: torch.Tensor, bias: torch.Tensor, eps: float):
    # same channels-first norm, but variance computed as E[x^2] - E[x]^2 (clamped at 0 for stability)
    u = x.mean(dim=1, keepdim=True)
    s = ((x * x).mean(dim=1, keepdim=True) - (u * u)).clamp(0)
    x = (x - u) * torch.rsqrt(s + eps)
    x = x * weight.view(1, -1, 1, 1) + bias.view(1, -1, 1, 1)
    return x
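

# Note (illustrative): both helpers implement the same channels-first normalization,
# y = (x - E[x]) / sqrt(Var[x] + eps) * w + b over dim 1; they differ only in how Var[x]
# is obtained (torch.var_mean vs the E[x^2] - E[x]^2 identity, clamped at zero).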


class LayerNormExp2d(nn.LayerNorm):
    """ LayerNorm for channels_first tensors with 2d spatial dimensions (ie N, C, H, W).

    Experimental implementation w/ manual norm for non-contiguous tensors.

    This improves throughput in some scenarios (tested on Ampere GPU), esp w/ channels_last
    layout. However, benefits are not always clear and it can perform worse on other GPUs.
    """

    def __init__(self, num_channels, eps=1e-6):
        super().__init__(num_channels, eps=eps)

    def forward(self, x) -> torch.Tensor:
        if _is_contiguous(x):
            # contiguous NCHW input: permute to NHWC, use the built-in op, permute back
            x = F.layer_norm(
                x.permute(0, 2, 3, 1), self.normalized_shape, self.weight, self.bias, self.eps).permute(0, 3, 1, 2)
        else:
            # non-contiguous input (e.g. channels_last layout): use the scripted manual norm
            x = _layer_norm_cf(x, self.weight, self.bias, self.eps)
        return x
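

# Example (illustrative, not part of the module): a channels_last tensor is not contiguous in the
# default memory format, so it takes the manual-norm branch above.
#
#   norm = LayerNormExp2d(64)
#   x = torch.randn(2, 64, 7, 7).to(memory_format=torch.channels_last)
#   y = norm(x)   # handled by _layer_norm_cf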


class RmsNorm(nn.Module):
    """ RmsNorm w/ fast (apex) norm if available
    """
    __constants__ = ['normalized_shape', 'eps', 'elementwise_affine']
    normalized_shape: Tuple[int, ...]
    eps: float
    elementwise_affine: bool

    def __init__(self, channels, eps=1e-6, affine=True, device=None, dtype=None) -> None:
        factory_kwargs = {'device': device, 'dtype': dtype}
        super().__init__()
        normalized_shape = channels
        if isinstance(normalized_shape, numbers.Integral):
            normalized_shape = (normalized_shape,)
        self.normalized_shape = tuple(normalized_shape)
        self.eps = eps
        self.elementwise_affine = affine
        if self.elementwise_affine:
            self.weight = nn.Parameter(torch.empty(self.normalized_shape, **factory_kwargs))
        else:
            self.register_parameter('weight', None)

        self.reset_parameters()

    def reset_parameters(self) -> None:
        if self.elementwise_affine:
            nn.init.ones_(self.weight)

    def forward(self, x: torch.Tensor) -> torch.Tensor:
        # fast_rms_norm provides the fast (apex) path when available and a fallback otherwise
        x = fast_rms_norm(x, self.normalized_shape, self.weight, self.eps)
        return x
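

# Note (illustrative): RMS norm rescales by the root-mean-square over the normalized dims rather
# than centering and dividing by the standard deviation, i.e. roughly
#
#   y = x / sqrt((x * x).mean(dim=-1, keepdim=True) + eps) * weight
#
# exact numerics depend on the fast_rms_norm implementation (apex-backed when available).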