"""Multi Variate Gaussian Distribution."""
# Copyright (C) 2022-2024 Intel Corporation
# SPDX-License-Identifier: Apache-2.0
from typing import Any
import torch
from torch import nn
from anomalib.models.components.base import DynamicBufferMixin
class MultiVariateGaussian(DynamicBufferMixin, nn.Module):
"""Multi Variate Gaussian Distribution."""
def __init__(self) -> None:
super().__init__()
self.register_buffer("mean", torch.empty(0))
self.register_buffer("inv_covariance", torch.empty(0))
self.mean: torch.Tensor
self.inv_covariance: torch.Tensor
@staticmethod
def _cov(
observations: torch.Tensor,
rowvar: bool = False,
bias: bool = False,
ddof: int | None = None,
aweights: torch.Tensor | None = None,
) -> torch.Tensor:
"""Estimates covariance matrix like numpy.cov.
Args:
observations (torch.Tensor): A 1-D or 2-D array containing multiple variables and observations.
Each row of `m` represents a variable, and each column a single
observation of all those variables. Also see `rowvar` below.
rowvar (bool): If `rowvar` is True (default), then each row represents a
variable, with observations in the columns. Otherwise, the relationship
is transposed: each column represents a variable, while the rows
contain observations. Defaults to False.
bias (bool): Default normalization (False) is by ``(N - 1)``, where ``N`` is the
number of observations given (unbiased estimate). If `bias` is True,
then normalization is by ``N``. These values can be overridden by using
the keyword ``ddof`` in numpy versions >= 1.5. Defaults to False
ddof (int | None): If not ``None`` the default value implied by `bias` is overridden.
Note that ``ddof=1`` will return the unbiased estimate, even if both
`fweights` and `aweights` are specified, and ``ddof=0`` will return
the simple average. See the notes for the details. The default value
is ``None``.
aweights (torch.Tensor): 1-D array of observation vector weights. These relative weights are
typically large for observations considered "important" and smaller for
observations considered less "important". If ``ddof=0`` the array of
weights can be used to assign probabilities to observation vectors. (Default value = None)
Returns:
The covariance matrix of the variables.
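
        Example:
            A minimal doctest-style sketch with random values; only the shapes
            are meaningful (10 observations of 3 variables):

            >>> x = torch.randn(10, 3)
            >>> MultiVariateGaussian._cov(x, rowvar=False).shape
            torch.Size([3, 3])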
"""
        # ensure at least 2D
        if observations.dim() == 1:
            observations = observations.view(-1, 1)

        # if rows hold variables, transpose so each row is an observation and
        # each column a variable
        if rowvar and observations.shape[0] != 1:
            observations = observations.t()

        if ddof is None:
            ddof = 0 if bias else 1
weights = aweights
weights_sum: Any
if weights is not None:
if not torch.is_tensor(weights):
weights = torch.tensor(weights, dtype=torch.float) # pylint: disable=not-callable
weights_sum = torch.sum(weights)
avg = torch.sum(observations * (weights / weights_sum)[:, None], 0)
else:
avg = torch.mean(observations, 0)
        # Determine the normalization factor, mirroring numpy.cov: divide by
        # (N - ddof) without weights; with aweights, the effective divisor is
        # sum(w) - ddof * sum(w * w) / sum(w).
        if weights is None:
            fact = observations.shape[0] - ddof
        elif ddof == 0:
            fact = weights_sum
        else:
            fact = weights_sum - ddof * torch.sum(weights * weights) / weights_sum
observations_m = observations.sub(avg.expand_as(observations))
x_transposed = observations_m.t() if weights is None else torch.mm(torch.diag(weights), observations_m).t()
covariance = torch.mm(x_transposed, observations_m)
covariance = covariance / fact
return covariance.squeeze()

    def forward(self, embedding: torch.Tensor) -> list[torch.Tensor]:
        """Calculate the multivariate Gaussian distribution parameters.

        Args:
            embedding (torch.Tensor): CNN features whose dimensionality is reduced via either random sampling or PCA.

        Returns:
            Mean and inverse covariance of the multivariate Gaussian distribution that fits the features.
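
        Example:
            A minimal sketch with a dummy feature map; the shapes follow this
            method, and the values are illustrative only:

            >>> model = MultiVariateGaussian()
            >>> features = torch.randn(8, 4, 2, 2)  # (batch, channel, height, width)
            >>> mean, inv_covariance = model(features)
            >>> mean.shape, inv_covariance.shape
            (torch.Size([4, 4]), torch.Size([4, 4, 4]))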
"""
device = embedding.device
batch, channel, height, width = embedding.size()
embedding_vectors = embedding.view(batch, channel, height * width)
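        # One channel-wise Gaussian is modeled per spatial position: ``mean`` has
        # shape (channel, height * width) and ``covariance`` is accumulated as
        # (channel, channel, height * width).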
self.mean = torch.mean(embedding_vectors, dim=0)
covariance = torch.zeros(size=(channel, channel, height * width), device=device)
identity = torch.eye(channel).to(device)
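        # A small multiple of the identity is added to each covariance so the
        # matrices stay well conditioned for the batched inverse below.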
for i in range(height * width):
covariance[:, :, i] = self._cov(embedding_vectors[:, :, i], rowvar=False) + 0.01 * identity
# calculate inverse covariance as we need only the inverse
self.inv_covariance = torch.linalg.inv(covariance.permute(2, 0, 1))
return [self.mean, self.inv_covariance]

    def fit(self, embedding: torch.Tensor) -> list[torch.Tensor]:
        """Fit a multivariate Gaussian distribution to the input embedding.

        Args:
            embedding (torch.Tensor): Embedding vector extracted from CNN.

        Returns:
            Mean and inverse covariance of the fitted multivariate Gaussian distribution.
        """
return self.forward(embedding)
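

if __name__ == "__main__":
    # A minimal, illustrative sketch (an assumption about downstream use, not
    # part of this module's API): fit the distribution to random features, then
    # score one embedding vector at a single spatial position with the
    # Mahalanobis distance, which is why only the inverse covariance is kept.
    torch.manual_seed(0)
    gaussian = MultiVariateGaussian()
    train_features = torch.randn(16, 8, 4, 4)  # (batch, channel, height, width)
    mean, inv_covariance = gaussian.fit(train_features)

    test_vector = torch.randn(8)  # a channel-wise embedding at spatial position 0
    delta = test_vector - mean[:, 0]
    distance = torch.sqrt(delta @ inv_covariance[0] @ delta)
    print(f"Mahalanobis distance at position 0: {distance.item():.4f}")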