import torch class SoftmaxPower(torch.nn.Module): dim: int | None power: float mean_mode: bool def __init__( self, power: float = 2.0, dim: int | None = None, mean_mode: bool = False ) -> None: super().__init__() self.dim = dim self.power = power self.mean_mode = mean_mode def __setstate__(self, state): super().__setstate__(state) if not hasattr(self, "dim"): self.dim = None if not hasattr(self, "power"): self.power = 2.0 if not hasattr(self, "mean_mode"): self.mean_mode = False def forward(self, input: torch.Tensor) -> torch.Tensor: output: torch.Tensor = torch.abs(input).pow(self.power) if self.dim is None: output = output / output.sum() else: output = output / output.sum(dim=self.dim, keepdim=True) if self.mean_mode: return torch.abs(input).mean(dim=1, keepdim=True) * output else: return input * output def extra_repr(self) -> str: return f"dim={self.dim} ; power={self.power}"