rwth-i6 · christophmluscher · Dec 17, 2024 · Dec 19, 2024 · Dec 19, 2024 · Dec 19, 2024
diff --git a/i6_models/samplers/__init__.py b/i6_models/samplers/__init__.py
diff --git a/i6_models/samplers/log_uniform.py b/i6_models/samplers/log_uniform.py
@@ -0,0 +1,34 @@
+# Public API of this module.
+__all__ = ["LogUniformSampler"]
+
+
+import torch
+from torch import nn
+from typing import Optional
+
+
+class LogUniformSampler(nn.Module):
+    """
+    Categorical sampler over class indices following a log-uniform (approximately Zipfian) distribution.
+
+    The probability of the 0-based class index ``k`` is
+    ``(log(k + 2) - log(k + 1)) / log(num_classes + 1)``, so small indices are drawn most often.
+    The class indices are therefore expected to be sorted by descending frequency.
+
+    The distribution tensor and the sampler are stored as plain attributes (neither parameters nor
+    buffers): they are created on ``device`` at construction time and ``nn.Module.to()`` does not
+    relocate them.
+    """
+
+    def __init__(self, num_classes: int, *, device: Optional[torch.device] = None):
+        """
+        Samples from a log uniform distribution from classes.
+
+        :param num_classes: number of classes from which the distribution is sampled, must be at least 1.
+        :param device: device on which the distribution is sampled.
+        :raises ValueError: if ``num_classes`` is smaller than 1.
+        """
+        super().__init__()
+
+        if num_classes < 1:
+            raise ValueError(f"num_classes must be at least 1, got {num_classes}")
+
+        # assumes count-sorted vocabulary, descending
+        self.num_classes = num_classes
+
+        # approximately zipf distribution: P(k) = (log(k + 2) - log(k + 1)) / log(num_classes + 1).
+        # The difference of logs is evaluated as log1p(1 / (k + 1)): subtracting two nearly equal
+        # logarithms directly loses most significant digits in float32 for large k.
+        ranks = torch.arange(1, self.num_classes + 1, dtype=torch.get_default_dtype(), device=device)
+        # same dtype/device as the distribution so that no implicit promotion or transfer is needed
+        normalizer = torch.log1p(torch.tensor(self.num_classes, dtype=ranks.dtype, device=device))
+        self._distribution = torch.log1p(1.0 / ranks) / normalizer
+        # lower bound so that no class ends up with zero probability, then renormalize
+        self._distribution.clamp_(min=1e-10)
+        self._distribution /= self._distribution.sum()
+
+        self._cat_sampler = torch.distributions.categorical.Categorical(probs=self._distribution)
+
+    def sample(self, num_samples: int) -> torch.Tensor:
+        """
+        Draws class indices independently (i.e. with replacement) from the distribution.
+
+        :param num_samples: number of indices to draw.
+        :return: tensor of shape ``[num_samples]`` holding the sampled class indices.
+        """
+        return self._cat_sampler.sample(torch.Size([num_samples]))
+
+    def log_prob(self, indices: torch.Tensor) -> torch.Tensor:
+        """
+        :param indices: class indices to score.
+        :return: log probability of each given index under the distribution.
+        """
+        return self._cat_sampler.log_prob(indices)