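Add `deterministic_on_eval` option to BinaryMapper: when deterministic, bits are chosen by thresholding probabilities at 0.5 instead of random sampling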

lucidrains · lucidrains · commit eef94eaaff93 · 2025-11-09T06:01:48.000-08:00
diff --git a/pyproject.toml b/pyproject.toml
@@ -1,6 +1,6 @@
 [project]
 name = "vector-quantize-pytorch"
-version = "1.25.0"
+version = "1.25.1"
 description = "Vector Quantization - Pytorch"
 authors = [
     { name = "Phil Wang", email = "lucidrains@gmail.com" }
diff --git a/vector_quantize_pytorch/binary_mapper.py b/vector_quantize_pytorch/binary_mapper.py
@@ -46,7 +46,8 @@ class BinaryMapper(Module):
     def __init__(
         self,
         bits = 1,
-        kl_loss_threshold = NAT # 1 bit
+        kl_loss_threshold = NAT, # 1 bit
+        deterministic_on_eval = False
     ):
         super().__init__()
 
@@ -64,14 +65,21 @@ def __init__(
         self.kl_loss_threshold = kl_loss_threshold
         self.register_buffer('zero', tensor(0.), persistent = False)
 
+        # eval behavior
+
+        self.deterministic_on_eval = deterministic_on_eval
+
     def forward(
         self,
         logits,
         temperature = 1.,
         straight_through = None,
         calc_aux_loss = None,
-        return_indices = False
+        deterministic = None,
+        return_indices = False,
     ):
+        deterministic = default(deterministic, self.deterministic_on_eval and not self.training)
+
         straight_through = default(straight_through, self.training)
         calc_aux_loss = default(calc_aux_loss, self.training)
 
@@ -87,7 +95,10 @@ def forward(
 
         # sampling
 
-        sampled_bits = (torch.rand_like(logits) <= prob_for_sample).long()
+        compare_target = torch.rand_like(logits) if not deterministic else 0.5
+
+        sampled_bits = (compare_target <= prob_for_sample).long()
+
         indices = (self.power_two * sampled_bits).sum(dim = -1)
 
         one_hot = F.one_hot(indices, self.num_codes).float()
@@ -143,3 +154,8 @@ def forward(
     assert sparse_one_hot.shape == (3, 4, 2 ** 8)
     assert indices.shape == (3, 4)
     assert aux_loss.numel() == 1
+
+    binary_mapper.eval()
+    sparse_one_hot1, _ = binary_mapper(logits, deterministic = True)
+    sparse_one_hot2, _ = binary_mapper(logits, deterministic = True)
+    assert torch.allclose(sparse_one_hot1, sparse_one_hot2)