update OT and add tutorial

Signed-off-by: Danny <[email protected]>
NVIDIA · Jan 8, 2025 · dc8e680 · dc8e680
1 parent 87afa0a
commit dc8e680
Show file tree

Hide file tree

Showing 12 changed files with 1,784 additions and 86 deletions.
diff --git a/sub-packages/bionemo-moco/documentation.md b/sub-packages/bionemo-moco/documentation.md
diff --git a/sub-packages/bionemo-moco/examples/ot_sampler_tutorial.ipynb b/sub-packages/bionemo-moco/examples/ot_sampler_tutorial.ipynb
diff --git a/sub-packages/bionemo-moco/src/bionemo/moco/interpolants/__init__.py b/sub-packages/bionemo-moco/src/bionemo/moco/interpolants/__init__.py
@@ -15,11 +15,24 @@
 
 
 from .continuous_time.continuous.continuous_flow_matching import ContinuousFlowMatcher
+from .continuous_time.continuous.optimal_transport.equivariant_ot_sampler import EquivariantOTSampler
+from .continuous_time.continuous.optimal_transport.kabsch_augmentation import KabschAugmentation
+from .continuous_time.continuous.optimal_transport.ot_sampler import OTSampler
 from .continuous_time.continuous.vdm import VDM
 from .continuous_time.discrete.discrete_flow_matching import DiscreteFlowMatcher
 from .continuous_time.discrete.mdlm import MDLM
 from .discrete_time.continuous.ddpm import DDPM
 from .discrete_time.discrete.d3pm import D3PM
 
 
-__all__ = ["DDPM", "D3PM", "VDM", "MDLM", "ContinuousFlowMatcher", "DiscreteFlowMatcher"]
+__all__ = [
+    "DDPM",
+    "D3PM",
+    "VDM",
+    "MDLM",
+    "ContinuousFlowMatcher",
+    "DiscreteFlowMatcher",
+    "EquivariantOTSampler",
+    "OTSampler",
+    "KabschAugmentation",
+]
diff --git a/sub-packages/bionemo-moco/src/bionemo/moco/interpolants/batch_augmentation.py b/sub-packages/bionemo-moco/src/bionemo/moco/interpolants/batch_augmentation.py
@@ -0,0 +1,62 @@
+# SPDX-FileCopyrightText: Copyright (c) 2024 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
+# SPDX-License-Identifier: LicenseRef-Apache2
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+
+from bionemo.moco.interpolants.continuous_time.continuous.optimal_transport.equivariant_ot_sampler import (
+    EquivariantOTSampler,
+)
+from bionemo.moco.interpolants.continuous_time.continuous.optimal_transport.kabsch_augmentation import (
+    KabschAugmentation,
+)
+from bionemo.moco.interpolants.continuous_time.continuous.optimal_transport.ot_sampler import OTSampler
+from bionemo.moco.interpolants.continuous_time.continuous.optimal_transport.ot_types import OptimalTransportType
+
+
+class BatchAugmentation:
+    """Facilitates the creation of batch augmentation objects based on specified optimal transport types.
+
+    Args:
+        device (str): The device to use for computations (e.g., 'cpu', 'cuda').
+        num_threads (int): The number of threads to utilize.
+    """
+
+    def __init__(self, device, num_threads):
+        """Initializes a BatchAugmentation instance.
+
+        Args:
+            device (str): Device for computation.
+            num_threads (int): Number of threads to use.
+        """
+        self.device = device
+        self.num_threads = num_threads
+
+    def create(self, method_type: OptimalTransportType):
+        """Creates a batch augmentation object of the specified type.
+
+        Args:
+            method_type (OptimalTransportType): The type of optimal transport method.
+
+        Returns:
+            The augmentation object if the type is supported, otherwise **None**.
+        """
+        if method_type == OptimalTransportType.EXACT:
+            augmentation = OTSampler(method="exact", device=self.device, num_threads=self.num_threads)
+        elif method_type == OptimalTransportType.KABSCH:
+            augmentation = KabschAugmentation()
+        elif method_type == OptimalTransportType.EQUIVARIANT:
+            augmentation = EquivariantOTSampler(method="exact", device=self.device, num_threads=self.num_threads)
+        else:
+            return None
+        return augmentation
diff --git a/...moco/src/bionemo/moco/interpolants/continuous_time/continuous/continuous_flow_matching.py b/...moco/src/bionemo/moco/interpolants/continuous_time/continuous/continuous_flow_matching.py
@@ -14,7 +14,6 @@
 # limitations under the License.
 
 
-from enum import Enum
 from typing import Optional, Union
 
 import torch
@@ -26,22 +25,8 @@
 from bionemo.moco.distributions.prior.distribution import PriorDistribution
 from bionemo.moco.distributions.time.distribution import TimeDistribution
 from bionemo.moco.interpolants.base_interpolant import Interpolant, PredictionType, pad_like, string_to_enum
-from bionemo.moco.interpolants.continuous_time.continuous.optimal_transport import OTSampler
-
-
-class OptimalTransportType(Enum):
-    """An enumeration representing the type ofOptimal Transport that can be used in Continuous Flow Matching.
-
-    - **EXACT**: Standard mini batch optimal transport defined in  https://arxiv.org/pdf/2302.00482.
-    - **EQUIVARIANT**: Adding roto/translation optimization to mini batch OT see https://arxiv.org/pdf/2306.15030  https://arxiv.org/pdf/2312.07168 4.2.
-    - **KABSCH**: Simple Kabsch alignment between each data and noise point, No permuation # https://arxiv.org/pdf/2410.22388 Sec 3.2
-
-    These prediction types can be used to train neural networks for specific tasks, such as denoising, image synthesis, or time-series forecasting.
-    """
-
-    EXACT = "exact"
-    EQUIVARIANT = "equivariant"
-    KABSCH = "kabsch"
+from bionemo.moco.interpolants.batch_augmentation import BatchAugmentation
+from bionemo.moco.interpolants.continuous_time.continuous.optimal_transport.ot_types import OptimalTransportType
 
 
 class ContinuousFlowMatcher(Interpolant):
@@ -95,6 +80,7 @@ def __init__(
         prediction_type: Union[PredictionType, str] = PredictionType.DATA,
         sigma: Float = 0,
         ot_type: Optional[Union[OptimalTransportType, str]] = None,
+        ot_num_threads: int = 1,
         data_scale: Float = 1.0,
         device: Union[str, torch.device] = "cpu",
         rng_generator: Optional[torch.Generator] = None,
@@ -108,6 +94,7 @@ def __init__(
             prediction_type (PredictionType, optional): The type of prediction, either "flow" or another type. Defaults to PredictionType.DATA.
             sigma (Float, optional): The standard deviation of the Gaussian noise added to the interpolated data. Defaults to 0.
             ot_type (Optional[Union[OptimalTransportType, str]], optional): The type of optimal transport, if applicable. Defaults to None.
+            ot_num_threads:  Number of threads to use for OT solver. If "max", uses the maximum number of threads. Default is 1.
             data_scale (Float, optional): The scale factor for the data. Defaults to 1.0.
             device (Union[str, torch.device], optional): The device on which to run the interpolant, either "cpu" or a CUDA device (e.g. "cuda:0"). Defaults to "cpu".
             rng_generator: An optional :class:`torch.Generator` for reproducible sampling. Defaults to None.
@@ -123,44 +110,37 @@ def __init__(
             raise ValueError("Data Scale must be > 0")
         if ot_type is not None:
             self.ot_type = ot_type = string_to_enum(ot_type, OptimalTransportType)
-            self.ot_sampler = self._build_ot_sampler(sampler_type=ot_type)
+            self.ot_sampler = self._build_ot_sampler(method_type=ot_type, num_threads=ot_num_threads)
         self._loss_function = nn.MSELoss(reduction="none")
 
-    def _build_ot_sampler(self, sampler_type: Union[str, OptimalTransportType], num_threads: int = 1) -> OTSampler:
+    def _build_ot_sampler(self, method_type: OptimalTransportType, num_threads: int = 1):
         """Build the optimal transport sampler for the given optimal transport type.
 
         Args:
-            sampler_type (OptimalTransportType): The OT type to build the sampler for.
+            method_type (OptimalTransportType): The type of augmentation.
             num_threads (int): The number of threads to use for the OT sampler, default to 1.
 
         Returns:
-            The optimal transport sampler object or None if the optimal transport type is not specified.
+            The augmentation object.
         """
-        ot_sampler = None
-        sampler_type = string_to_enum(sampler_type, OptimalTransportType)
-        if sampler_type == OptimalTransportType.EXACT:
-            ot_sampler = OTSampler(method="exact", num_threads=num_threads)
-        elif sampler_type == OptimalTransportType.EQUIVARIANT:
-            raise NotImplementedError("Equivariant OT currently not implemented")
-        elif sampler_type == OptimalTransportType.KABSCH:
-            raise NotImplementedError("Kabsch OT currently not implemented")
-        return ot_sampler
-
-    def apply_ot(self, x0: Tensor, x1: Tensor, mask: Optional[Tensor] = None, replace: Bool = False) -> tuple:
+        return BatchAugmentation(self.device, num_threads).create(method_type)
+
+    def apply_ot(self, x0: Tensor, x1: Tensor, mask: Optional[Tensor] = None, **kwargs) -> tuple:
         """Sample and apply the optimal transport plan between batched (and masked) x0 and x1.
 
         Args:
             x0 (Tensor): shape (bs, *dim), noise from source minibatch.
             x1 (Tensor): shape (bs, *dim), data from source minibatch.
             mask (Optional[Tensor], optional): mask to apply to the output, shape (batchsize, nodes), if not provided no mask is applied. Defaults to None.
-            replace (bool): sampling w/ or w/o replacement from the OT plan, default to False.
+            **kwargs: Additional keyword arguments to be passed to self.ot_sampler.apply_ot or handled within this method.
+
 
         Returns:
             Tuple: tuple of 2 tensors, represents the noise and data samples following OT plan pi.
         """
         if self.ot_sampler is None:
             raise ValueError("Optimal Transport Sampler is not defined")
-        return self.ot_sampler.apply_ot(x0, x1, mask=mask, replace=replace)
+        return self.ot_sampler.apply_ot(x0, x1, mask=mask, **kwargs)
 
     def undo_scale_data(self, data: Tensor) -> Tensor:
         """Downscale the input data by the data scale factor.