Skip to content

Commit 74088a7

Browse files
committed
TabR lazy imports
1 parent 30f7cc6 commit 74088a7

2 files changed

Lines changed: 48 additions & 28 deletions

File tree

mambular/base_models/tabr.py

Lines changed: 46 additions & 25 deletions
Original file line numberDiff line numberDiff line change
@@ -9,9 +9,11 @@
99
from torch import Tensor
1010
import math
1111

12-
13-
1412
class TabR(BaseModel):
13+
delu = None
14+
faiss = None
15+
faiss_torch_utils = None
16+
1517
def __init__(
1618
self,
1719
feature_information: tuple,
@@ -22,6 +24,10 @@ def __init__(
2224
super().__init__(config=config, **kwargs)
2325
self.save_hyperparameters(ignore=["feature_information"])
2426

27+
# lazy import
28+
if TabR.delu is None or TabR.faiss is None or TabR.faiss_torch_utils is None:
29+
self._lazy_import_dependencies()
30+
2531
self.returns_ensemble = False
2632
self.uses_candidates = True
2733

@@ -86,12 +92,8 @@ def make_block(prenorm: bool) -> nn.Sequential:
8692

8793
# Retrieval Module: R
8894
self.normalization = Normalization(d_main) if mixer_normalization else None
89-
90-
# lazy import
91-
import delu
92-
import faiss
93-
import faiss.contrib.torch_utils
9495

96+
delu = TabR.delu
9597
self.label_encoder = (
9698
nn.Linear(1, d_main)
9799
if num_classes == 1
@@ -134,6 +136,31 @@ def reset_parameters(self):
134136
assert isinstance(self.label_encoder[0], nn.Embedding)
135137
nn.init.uniform_(self.label_encoder[0].weight, -1.0, 1.0) # type: ignore[code] # noqa: E501
136138

139+
def _lazy_import_dependencies(self):
140+
"""Lazily import external dependencies and store them as class attributes."""
141+
if TabR.delu is None:
142+
try:
143+
import delu
144+
TabR.delu = delu
145+
print("Successfully lazy imported delu dependency.")
146+
147+
except ImportError:
148+
raise ImportError("Failed to import delu module for TabR. Ensure all dependencies are installed\n"
149+
"You can install delu by running 'pip install delu'.") from None
150+
151+
if TabR.faiss is None:
152+
try:
153+
import faiss
154+
import faiss.contrib.torch_utils
155+
156+
TabR.faiss = faiss
157+
TabR.faiss_torch_utils = faiss.contrib.torch_utils
158+
print("Successfully lazy imported faiss dependency")
159+
160+
except ImportError:
161+
raise ImportError("Failed to import faiss module for TabR. Ensure all dependencies are installed\n"
162+
"You can install faiss by running 'pip install faiss-cpu'.") from None
163+
137164
def _encode(
138165
self,
139166
a
@@ -210,7 +237,8 @@ def train_with_candidates(
210237
else torch.cat(
211238
[
212239
self._encode(x)[1] # normalized x
213-
for x in delu.iter_batches(
240+
# for x in delu.iter_batches(
241+
for x in TabR.delu.iter_batches(
214242
candidate_x,
215243
self.candidate_encoding_batch_size
216244
)
@@ -229,12 +257,12 @@ def train_with_candidates(
229257
# initializing the search index
230258
if self.search_index is None:
231259
self.search_index = (
232-
faiss.GpuIndexFlatL2(
233-
faiss.StandardGpuResources(),
260+
TabR.faiss.GpuIndexFlatL2(
261+
TabR.faiss.StandardGpuResources(),
234262
d_main
235263
)
236264
if device.type == 'cuda'
237-
else faiss.IndexFlatL2(d_main)
265+
else TabR.faiss.IndexFlatL2(d_main)
238266
)
239267
# Updating the index is much faster than creating a new one.
240268
self.search_index.reset()
@@ -318,7 +346,7 @@ def validate_with_candidates(
318346
else torch.cat(
319347
[
320348
self._encode(x)[1] # normalized x
321-
for x in delu.iter_batches(
349+
for x in TabR.delu.iter_batches(
322350
candidate_x,
323351
self.candidate_encoding_batch_size
324352
)
@@ -333,19 +361,15 @@ def validate_with_candidates(
333361
device = k.device
334362
context_size = self.context_size
335363

336-
# lazy import
337-
import faiss
338-
import faiss.contrib.torch_utils
339364
if self.search_index is None:
340365
self.search_index = (
341-
faiss.GpuIndexFlatL2(faiss.StandardGpuResources(), d_main)
366+
TabR.faiss.GpuIndexFlatL2(TabR.faiss.StandardGpuResources(), d_main)
342367
if device.type == 'cuda'
343-
else faiss.IndexFlatL2(d_main)
368+
else TabR.faiss.IndexFlatL2(d_main)
344369
)
345370

346371
# Updating the index is much faster than creating a new one.
347372
self.search_index.reset()
348-
# print(candidate_k)
349373
self.search_index.add(candidate_k.to(torch.float32)) # type: ignore[code]
350374
distances: Tensor
351375
context_idx: Tensor
@@ -407,7 +431,7 @@ def predict_with_candidates(
407431
else torch.cat(
408432
[
409433
self._encode(x)[1] # normalized x
410-
for x in delu.iter_batches(
434+
for x in TabR.delu.iter_batches(
411435
candidate_x,
412436
self.candidate_encoding_batch_size
413437
)
@@ -422,19 +446,16 @@ def predict_with_candidates(
422446
device = k.device
423447
context_size = self.context_size
424448

425-
# lazy import
426-
import faiss
427-
import faiss.contrib.torch_utils
428449
if self.search_index is None:
429450
self.search_index = (
430-
faiss.GpuIndexFlatL2(faiss.StandardGpuResources(), d_main)
451+
TabR.faiss.GpuIndexFlatL2(TabR.faiss.StandardGpuResources(), d_main)
431452
if device.type == 'cuda'
432-
else faiss.IndexFlatL2(d_main)
453+
else TabR.faiss.IndexFlatL2(d_main)
433454
)
455+
434456

435457
# Updating the index is much faster than creating a new one.
436458
self.search_index.reset()
437-
# print(candidate_k)
438459
self.search_index.add(candidate_k.to(torch.float32)) # type: ignore[code]
439460
distances: Tensor
440461
context_idx: Tensor

mambular/configs/tabr_config.py

Lines changed: 2 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -32,8 +32,7 @@ class DefaultTabRConfig(BaseConfig):
3232
context_size:int=96
3333

3434
# Embedding Parameters
35-
emebedding_type: str = "plr"
35+
embedding_type: str = "plr"
3636
plr_lite: bool = True
3737
n_frequencies: int = 75
38-
frequencies_init_scale: float = 0.045
39-
38+
frequencies_init_scale: float = 0.045

0 commit comments

Comments
 (0)