[FEAT][ImgPatchEmbed] [chore][disable_warnings_and_logs]

kyegomez · Dec 21, 2023 · 6a550fc · 6a550fc
1 parent bbb360a
commit 6a550fc
Show file tree

Hide file tree

Showing 7 changed files with 195 additions and 17 deletions.
diff --git a/tests/nn/modules/test_img_patch_embed.py b/tests/nn/modules/test_img_patch_embed.py
@@ -0,0 +1,76 @@
+# FILEPATH: /Users/defalt/Desktop/Athena/research/zeta/tests/nn/modules/test_img_patch_embed.py
+
+import pytest
+from torch import nn
+import torch
+from zeta.nn.modules.img_patch_embed import ImgPatchEmbed
+
+
+def test_class_init():
+    """Defaults: 224px image, 16px patches, 14 * 14 = 196 patches."""
+    embed = ImgPatchEmbed()
+    assert isinstance(embed.proj, nn.Conv2d)
+    # geometry attributes stored by __init__
+    assert (embed.img_size, embed.patch_size) == (224, 16)
+    assert embed.num_patches == 196
+
+
+def test_class_init_with_args():
+    """Custom arguments are stored and forwarded to the Conv2d projection."""
+    kwargs = dict(img_size=448, patch_size=32, in_chans=1, embed_dim=512)
+    embed = ImgPatchEmbed(**kwargs)
+    assert isinstance(embed.proj, nn.Conv2d)
+    assert embed.img_size == 448
+    assert embed.patch_size == 32
+    # (448 // 32) ** 2 == 14 * 14
+    assert embed.num_patches == 196
+    assert embed.proj.in_channels == 1
+    assert embed.proj.out_channels == 512
+
+
+def test_forward():
+    """A single default-sized RGB image yields 196 tokens of width 768."""
+    embed = ImgPatchEmbed()
+    images = torch.randn(1, 3, 224, 224)
+    tokens = embed(images)
+    assert tokens.shape == torch.Size([1, 196, 768])
+
+
+def test_forward_with_different_input():
+    """The batch dimension is carried through unchanged (batch of two)."""
+    embed = ImgPatchEmbed()
+    images = torch.randn(2, 3, 224, 224)
+    tokens = embed(images)
+    assert tokens.shape == torch.Size([2, 196, 768])
+
+
+def test_forward_with_different_img_size():
+    """448px input with 16px patches gives 28 * 28 = 784 patches."""
+    model = ImgPatchEmbed(img_size=448)
+    out = model(torch.randn(1, 3, 448, 448))
+    assert model.num_patches == 784
+    assert out.shape == torch.Size([1, 784, 768])
+
+
+def test_forward_with_different_patch_size():
+    """32px patches on a 224px image leave a 7 * 7 = 49 patch grid."""
+    embed = ImgPatchEmbed(patch_size=32)
+    images = torch.randn(1, 3, 224, 224)
+    tokens = embed(images)
+    assert tokens.shape == torch.Size([1, 49, 768])
+
+
+def test_forward_with_different_in_chans():
+    """Single-channel input keeps the default 196 x 768 output layout."""
+    embed = ImgPatchEmbed(in_chans=1)
+    images = torch.randn(1, 1, 224, 224)
+    tokens = embed(images)
+    assert tokens.shape == torch.Size([1, 196, 768])
+
+
+def test_forward_with_different_embed_dim():
+    """embed_dim sets the size of the last output dimension (512 here)."""
+    embed = ImgPatchEmbed(embed_dim=512)
+    images = torch.randn(1, 3, 224, 224)
+    tokens = embed(images)
+    assert tokens.shape == torch.Size([1, 196, 512])
diff --git a/tests/nn/modules/test_simple_mamba.py b/tests/nn/modules/test_simple_mamba.py
@@ -5,6 +5,7 @@
 from torch import nn
 from zeta.nn.modules.simple_mamba import Mamba, ResidualBlock, RMSNorm
 
+
 def test_mamba_class_init():
     model = Mamba(10000, 512, 6)
 
@@ -13,13 +14,15 @@ def test_mamba_class_init():
     assert isinstance(model.norm_f, RMSNorm)
     assert isinstance(model.lm_head, nn.Linear)
 
+
 def test_mamba_forward():
     model = Mamba(10000, 512, 6)
     x = torch.randint(0, 10000, (1, 50))
     out = model(x)
 
     assert out.shape == torch.Size([1, 50, 10000])
 
+
 def test_residual_block_class_init():
     block = ResidualBlock(512)
 
@@ -28,55 +31,63 @@ def test_residual_block_class_init():
     assert isinstance(block.fc1, nn.Linear)
     assert isinstance(block.fc2, nn.Linear)
 
+
 def test_residual_block_forward():
     block = ResidualBlock(512)
     x = torch.randn(1, 50, 512)
     out = block(x)
 
     assert out.shape == torch.Size([1, 50, 512])
 
+
 def test_mamba_different_vocab_size():
     model = Mamba(20000, 512, 6)
     x = torch.randint(0, 20000, (1, 50))
     out = model(x)
 
     assert out.shape == torch.Size([1, 50, 20000])
 
+
 def test_mamba_different_dim():
     model = Mamba(10000, 1024, 6)
     x = torch.randint(0, 10000, (1, 50))
     out = model(x)
 
     assert out.shape == torch.Size([1, 50, 10000])
 
+
 def test_mamba_different_depth():
     model = Mamba(10000, 512, 12)
     x = torch.randint(0, 10000, (1, 50))
     out = model(x)
 
     assert out.shape == torch.Size([1, 50, 10000])
 
+
 def test_residual_block_different_dim():
     block = ResidualBlock(1024)
     x = torch.randn(1, 50, 1024)
     out = block(x)
 
     assert out.shape == torch.Size([1, 50, 1024])
 
+
 def test_mamba_with_dropout():
     model = Mamba(10000, 512, 6, dropout=0.5)
     x = torch.randint(0, 10000, (1, 50))
     out = model(x)
 
     assert out.shape == torch.Size([1, 50, 10000])
 
+
 def test_residual_block_with_dropout():
     block = ResidualBlock(512, dropout=0.5)
     x = torch.randn(1, 50, 512)
     out = block(x)
 
     assert out.shape == torch.Size([1, 50, 512])
 
+
 def test_mamba_with_custom_layer():
     class CustomLayer(nn.Module):
         def forward(self, x):
@@ -86,4 +97,4 @@ def forward(self, x):
     x = torch.randint(0, 10000, (1, 50))
     out = model(x)
 
-    assert out.shape == torch.Size([1, 50, 10000])
+    assert out.shape == torch.Size([1, 50, 10000])
diff --git a/zeta/nn/biases/relative_position_bias.py b/zeta/nn/biases/relative_position_bias.py
@@ -6,6 +6,7 @@
 import torch
 from torch import nn
 
+
 class RelativePositionBias(nn.Module):
     def __init__(
         self,

diff --git a/zeta/nn/modules/__init__.py b/zeta/nn/modules/__init__.py
@@ -46,6 +46,7 @@
 from zeta.nn.modules.visual_expert import VisualExpert
 from zeta.nn.modules.yolo import yolo
 from zeta.nn.modules.swiglu import SwiGLU, SwiGLUStacked
+from zeta.nn.modules.img_patch_embed import ImgPatchEmbed
 
 # from zeta.nn.modules.img_reshape import image_reshape
 # from zeta.nn.modules.flatten_features import flatten_features
@@ -111,4 +112,5 @@
     "AdaptiveLayerNorm",
     "SwiGLU",
     "SwiGLUStacked",
+    "ImgPatchEmbed",
 ]
diff --git a/zeta/nn/modules/img_patch_embed.py b/zeta/nn/modules/img_patch_embed.py
@@ -0,0 +1,45 @@
+from torch import nn
+
+
+class ImgPatchEmbed(nn.Module):
+    """Split an image into patches and project each patch to an embedding.
+
+    Kernel size and stride of the Conv2d projection both equal patch_size.
+
+    Args:
+        img_size (int, optional): image size. Defaults to 224.
+        patch_size (int, optional): patch size. Defaults to 16.
+        in_chans (int, optional): input channels. Defaults to 3.
+        embed_dim (int, optional): embedding dimension. Defaults to 768.
+
+    Examples:
+        >>> import torch
+        >>> x = torch.randn(1, 3, 224, 224)
+        >>> model = ImgPatchEmbed()
+        >>> model(x).shape
+        torch.Size([1, 196, 768])
+    """
+
+    def __init__(self, img_size=224, patch_size=16, in_chans=3, embed_dim=768):
+        super().__init__()
+        self.img_size = img_size
+        self.patch_size = patch_size
+        # the grid has (img_size // patch_size) patches per side
+        self.num_patches = (img_size // patch_size) ** 2
+        # stride == kernel size, so the patches do not overlap
+        self.proj = nn.Conv2d(
+            in_chans, embed_dim, kernel_size=patch_size, stride=patch_size
+        )
+
+    def forward(self, x):
+        """Embed a batch of images as a sequence of patch tokens.
+
+        Args:
+            x (torch.Tensor): images of shape (B, in_chans, H, W).
+
+        Returns:
+            torch.Tensor: shape (B, patches, embed_dim), one row per patch.
+        """
+        if x.dim() != 4:
+            raise ValueError(f"expected 4-D input, got {x.dim()}-D")
+        return self.proj(x).flatten(2).transpose(1, 2)
diff --git a/zeta/nn/modules/simple_mamba.py b/zeta/nn/modules/simple_mamba.py
@@ -6,7 +6,6 @@
 from typing import Optional, Union
 
 
-
 # [HELPERS] ----------------------------------------------------------------------------------------
 class RMSNorm(nn.Module):
     def __init__(self, dim: int, eps: float = 1e-5):
@@ -57,8 +56,6 @@ def forward(self, x):
         return output
 
 
-
-
 class Mamba(nn.Module):
     def __init__(
         self, vocab_size: int = None, dim: int = None, depth: int = None
@@ -98,7 +95,6 @@ class MambaLMHeadModel, https://github.com/state-spaces/mamba/blob/main/mamba_ss
         return logits
 
 
-
 class MambaBlock(nn.Module):
     def __init__(
         self,
@@ -107,7 +103,7 @@ def __init__(
         depth: int,
         d_state: int = 16,
         expand: int = 2,
-        dt_rank: Union[int, str] = 'auto',
+        dt_rank: Union[int, str] = "auto",
         d_conv: int = 4,
         conv_bias: bool = True,
         bias: bool = False,
@@ -136,7 +132,6 @@ def __init__(
         self.A_log = nn.Parameter(torch.log(A))
         self.D = nn.Parameter(torch.ones(dim_inner))
         self.out_proj = nn.Linear(dim_inner, dim, bias=bias)
-
 
     def forward(self, x):
         """Mamba block forward. This looks the same as Figure 3 in Section 3.4 in the Mamba paper [1].
@@ -260,4 +255,3 @@ def selective_scan(self, u, delta, A, B, C, D):
             y = y + u * rearrange(D, "d_in -> d_in 1")
 
         return y
-
diff --git a/zeta/utils/disable_logging.py b/zeta/utils/disable_logging.py
@@ -1,13 +1,55 @@
+# import logging
+# import os
+# import warnings
+
+
+# def disable_warnings_and_logs():
+#     """
+#     Disables various warnings and logs.
+#     """
+#     # disable warnings
+#     warnings.filterwarnings("ignore")
+
+#     # disable tensorflow warnings
+#     os.environ["TF_CPP_MIN_LOG_LEVEL"] = "2"
+
+#     # disable bnb warnings and others
+#     logging.getLogger().setLevel(logging.WARNING)
+
+#     class CustomFilter(logging.Filter):
+#         def filter(self, record):
+#             unwanted_logs = [
+#                 "Setting ds_accelerator to mps (auto detect)",
+#                 (
+#                     "NOTE: Redirects are currently not supported in Windows or"
+#                     " MacOs."
+#                 ),
+#             ]
+#             return not any(log in record.getMessage() for log in unwanted_logs)
+
+#     # add custom filter to root logger
+#     logger = logging.getLogger()
+#     f = CustomFilter()
+#     logger.addFilter(f)
+
+#     # disable specific loggers
+#     loggers = [
+#         "real_accelerator",
+#         "torch.distributed.elastic.multiprocessing.redirects",
+#     ]
+
+#     for logger_name in loggers:
+#         logger = logging.getLogger(logger_name)
+#         logger.setLevel(logging.CRITICAL)
+
+
 import logging
 import os
 import warnings
 
-
 def disable_warnings_and_logs():
-    """Disable warnings and logs.
-
-    Returns:
-        _type_: _description_
+    """
+    Disables various warnings and logs.
     """
     # disable warnings
     warnings.filterwarnings("ignore")
@@ -20,12 +62,19 @@ def disable_warnings_and_logs():
 
     class CustomFilter(logging.Filter):
         def filter(self, record):
-            msg = "Created a temporary directory at"
-            return msg not in record.getMessage()
+            unwanted_logs = [
+                "Setting ds_accelerator to mps (auto detect)",
+                (
+                    "NOTE: Redirects are currently not supported in Windows or"
+                    " MacOs."
+                ),
+            ]
+            return not any(log in record.getMessage() for log in unwanted_logs)
 
+    # add custom filter to root logger
     logger = logging.getLogger()
     f = CustomFilter()
     logger.addFilter(f)
 
-
-disable_warnings_and_logs()
+    # suppress every logging call at CRITICAL severity and below, process-wide
+    logging.disable(logging.CRITICAL)