ConvolutionLanguageBlock with tests
Kye committed Nov 29, 2023
1 parent 6f029ba commit b62e95c
Showing 5 changed files with 212 additions and 9 deletions.
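
For orientation, here is a minimal usage sketch of the block this commit introduces. The shapes mirror test_forward_pass in the new test file; the snippet is illustrative and not part of the diff itself.

import torch

from zeta.nn.modules.lang_conv_module import ConvolutionLanguageBlock

# One conv layer, 256 -> 512 channels; kernel_size=3 with padding=1 keeps the
# sequence length unchanged.
block = ConvolutionLanguageBlock(256, 512, 3, 1)
x = torch.randn(1, 256, 1024)  # (batch, channels, seq_len)
out = block(x)
print(out.shape)  # torch.Size([1, 512, 1024])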
98 changes: 98 additions & 0 deletions tests/nn/modules/test_conv_lang.py
@@ -0,0 +1,98 @@
from unittest.mock import Mock

import pytest
import torch
from torch import nn

from zeta.nn.modules.lang_conv_module import ConvolutionLanguageBlock


# 1. Basic Tests
def test_convolution_language_block_creation():
block = ConvolutionLanguageBlock(256, 512, 3, 1)
assert isinstance(block, ConvolutionLanguageBlock)


def test_forward_pass():
block = ConvolutionLanguageBlock(256, 512, 3, 1)
x = torch.randn(1, 256, 1024)
output = block(x)
assert output.shape == torch.Size([1, 512, 1024])


# 2. Utilize Fixtures
@pytest.fixture
def sample_block():
return ConvolutionLanguageBlock(128, 256, 3, 1)


def test_fixture_usage(sample_block):
x = torch.randn(1, 128, 1024)
output = sample_block(x)
assert output.shape == torch.Size([1, 256, 1024])


# 3. Parameterized Testing
@pytest.mark.parametrize(
(
"in_channels, out_channels, kernel_size, padding, depth, stride,"
" activation, batchnorm, dilation, dropout"
),
[
(128, 256, 3, 1, 2, 1, "relu", True, 1, 0.1),
(256, 512, 3, 1, 3, 1, "gelu", False, 2, 0.2),
# Add more parameter combinations as needed
],
)
def test_parameterized_block(
in_channels,
out_channels,
kernel_size,
padding,
depth,
stride,
activation,
batchnorm,
dilation,
dropout,
):
block = ConvolutionLanguageBlock(
in_channels,
out_channels,
kernel_size,
padding,
depth,
stride,
activation,
batchnorm,
dilation,
dropout,
)
    x = torch.randn(1, in_channels, 1024)
    output = block(x)
    # Each Conv1d layer maps L -> (L + 2*padding - dilation*(kernel_size - 1) - 1) // stride + 1,
    # so compute the expected sequence length layer by layer.
    seq_len = 1024
    for _ in range(depth):
        seq_len = (seq_len + 2 * padding - dilation * (kernel_size - 1) - 1) // stride + 1
    assert output.shape == torch.Size([1, out_channels, seq_len])


# 4. Mocking and Patching
def test_with_mocked_convolution_layer():
    block = ConvolutionLanguageBlock(128, 256, 3, 1)
    # Wrap the real convolution's forward pass so the data path stays intact
    # while still recording that the layer was invoked.
    mock_forward = Mock(wraps=block.conv_layers[0].forward)
    block.conv_layers[0].forward = mock_forward
    x = torch.randn(1, 128, 1024)
    output = block(x)
    assert mock_forward.called
    assert output.shape == torch.Size([1, 256, 1024])


# 5. Exception Testing
def test_invalid_activation_raises_error():
with pytest.raises(ValueError):
ConvolutionLanguageBlock(
128, 256, 3, 1, activation="invalid_activation"
)


# 6. Test Coverage (requires pytest-cov)
# Collect coverage from the command line rather than inside a test, e.g.:
#   pytest --cov=zeta.nn.modules.lang_conv_module tests/nn/modules/test_conv_lang.py


# Add more tests as needed...
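
A natural follow-up, sketched below, is a gradient-flow check; it is not part of this commit, and the test name is illustrative.

def test_gradients_flow_through_block():
    # Hypothetical extra test: confirm a backward pass reaches both the input
    # and the convolution parameters.
    block = ConvolutionLanguageBlock(128, 128, 3, 1)
    x = torch.randn(2, 128, 64, requires_grad=True)
    block(x).sum().backward()
    assert x.grad is not None
    assert all(p.grad is not None for p in block.parameters())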
3 changes: 2 additions & 1 deletion zeta/nn/modules/__init__.py
@@ -55,7 +55,7 @@
from zeta.nn.modules.polymorphic_activation import PolymorphicActivation
from zeta.nn.modules.prenorm import PreNorm
from zeta.nn.modules.itca import IterativeCrossSelfAttention

from zeta.nn.modules.lang_conv_module import ConvolutionLanguageBlock
__all__ = [
"CNNNew",
"CombinedLinear",
@@ -100,4 +100,5 @@
"PolymorphicActivation",
"PreNorm",
"IterativeCrossSelfAttention",
"ConvolutionLanguageBlock"
]
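
With the export added above, the block is also reachable from the package namespace; a quick sketch, assuming the zeta package is installed:

from zeta.nn.modules import ConvolutionLanguageBlock

# Equivalent to importing from zeta.nn.modules.lang_conv_module directly.
block = ConvolutionLanguageBlock(128, 128, 3, 1)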
13 changes: 7 additions & 6 deletions zeta/nn/modules/itca.py
@@ -69,21 +69,22 @@ def forward(self, x, context=None):
return out


class IterativeCrossSelfAttention(nn.Module):
    """Iterative
Args:
dim (_type_): _description_
depth (_type_): _description_
heads (_type_): _description_
dim_head (_type_): _description_
        dropout (float, optional): _description_. Defaults to 0.1.
Methods:
forward(x, context=None): _description_
Examples:
"""
"""

def __init__(
self,
dim,
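
The docstring above only lists placeholder descriptions, so the sketch below is an assumption-heavy illustration: the constructor arguments follow the documented Args section and the input is assumed to use a (batch, seq_len, dim) layout, which may not match the actual signature or defaults.

import torch

from zeta.nn.modules.itca import IterativeCrossSelfAttention

# Argument names taken from the docstring's Args; values are illustrative.
attn = IterativeCrossSelfAttention(dim=512, depth=2, heads=8, dim_head=64)
x = torch.randn(1, 128, 512)        # assumed (batch, seq_len, dim) layout
context = torch.randn(1, 64, 512)   # optional context for cross-attention
out = attn(x, context=context)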
104 changes: 104 additions & 0 deletions zeta/nn/modules/lang_conv_module.py
@@ -0,0 +1,104 @@
import torch
from torch import nn


class ConvolutionLanguageBlock(nn.Module):
"""
Convolutional block for language modeling.
--------------------------------------------
A convolutional block that consists of multiple 1D convolutional layers,
optional batch normalization, dropout, and a flexible choice of activation functions.
This block is designed to maintain the input's dimensionality through the network,
making it suitable for tasks that require consistent input and output dimensions.
Parameters:
- in_channels (int): Number of channels in the input tensor.
- out_channels (int): Number of channels produced by the convolution.
- kernel_size (int): Size of the convolving kernel.
- num_layers (int, optional): Number of convolutional layers. Default: 1
- stride (int, optional): Stride of the convolution. Default: 1
- padding (int, optional): Zero-padding added to both sides of the input. Default: 1
- dilation (int, optional): Spacing between kernel elements. Default: 1
- activation (str, optional): Type of activation function. Options: 'relu', 'gelu'. Default: 'relu'
- use_batchnorm (bool, optional): If True, includes batch normalization. Default: False
- dropout (float, optional): Dropout rate. Default: 0.0
Examples:
>>> import torch
>>> from attnconv.main import ConvolutionLanguageBlock
>>> x = torch.randn(1, 512, 1024)
>>> block = ConvolutionLanguageBlock(512, 512, 3, 1, 1, 1)
>>> out = block(x)
>>> out.shape
torch.Size([1, 512, 1024])
"""

def __init__(
self,
in_channels,
out_channels,
kernel_size,
padding,
depth=1,
stride=1,
activation="gelu",
batchnorm=False,
dilation=1,
dropout=0.1,
):
super(ConvolutionLanguageBlock, self).__init__()
self.in_channels = in_channels
self.out_channels = out_channels
self.kernel_size = kernel_size
self.padding = padding
self.depth = depth
self.stride = stride
self.activation = activation
self.batchnorm = batchnorm
self.dilation = dilation

layers = []
for _ in range(depth):
layers.append(
nn.Conv1d(
in_channels,
out_channels,
kernel_size,
stride=stride,
padding=padding,
dilation=dilation,
)
)
if batchnorm:
layers.append(nn.BatchNorm1d(out_channels))
            if activation == "relu":
                layers.append(nn.ReLU())
            elif activation == "gelu":
                layers.append(nn.GELU())
            else:
                # Fail fast on unsupported activations instead of silently
                # skipping the activation layer.
                raise ValueError(
                    f"Unsupported activation: {activation!r}; expected 'relu' or 'gelu'"
                )
if dropout > 0:
layers.append(nn.Dropout(dropout))
in_channels = out_channels # For stacking layers

self.conv_layers = nn.Sequential(*layers)

def forward(self, x):
"""Forward pass with residual connection.
Args:
x (_type_): _description_
Returns:
_type_: _description_
"""
# Apply residual connection if dimensions match
residual = x if x.size(1) == self.conv_layers[0].in_channels else None

# Apply convolutional layers
x = self.conv_layers(x)

# Apply residual connection
if residual is not None:
x = x + residual

# Return output
return x
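
A short sketch of how the residual path above behaves: the skip connection is added only when the output shape matches the input shape, so a block that changes the channel count simply returns the convolutional output. Shapes are illustrative.

import torch

from zeta.nn.modules.lang_conv_module import ConvolutionLanguageBlock

same = ConvolutionLanguageBlock(64, 64, 3, 1)    # residual applies
proj = ConvolutionLanguageBlock(64, 128, 3, 1)   # channels change, no residual

x = torch.randn(1, 64, 256)
print(same(x).shape)  # torch.Size([1, 64, 256])
print(proj(x).shape)  # torch.Size([1, 128, 256])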
3 changes: 1 addition & 2 deletions zeta/nn/modules/prenorm.py
@@ -1,4 +1,3 @@

from torch import nn


@@ -23,4 +22,4 @@ def forward(self, x, context=None):
Args:
x (_type_): _description_
"""
        return self.fn(self.norm(x), context=context)
