import numpy as np


class Conv2D:
    def __init__(self, in_channels, out_channels, kernel_size=3, stride=1, padding=1):
        self.in_channels = in_channels
        self.out_channels = out_channels
        self.kernel_size = kernel_size
        self.stride = stride
        self.padding = padding

        # init kernels and biases
        self.kernels = (
            np.random.randn(out_channels, in_channels, kernel_size, kernel_size) * 0.1
        )
        self.biases = np.zeros((out_channels, 1))

    def _pad_input(self, X):
        # zero-pad only the spatial dimensions (height and width)
        if self.padding > 0:
            return np.pad(
                X,
                (
                    (0, 0),
                    (0, 0),
                    (self.padding, self.padding),
                    (self.padding, self.padding),
                ),
                mode="constant",
            )
        return X

    def forward(self, X):
        """
        Perform forward propagation for the convolutional layer.

        Args:
            X: Input tensor of shape (batch_size, in_channels, height, width)

        Returns:
            np.ndarray: Output tensor of shape
                (batch_size, out_channels, out_height, out_width)
        """
        batch_size, in_channels, height, width = X.shape
        assert (
            in_channels == self.in_channels
        ), "Input channels must match kernel channels."

        # calculate output dimensions
        out_height = (height + 2 * self.padding - self.kernel_size) // self.stride + 1
        out_width = (width + 2 * self.padding - self.kernel_size) // self.stride + 1

        # apply padding
        X_padded = self._pad_input(X)

        # allocate output tensor to store convolution results
        output = np.zeros((batch_size, self.out_channels, out_height, out_width))

        # convolve
        for b in range(batch_size):  # iterate over each sample in the batch
            for o in range(self.out_channels):  # each filter produces one feature map
                for i in range(out_height):  # traverse feature-map rows
                    for j in range(out_width):  # traverse feature-map columns
                        # region of the padded input that the kernel covers
                        h_start = i * self.stride
                        h_end = h_start + self.kernel_size
                        w_start = j * self.stride
                        w_end = w_start + self.kernel_size

                        # extract the input region
                        input_region = X_padded[b, :, h_start:h_end, w_start:w_end]

                        # element-wise multiplication, summation, and bias
                        output[b, o, i, j] = (
                            np.sum(input_region * self.kernels[o, :, :, :])
                            + self.biases[o, 0]
                        )

        return output
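

# A minimal usage sketch (not part of the original file): run a random batch
# through the layer and check the output shape against the formula
#     out = (in + 2 * padding - kernel_size) // stride + 1
# The shapes and seed below are illustrative assumptions, not values taken
# from this repository.
if __name__ == "__main__":
    np.random.seed(0)
    conv = Conv2D(in_channels=3, out_channels=8, kernel_size=3, stride=1, padding=1)
    X = np.random.randn(2, 3, 32, 32)  # (batch_size, in_channels, height, width)
    out = conv.forward(X)
    # with kernel_size=3, stride=1, padding=1 the spatial size is preserved
    print(out.shape)  # expected: (2, 8, 32, 32)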