
Commit f00e73e

Add the changes to comply with the project specifications. (#31)
* Added a first implementation of conv2d
* Added the non-optimized implementation of conv2d. We kept the same attribute names to stay compatible with the checkpoints.
* Implemented a simulation of PyTorch's random_split
* Implemented a simulation of the PixelShuffle module. Given that the previous layer returns a tensor with the right dimensions, the pixel shuffle is just a reshaping.
* Changed the bias to a tensor of zeros when bias=False. This just gets rid of the warning that int has no __getitem__ implementation.
* Added an im2col fast convolution and fixed PixelShuffle
* Added small-model training. It only upscales 32x16 ==> 64x32.
* Changed the constructor of SuperResolutionDataset. Added 2 parameters to set the low and high resolution when loading; default values are 128x64 ==> 256x128.
* Added declaration for small dataset training
* Added old validation parameters
* Added to the notebook the comparison between the models
* Changed notebook date generation
* Added notebook plots
* Added generalization to choose resolutions
* Changed return statement
* Edited the report to include both models
* Deleted old files
1 parent 2bd3904


46 files changed: +1085 / -419 lines

.github/workflows/CI.yml

Lines changed: 0 additions & 35 deletions
This file was deleted.

.idea/Super-Resolution.iml

Lines changed: 1 addition & 1 deletion
Generated file; diff not rendered by default.

ModelDemonstration.pdf

572 KB binary file, not shown.

README.md

Lines changed: 1 addition & 1 deletion
@@ -38,7 +38,7 @@ python3 main.py
 # Export the notebook as pdf
 
 ```bash
-jupyter nbconvert --to pdf notebook.ipynb --output "ModelDemonstration" --LatexPreprocessor.title "Super Resolution Demonstration" --LatexPreprocessor.date "August, 2024" --LatexPreprocessor.author_names "Christian Mancini"
+jupyter nbconvert --to pdf notebook.ipynb --output "ModelDemonstration" --LatexPreprocessor.title "Super Resolution Demonstration" --LatexPreprocessor.date "September, 2024" --LatexPreprocessor.author_names "Christian Mancini"
 ```
 
 # Installation of Requirements and Kernel

SRM/modules.py

Lines changed: 90 additions & 4 deletions
@@ -1,13 +1,30 @@
+import torch
 from torch import nn
+import numpy as np
 
 
+def _im2col(input, kernel_size, stride=1, padding=0):
+    input_padded = torch.nn.functional.pad(input, (padding, padding, padding, padding))
+    batch_size, in_channels, height, width = input_padded.size()
+    kernel_height, kernel_width = kernel_size
+    out_height = (height - kernel_height) // stride + 1
+    out_width = (width - kernel_width) // stride + 1
+    col = torch.empty(batch_size, in_channels, kernel_height, kernel_width, out_height, out_width)
+
+    for y in range(kernel_height):
+        for x in range(kernel_width):
+            col[:, :, y, x, :, :] = input_padded[:, :, y: y + out_height * stride: stride,
+                                                 x: x + out_width * stride: stride]
+
+    return col.view(batch_size, in_channels * kernel_height * kernel_width, -1)
+
 class ResidualBlock(nn.Module):
 
     def __init__(self, num_channels):
         super().__init__()
-        self.conv1 = nn.Conv2d(num_channels, num_channels, kernel_size=3, padding=1)
+        self.conv1 = Conv2d(num_channels, num_channels, kernel_size=3, padding=1)
         self.relu = nn.ReLU()
-        self.conv2 = nn.Conv2d(num_channels, num_channels, kernel_size=3, padding=1)
+        self.conv2 = Conv2d(num_channels, num_channels, kernel_size=3, padding=1)
 
     def forward(self, x):
         res = x
@@ -22,11 +39,80 @@ class Upsample(nn.Module):
 
     def __init__(self, num_channel):
         super().__init__()
-        self.conv = nn.Conv2d(num_channel, num_channel * 4, kernel_size=3, padding=1)
-        self.shuffle = nn.PixelShuffle(2)
+        self.conv = Conv2d(num_channel, num_channel * 4, kernel_size=3, padding=1)
+        self.shuffle = PixelShuffle(2)
 
     def forward(self, x):
         out = self.conv(x)
         out = self.shuffle(out)
         return out
 
+
+class Conv2d(nn.Module):
+    def __init__(self, in_channels: int, out_channels: int, kernel_size: int, padding=1, bias=True):
+        super().__init__()
+        self.in_channels = in_channels
+        self.out_channels = out_channels
+        self.kernel_size = kernel_size
+        self.padding = padding
+        self.k = 1 / (in_channels * np.power(kernel_size, 2))
+
+        if bias:
+            self.bias = nn.Parameter(
+                torch.empty(out_channels).uniform_(-np.sqrt(self.k), np.sqrt(self.k)))
+        else:
+            self.bias = torch.zeros(out_channels)
+
+        self.weight = nn.Parameter(
+            torch.empty(
+                out_channels, in_channels, kernel_size, kernel_size).uniform_(-np.sqrt(self.k), np.sqrt(self.k)))
+
+    def _conv_forward(self, input, weight, bias=None, stride=1, padding=0):
+        col = _im2col(input, weight.size()[2:], stride, padding)
+        # (out_channels, in_channels * kernel_height * kernel_width)
+        weight_col = weight.view(weight.size(0), -1)
+        out = torch.matmul(weight_col, col)
+
+        if bias is not None:
+            out += bias.view(1, -1, 1)
+
+        batch_size, out_channels = out.size(0), weight.size(0)
+        out_height = (input.size(2) + 2 * padding - weight.size(2)) // stride + 1
+        out_width = (input.size(3) + 2 * padding - weight.size(3)) // stride + 1
+        return out.view(batch_size, out_channels, out_height, out_width)
+
+    def forward(self, input):
+        return self._conv_forward(input, self.weight, self.bias, padding=self.padding)
+
+    def slow_forward(self, image):
+        image = nn.functional.pad(image, (self.padding,) * 4, "constant", 0)
+        batch_size, in_channels, height, width = image.shape
+        out_channels, in_channels_kernel, m, n = self.weight.shape
+        if self.in_channels != in_channels:
+            raise ValueError(
+                f"Input channels are different: Declared {self.in_channels}, but got Image with {in_channels}")
+        output_height = height - m + 1
+        output_width = width - n + 1
+        new_image = torch.zeros((batch_size, out_channels, output_height, output_width))
+
+        for b in range(batch_size):
+            for c in range(out_channels):
+                for i in range(output_height):
+                    for j in range(output_width):
+                        new_image[b, c, i, j] = torch.sum(image[b, :, i:i + m, j:j + n] * self.weight[c]) + self.bias[c]
+        return new_image
+
+
+class PixelShuffle(nn.Module):
+    def __init__(self, upscale_factor: int):
+        super().__init__()
+        self.upscale_factor = upscale_factor
+
+    def forward(self, x):
+        batch_size, channels, height, width = x.shape
+        channels //= (self.upscale_factor ** 2)
+        x = x.view(batch_size, channels, self.upscale_factor, self.upscale_factor, height, width)
+        x = x.permute(0, 1, 4, 2, 5, 3)
+        return x.contiguous().view(batch_size, channels, height * self.upscale_factor, width * self.upscale_factor)
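Not part of the commit: a minimal sanity-check sketch of the new layers, assuming SRM/modules.py is importable as SRM.modules. It compares output shapes of the custom im2col Conv2d against torch's nn.Conv2d and checks that the reshaping-based PixelShuffle matches nn.PixelShuffle.

```python
# Sanity-check sketch (assumption: SRM.modules is importable from the repository root).
import torch
from torch import nn
from SRM.modules import Conv2d, PixelShuffle

x = torch.randn(2, 8, 16, 32)  # (batch, channels, height, width)

# The im2col-based Conv2d should preserve spatial size with kernel_size=3, padding=1,
# just like torch's nn.Conv2d (values differ because both are randomly initialized).
custom = Conv2d(8, 8, kernel_size=3, padding=1)
reference = nn.Conv2d(8, 8, kernel_size=3, padding=1)
assert custom(x).shape == reference(x).shape == (2, 8, 16, 32)

# The reshaping-based PixelShuffle performs the same rearrangement as nn.PixelShuffle(2).
y = torch.randn(2, 8 * 4, 16, 32)
assert torch.equal(PixelShuffle(2)(y), nn.PixelShuffle(2)(y))
```

With identical weights, forward and slow_forward should also agree numerically up to floating-point tolerance, which is a convenient cross-check for the im2col path.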

SRM/network.py

Lines changed: 2 additions & 2 deletions
@@ -9,12 +9,12 @@ class SuperResolution(nn.Module):
     def __init__(self, num_channels: int, num_res_block: int):
         super().__init__()
         self.layers = nn.ModuleList([
-            nn.Conv2d(3, num_channels, kernel_size=3, padding=1)
+            Conv2d(3, num_channels, kernel_size=3, padding=1)
         ])
         for _ in range(num_res_block):
             self.layers.append(ResidualBlock(num_channels))
         self.layers.append(Upsample(num_channels))
-        self.layers.append(nn.Conv2d(num_channels, 3, kernel_size=3, padding=1))
+        self.layers.append(Conv2d(num_channels, 3, kernel_size=3, padding=1))
 
     def forward(self, x):
         for layer in self.layers:
Two 2.84 MB binary files, not shown.

dataset/data_preparation.py

Lines changed: 23 additions & 1 deletion
@@ -29,6 +29,28 @@ def download(path: str, dataset: str):
         print(f"Dataset {dataset} already exists, skipping download.")
 
 
+def _random_split(dataset: Dataset, lengths: list[int]) -> list[Subset]:
+    """
+    Utility method that simulates pytorch random split
+    Args:
+        dataset: Dataset to be split
+        lengths: List of lengths to split the dataset into
+
+    Returns:
+        List of Subsets
+    """
+    if sum(lengths) != len(dataset):
+        raise ValueError("Sum of input lengths does not equal the length of the input dataset!")
+
+    indices = torch.randperm(len(dataset)).tolist()
+    subsets = []
+    offset = 0
+    for length in lengths:
+        subset = torch.utils.data.Subset(dataset, indices[offset:offset + length])
+        subsets.append(subset)
+        offset += length
+    return subsets
+
 def split_dataset(dataset: Dataset, sizes: dict[str, float]) -> list[Subset]:
     """
     Splits a dataset into training, validation, and test sets based on the provided sizes.
@@ -52,4 +74,4 @@ def split_dataset(dataset: Dataset, sizes: dict[str, float]) -> list[Subset]:
     train_size = int(sizes["train"] * len(dataset))
     validation_size = int(sizes["validation"] * len(dataset))
     test_size = len(dataset) - train_size - validation_size
-    return torch.utils.data.random_split(dataset, [train_size, validation_size, test_size])
+    return _random_split(dataset, [train_size, validation_size, test_size])
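For context, a small usage sketch of the replacement split (not part of the commit; the toy dataset and the 0.8/0.1 fractions are illustrative). split_dataset derives the test size from the remainder, and _random_split shuffles the indices once and slices them into Subsets.

```python
# Illustrative sketch: the toy dataset and split fractions are placeholders.
import torch
from torch.utils.data import TensorDataset
from dataset.data_preparation import split_dataset

toy = TensorDataset(torch.arange(100))                     # stand-in dataset with 100 items
train, val, test = split_dataset(toy, {"train": 0.8, "validation": 0.1})
print(len(train), len(val), len(test))                     # 80 10 10, summing to len(toy)
```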

dataset/super_resolution_dataset.py

Lines changed: 6 additions & 3 deletions
@@ -6,10 +6,13 @@
 
 
 class SuperResolutionDataset(Dataset):
-    def __init__(self, root_dir, transform=transforms.Compose([transforms.ToTensor()])) -> None:
+    def __init__(self, root_dir, low_resolution=(128, 64), high_resolution=(256, 128),
+                 transform=transforms.Compose([transforms.ToTensor()])) -> None:
         self.root_dir = root_dir
         self.transform = transform
         self.file_names = os.listdir(root_dir)
+        self.low_resolution = low_resolution
+        self.high_resolution = high_resolution
 
     def __len__(self) -> int:
         return len(self.file_names)
@@ -25,8 +28,8 @@ def __getitem__(self, idx) -> tuple[torch.Tensor, torch.Tensor]:
         """
         img_path = os.path.join(self.root_dir, self.file_names[idx])
         image = Image.open(img_path)
-        low_res = image.resize((128, 64))
-        high_res = image.resize((256, 128))
+        low_res = image.resize(self.low_resolution)
+        high_res = image.resize(self.high_resolution)
 
         if self.transform:
             low_res = self.transform(low_res)