From 6d0cf77e9fff49f986401072cbbf9fdcefe4fcfe Mon Sep 17 00:00:00 2001 From: Jeremy Sadler <53983960+jezsadler@users.noreply.github.com> Date: Fri, 17 Nov 2023 00:51:53 +0000 Subject: [PATCH 1/3] Including dilations for 2D layers --- src/omlt/io/onnx_parser.py | 30 ++++++++++-------- src/omlt/neuralnet/layer.py | 61 +++++++++++++++++++++++++++++++++++-- 2 files changed, 76 insertions(+), 15 deletions(-) diff --git a/src/omlt/io/onnx_parser.py b/src/omlt/io/onnx_parser.py index 5a15b8b0..3ddb8005 100644 --- a/src/omlt/io/onnx_parser.py +++ b/src/omlt/io/onnx_parser.py @@ -359,24 +359,29 @@ def _consume_conv_nodes(self, node, next_nodes): f"Input/output size ({input_output_size}) first dimension must match input weights channels ({in_channels})." ) + # TODO: need to check pads and dilations also have correct dimensions. Also should + # add support for autopad. + if "pads" in attr: + pads = attr["pads"] + else: + pads = 2*(len(input_output_size)-1)*[0] + + if "dilations" in attr: + dilations = attr["dilations"] + else: + dilations = (len(input_output_size)-1)*[1] + # Other attributes are not supported - if "dilations" in attr and attr["dilations"] != [1, 1]: - raise ValueError( - f"{node} has non-identity dilations ({attr['dilations']}). This is not supported." - ) if attr["group"] != 1: raise ValueError( f"{node} has multiple groups ({attr['group']}). This is not supported." ) - if "pads" in attr: - pads = attr["pads"] - else: - pads = 2*(len(input_output_size)-1)*[0] # generate new nodes for the node output padding = [ pads[i] + pads[i + len(input_output_size)-1] - for i in range(len(input_output_size)-1)] + for i in range(len(input_output_size)-1) + ] output_size = [out_channels] for w, k, s, p in zip(input_output_size[1:], kernel_shape, strides, padding): new_w = int((w - k + p) / s) + 1 @@ -404,6 +409,7 @@ def _consume_conv_nodes(self, node, next_nodes): strides, weights, pads=pads, + dilations=dilations, activation=activation, input_index_mapper=transformer, ) @@ -471,13 +477,10 @@ def _consume_pool_nodes(self, node, next_nodes): kernel_shape = attr["kernel_shape"][1:] strides = attr["strides"] if "strides" in attr else [1] * len(kernel_shape) pads = attr["pads"] if "pads" in attr else None + dilations = attr["dilations"] if "dilations" in attr else None # check only kernel shape, stride, storage order are set # everything else is not supported - if "dilations" in attr and attr["dilations"] != [1, 1]: - raise ValueError( - f"{node.name} has non-identity dilations ({attr['dilations']}). This is not supported." - ) if ("auto_pad" in attr) and (attr["auto_pad"] != "NOTSET"): raise ValueError( f"{node.name} has autopad set ({attr['auto_pad']}). This is not supported." @@ -520,6 +523,7 @@ def _consume_pool_nodes(self, node, next_nodes): tuple(kernel_shape), kernel_depth, pads=pads, + dilations=dilations, activation=activation, input_index_mapper=transformer, ) diff --git a/src/omlt/neuralnet/layer.py b/src/omlt/neuralnet/layer.py index 956da4bf..f38fc747 100644 --- a/src/omlt/neuralnet/layer.py +++ b/src/omlt/neuralnet/layer.py @@ -227,6 +227,8 @@ class Layer2D(Layer): stride of the kernel. pads : matrix-like Padding for the kernel. 
Given as [left, bottom, right, top] + dilations : matrix-like + Dilations of the kernel activation : str or None activation function name input_index_mapper : IndexMapper or None @@ -240,6 +242,7 @@ def __init__( strides, *, pads=None, + dilations=None, activation=None, input_index_mapper=None, ): @@ -254,6 +257,10 @@ def __init__( self.__pads = [0, 0, 0, 0] else: self.__pads = pads + if dilations is None: + self.__dilations = [1, 1] + else: + self.__dilations = dilations @property def strides(self): @@ -275,6 +282,20 @@ def kernel_depth(self): """Return the depth of the kernel""" raise NotImplementedError() + @property + def dilations(self): + """Return the kernel dilation of the layer""" + return self.__dilations + + @property + def dilated_kernel_shape(self): + """Return the shape of the kernel after dilation""" + dilated_dims = [ + self.dilations[i]*(self.kernel_shape[i]-1) + 1 + for i in range(len(self.kernel_shape)) + ] + return tuple(dilated_dims) + def kernel_index_with_input_indexes(self, out_d, out_r, out_c): """ Returns an iterator over the index within the kernel and input index @@ -290,9 +311,9 @@ def kernel_index_with_input_indexes(self, out_d, out_r, out_c): the output column. """ kernel_d = self.kernel_depth - [kernel_r, kernel_c] = self.kernel_shape + [kernel_r, kernel_c] = self.dilated_kernel_shape [rows_stride, cols_stride] = self.__strides - [pads_row, pads_col] = self.__pads[:1] + [pads_row, pads_col] = self.__pads[:2] start_in_d = 0 start_in_r = out_r * rows_stride - pads_row start_in_c = out_c * cols_stride - pads_col @@ -362,6 +383,8 @@ class PoolingLayer2D(Layer2D): stride of the kernel. pads : matrix-like Padding for the kernel. Given as [left, bottom, right, top] + dilations : matrix-like + Dilations of the kernel pool_func : str name of function used to pool values in a kernel to a single value. transpose : bool @@ -385,6 +408,7 @@ def __init__( kernel_depth, *, pads=None, + dilations=None, activation=None, input_index_mapper=None, ): @@ -393,6 +417,7 @@ def __init__( output_size, strides, pads=pads, + dilations=dilations, activation=activation, input_index_mapper=input_index_mapper, ) @@ -442,6 +467,8 @@ class ConvLayer2D(Layer2D): the cross-correlation kernel. pads : matrix-like Padding for the kernel. 
Given as [left, bottom, right, top] + dilations : matrix-like + Dilations of the kernel activation : str or None activation function name input_index_mapper : IndexMapper or None @@ -456,6 +483,7 @@ def __init__( kernel, *, pads=None, + dilations=None, activation=None, input_index_mapper=None, ): @@ -464,10 +492,34 @@ def __init__( output_size, strides, pads=pads, + dilations=dilations, activation=activation, input_index_mapper=input_index_mapper, ) self.__kernel = kernel + if self.dilations != [1, 1]: + dilate_rows = np.hstack([ + np.hstack([ + np.hstack([ + kernel[:, :, i, :].reshape(( + kernel.shape[0], kernel.shape[1], 1, kernel.shape[3])), + np.zeros(( + kernel.shape[0], kernel.shape[1], self.dilations[0] - 1, kernel.shape[3]))]) + for i in range(kernel.shape[2]-1)]), + kernel[:, :, -1, :].reshape((kernel.shape[0], kernel.shape[1], 1, kernel.shape[3])) + ]) + dilate_kernel = np.dstack([ + np.dstack([ + np.dstack([ + dilate_rows[:, :, :, i].reshape(( + dilate_rows.shape[0], dilate_rows.shape[1], dilate_rows.shape[2], 1)), + np.zeros((dilate_rows.shape[0], dilate_rows.shape[1], dilate_rows.shape[2], self.dilations[1] - 1))]) + for i in range(dilate_rows.shape[3]-1)]), + dilate_rows[:, :, :, -1].reshape((dilate_rows.shape[0], dilate_rows.shape[1], dilate_rows.shape[2], 1)) + ]) + self.__dilated_kernel = dilate_kernel + else: + self.__dilated_kernel = kernel def kernel_with_input_indexes(self, out_d, out_r, out_c): """ @@ -504,6 +556,11 @@ def kernel(self): """Return the cross-correlation kernel""" return self.__kernel + @property + def dilated_kernel(self): + """Return the dilated cross-correlation kernel""" + return self.__dilated_kernel + def __str__(self): return f"ConvLayer(input_size={self.input_size}, output_size={self.output_size}, strides={self.strides}, kernel_shape={self.kernel_shape})" From 668f192e433c4219fb5aa35dda8cf1700e429e28 Mon Sep 17 00:00:00 2001 From: Jeremy Sadler <53983960+jezsadler@users.noreply.github.com> Date: Fri, 17 Nov 2023 01:26:29 +0000 Subject: [PATCH 2/3] Linting for dilations pt 1 --- src/omlt/io/onnx_parser.py | 8 ++-- src/omlt/neuralnet/layer.py | 88 +++++++++++++++++++++++++++---------- 2 files changed, 70 insertions(+), 26 deletions(-) diff --git a/src/omlt/io/onnx_parser.py b/src/omlt/io/onnx_parser.py index 3ddb8005..1d1a3d6e 100644 --- a/src/omlt/io/onnx_parser.py +++ b/src/omlt/io/onnx_parser.py @@ -364,12 +364,12 @@ def _consume_conv_nodes(self, node, next_nodes): if "pads" in attr: pads = attr["pads"] else: - pads = 2*(len(input_output_size)-1)*[0] + pads = 2 * (len(input_output_size) - 1) * [0] if "dilations" in attr: dilations = attr["dilations"] else: - dilations = (len(input_output_size)-1)*[1] + dilations = (len(input_output_size) - 1) * [1] # Other attributes are not supported if attr["group"] != 1: @@ -379,8 +379,8 @@ def _consume_conv_nodes(self, node, next_nodes): # generate new nodes for the node output padding = [ - pads[i] + pads[i + len(input_output_size)-1] - for i in range(len(input_output_size)-1) + pads[i] + pads[i + len(input_output_size) - 1] + for i in range(len(input_output_size) - 1) ] output_size = [out_channels] for w, k, s, p in zip(input_output_size[1:], kernel_shape, strides, padding): diff --git a/src/omlt/neuralnet/layer.py b/src/omlt/neuralnet/layer.py index f38fc747..9cd0a039 100644 --- a/src/omlt/neuralnet/layer.py +++ b/src/omlt/neuralnet/layer.py @@ -291,7 +291,7 @@ def dilations(self): def dilated_kernel_shape(self): """Return the shape of the kernel after dilation""" dilated_dims = [ - 
self.dilations[i]*(self.kernel_shape[i]-1) + 1 + self.dilations[i] * (self.kernel_shape[i] - 1) + 1 for i in range(len(self.kernel_shape)) ] return tuple(dilated_dims) @@ -333,8 +333,7 @@ def kernel_index_with_input_indexes(self, out_d, out_r, out_c): # as this could require using a partial kernel # even though we loop over ALL kernel indexes. if not all( - input_index[i] < self.input_size[i] - and input_index[i] >= 0 + input_index[i] < self.input_size[i] and input_index[i] >= 0 for i in range(len(input_index)) ): continue @@ -498,25 +497,70 @@ def __init__( ) self.__kernel = kernel if self.dilations != [1, 1]: - dilate_rows = np.hstack([ - np.hstack([ - np.hstack([ - kernel[:, :, i, :].reshape(( - kernel.shape[0], kernel.shape[1], 1, kernel.shape[3])), - np.zeros(( - kernel.shape[0], kernel.shape[1], self.dilations[0] - 1, kernel.shape[3]))]) - for i in range(kernel.shape[2]-1)]), - kernel[:, :, -1, :].reshape((kernel.shape[0], kernel.shape[1], 1, kernel.shape[3])) - ]) - dilate_kernel = np.dstack([ - np.dstack([ - np.dstack([ - dilate_rows[:, :, :, i].reshape(( - dilate_rows.shape[0], dilate_rows.shape[1], dilate_rows.shape[2], 1)), - np.zeros((dilate_rows.shape[0], dilate_rows.shape[1], dilate_rows.shape[2], self.dilations[1] - 1))]) - for i in range(dilate_rows.shape[3]-1)]), - dilate_rows[:, :, :, -1].reshape((dilate_rows.shape[0], dilate_rows.shape[1], dilate_rows.shape[2], 1)) - ]) + dilate_rows = np.hstack( + [ + np.hstack( + [ + np.hstack( + [ + kernel[:, :, i, :].reshape( + ( + kernel.shape[0], + kernel.shape[1], + 1, + kernel.shape[3] + ) + ), + np.zeros( + ( + kernel.shape[0], + kernel.shape[1], + self.dilations[0] - 1, + kernel.shape[3] + ) + ) + ] + ) + for i in range(kernel.shape[2] - 1) + ] + ), + kernel[:, :, -1, :].reshape( + (kernel.shape[0], kernel.shape[1], 1, kernel.shape[3]) + ), + ] + ) + dilate_kernel = np.dstack( + [ + np.dstack( + [ + np.dstack( + [ + dilate_rows[:, :, :, i].reshape( + ( + dilate_rows.shape[0], + dilate_rows.shape[1], + dilate_rows.shape[2], + 1 + ) + ), + np.zeros( + ( + dilate_rows.shape[0], + dilate_rows.shape[1], + dilate_rows.shape[2], + self.dilations[1] - 1 + ) + ) + ] + ) + for i in range(dilate_rows.shape[3]-1) + ] + ), + dilate_rows[:, :, :, -1].reshape( + (dilate_rows.shape[0], dilate_rows.shape[1], dilate_rows.shape[2], 1) + ), + ] + ) self.__dilated_kernel = dilate_kernel else: self.__dilated_kernel = kernel From 4a83a22586292aae15b0df554993dd367363c451 Mon Sep 17 00:00:00 2001 From: Jeremy Sadler <53983960+jezsadler@users.noreply.github.com> Date: Fri, 17 Nov 2023 01:26:29 +0000 Subject: [PATCH 3/3] Linting for dilations pt 1 --- src/omlt/neuralnet/layer.py | 21 +++++++++++++-------- 1 file changed, 13 insertions(+), 8 deletions(-) diff --git a/src/omlt/neuralnet/layer.py b/src/omlt/neuralnet/layer.py index 9cd0a039..8deaa1d3 100644 --- a/src/omlt/neuralnet/layer.py +++ b/src/omlt/neuralnet/layer.py @@ -508,7 +508,7 @@ def __init__( kernel.shape[0], kernel.shape[1], 1, - kernel.shape[3] + kernel.shape[3], ) ), np.zeros( @@ -516,9 +516,9 @@ def __init__( kernel.shape[0], kernel.shape[1], self.dilations[0] - 1, - kernel.shape[3] + kernel.shape[3], ) - ) + ), ] ) for i in range(kernel.shape[2] - 1) @@ -540,7 +540,7 @@ def __init__( dilate_rows.shape[0], dilate_rows.shape[1], dilate_rows.shape[2], - 1 + 1, ) ), np.zeros( @@ -548,16 +548,21 @@ def __init__( dilate_rows.shape[0], dilate_rows.shape[1], dilate_rows.shape[2], - self.dilations[1] - 1 + self.dilations[1] - 1, ) - ) + ), ] ) - for i in range(dilate_rows.shape[3]-1) + for i in 
range(dilate_rows.shape[3] - 1) ] ), dilate_rows[:, :, :, -1].reshape( - (dilate_rows.shape[0], dilate_rows.shape[1], dilate_rows.shape[2], 1) + ( + dilate_rows.shape[0], + dilate_rows.shape[1], + dilate_rows.shape[2], + 1, + ) ), ] )
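
Notes (not part of the patch): the series touches three pieces of dilation arithmetic — the dilated kernel shape d*(k-1)+1 used by Layer2D.dilated_kernel_shape, the zero-padded kernel built in ConvLayer2D via np.hstack/np.dstack, and the spatial output size computed in the ONNX parser from pads and strides. The following is a minimal, standalone NumPy sketch of that same arithmetic, kept separate from the patch so it can be run on its own. Function names (dilated_kernel_shape, dilate_kernel_2d, conv_output_size) are illustrative only, not OMLT API; the output-size helper uses the effective (dilated) kernel extent and ONNX-style pads [begin_0, begin_1, end_0, end_1], per the standard ONNX Conv convention.

    import numpy as np


    def dilated_kernel_shape(kernel_shape, dilations):
        """Spatial shape of a kernel after dilation: d * (k - 1) + 1 per dimension."""
        return tuple(d * (k - 1) + 1 for k, d in zip(kernel_shape, dilations))


    def dilate_kernel_2d(kernel, dilations):
        """Insert (d - 1) zero rows/columns between kernel taps.

        `kernel` has shape (out_channels, in_channels, rows, cols), the same
        layout as the cross-correlation kernel stored by ConvLayer2D.
        """
        out_c, in_c, rows, cols = kernel.shape
        d_r, d_c = dilations
        dil_rows, dil_cols = dilated_kernel_shape((rows, cols), dilations)
        dilated = np.zeros((out_c, in_c, dil_rows, dil_cols), dtype=kernel.dtype)
        # Strided assignment places the original taps d_r/d_c apart with zeros
        # in between -- equivalent to the explicit hstack/dstack construction.
        dilated[:, :, ::d_r, ::d_c] = kernel
        return dilated


    def conv_output_size(input_size, kernel_shape, strides, pads, dilations):
        """Spatial output size using the effective (dilated) kernel extent.

        `pads` follows the ONNX layout [begin_0, begin_1, end_0, end_1].
        """
        n = len(kernel_shape)
        out = []
        for i in range(n):
            effective_k = dilations[i] * (kernel_shape[i] - 1) + 1
            total_pad = pads[i] + pads[i + n]
            out.append((input_size[i] + total_pad - effective_k) // strides[i] + 1)
        return tuple(out)


    if __name__ == "__main__":
        kernel = np.arange(9, dtype=float).reshape(1, 1, 3, 3)
        dilated = dilate_kernel_2d(kernel, dilations=[2, 2])
        assert dilated.shape == (1, 1, 5, 5)  # 2 * (3 - 1) + 1 = 5 per spatial axis
        assert conv_output_size((7, 7), (3, 3), [1, 1], [0, 0, 0, 0], [2, 2]) == (3, 3)

The strided-assignment form above is a compact way to cross-check the hstack/dstack construction in ConvLayer2D: for any kernel and dilation pair, the two approaches should produce identical dilated kernels, which makes it a convenient reference in a unit test.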