diff --git a/include/ttmlir/Dialect/TTIR/IR/CMakeLists.txt b/include/ttmlir/Dialect/TTIR/IR/CMakeLists.txt
index 7af485250..e04bf3f3e 100644
--- a/include/ttmlir/Dialect/TTIR/IR/CMakeLists.txt
+++ b/include/ttmlir/Dialect/TTIR/IR/CMakeLists.txt
@@ -2,6 +2,12 @@ add_mlir_dialect(TTIROps ttir)
 add_mlir_doc(TTIRBase TTIRDialect src/autogen/md/Dialect/ -gen-dialect-doc)
 add_mlir_doc(TTIROps TTIROp src/autogen/md/Dialect/ -gen-op-doc)
 
+set(LLVM_TARGET_DEFINITIONS TTIROpsAttrs.td)
+mlir_tablegen(TTIROpsAttrs.h.inc -gen-attrdef-decls)
+mlir_tablegen(TTIROpsAttrs.cpp.inc -gen-attrdef-defs)
+add_public_tablegen_target(TTIROpsAttrsIncGen)
+add_dependencies(mlir-headers TTIROpsAttrsIncGen)
+
 set(LLVM_TARGET_DEFINITIONS TTIROpsInterfaces.td)
 mlir_tablegen(TTIROpsInterfaces.h.inc -gen-op-interface-decls)
 mlir_tablegen(TTIROpsInterfaces.cpp.inc -gen-op-interface-defs)
diff --git a/include/ttmlir/Dialect/TTIR/IR/TTIRBase.td b/include/ttmlir/Dialect/TTIR/IR/TTIRBase.td
index f8a319897..57f3dc37d 100644
--- a/include/ttmlir/Dialect/TTIR/IR/TTIRBase.td
+++ b/include/ttmlir/Dialect/TTIR/IR/TTIRBase.td
@@ -21,7 +21,7 @@ def TTIR_Dialect : Dialect {
     or dialects that are actually supported by a consuming backend.
   }];
   let cppNamespace = "::mlir::tt::ttir";
-
+  let useDefaultAttributePrinterParser = 1;
   let dependentDialects = [
     "::mlir::arith::ArithDialect",
     "::mlir::func::FuncDialect",
diff --git a/include/ttmlir/Dialect/TTIR/IR/TTIROps.h b/include/ttmlir/Dialect/TTIR/IR/TTIROps.h
index 26bcf1a19..cd102dbb9 100644
--- a/include/ttmlir/Dialect/TTIR/IR/TTIROps.h
+++ b/include/ttmlir/Dialect/TTIR/IR/TTIROps.h
@@ -16,6 +16,9 @@
 
 #include "TTIROpsInterfaces.h"
 
+#define GET_ATTRDEF_CLASSES
+#include "ttmlir/Dialect/TTIR/IR/TTIROpsAttrs.h.inc"
+
 #define GET_OP_CLASSES
 #include "ttmlir/Dialect/TTIR/IR/TTIROps.h.inc"
 
diff --git a/include/ttmlir/Dialect/TTIR/IR/TTIROps.td b/include/ttmlir/Dialect/TTIR/IR/TTIROps.td
index 6bb03a697..674042348 100644
--- a/include/ttmlir/Dialect/TTIR/IR/TTIROps.td
+++ b/include/ttmlir/Dialect/TTIR/IR/TTIROps.td
@@ -7,6 +7,7 @@
 
 include "ttmlir/Dialect/TT/IR/TTOpsTypes.td"
 include "ttmlir/Dialect/TTIR/IR/TTIRBase.td"
+include "ttmlir/Dialect/TTIR/IR/TTIROpsAttrs.td"
 include "ttmlir/Dialect/TTIR/IR/TTIROpsInterfaces.td"
 include "mlir/Dialect/Linalg/IR/LinalgBase.td"
 include "mlir/Interfaces/InferTypeOpInterface.td"
@@ -598,6 +599,45 @@ def TTIR_Conv2dOp : TTIR_DPSOp<"conv2d"> {
   let hasVerifier = 1;
 }
 
+def TTIR_ConvolutionOp : TTIR_DPSOp<"convolution"> {
+  let summary = "Generalized convolution op.";
+  let description = [{
+    Applies a convolution of the rhs with the lhs.
+
+    This operation captures convolutions of all dimensionality as well
+    as deconvolution/conv transpose.
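+
+    An illustrative example (shapes, layout, and the #any_device_tile
+    constraint alias mirror the tests added in this change; the optional
+    window attributes are elided and take their defaults):
+
+    ```mlir
+    %1 = "ttir.convolution"(%arg0, %arg1, %0) <{
+        batch_group_count = 1 : i64,
+        convolution_layout = #ttir<convolution_layout input_batch = 0, input_feature = 1, input_spatial_dimensions = 2x3, kernel_output_feature = 0, kernel_input_feature = 1, kernel_spatial_dimensions = 2x3, output_batch = 0, output_feature = 1, output_spatial_dimensions = 2x3>,
+        feature_group_count = 1 : i64,
+        operand_constraints = [#any_device_tile, #any_device_tile, #any_device_tile]
+      }> : (tensor<1x3x100x100xbf16>, tensor<7x3x3x3xbf16>, tensor<1x7x100x100xbf16>) -> tensor<1x7x100x100xbf16>
+    ```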
+  }];
+
+  let arguments = (ins
+    AnyRankedTensor:$input,
+    AnyRankedTensor:$weight,
+    Optional<AnyRankedTensor>:$bias,
+    AnyRankedTensor:$output,
+    // Default value: one for each spatial dimension.
+    DefaultValuedOptionalAttr<DenseI64ArrayAttr, "SmallVector<int64_t>(getConvolutionLayout().getInputSpatialDimensions().size(), 1)">:$window_strides,
+    // Default value: two zeros for each spatial dimension.
+    DefaultValuedOptionalAttr<DenseIntElementsAttr, "SmallVector<int64_t>(getConvolutionLayout().getInputSpatialDimensions().size()*2, 0)">:$padding,
+    // Default value: one for each spatial dimension.
+    DefaultValuedOptionalAttr<DenseI64ArrayAttr, "SmallVector<int64_t>(getConvolutionLayout().getInputSpatialDimensions().size(), 1)">:$input_dilation,
+    // Default value: one for each spatial dimension.
+    DefaultValuedOptionalAttr<DenseI64ArrayAttr, "SmallVector<int64_t>(getConvolutionLayout().getInputSpatialDimensions().size(), 1)">:$weight_dilation,
+    // Default value: false for each spatial dimension.
+    DefaultValuedOptionalAttr<DenseBoolArrayAttr, "SmallVector<bool>(getConvolutionLayout().getInputSpatialDimensions().size(), false)">:$window_reversal,
+    TTIR_ConvolutionLayoutAttr:$convolution_layout,
+    ConfinedAttr<I64Attr, [IntPositive]>:$feature_group_count,
+    ConfinedAttr<I64Attr, [IntPositive]>:$batch_group_count,
+    TT_OperandConstraintArrayAttr:$operand_constraints
+  );
+
+  let results = (outs AnyRankedTensor);
+  let hasVerifier = 1;
+
+  let extraClassDeclaration = [{
+    MutableOperandRange getDpsInitsMutable() { return getOutputMutable(); }
+  }];
+}
+
 def TTIR_MaxPool2dOp : TTIR_DPSOp<"max_pool2d"> {
   let summary = "Applies a 2D max pooling over an input signal composed of several input planes.";
   let description = [{
diff --git a/include/ttmlir/Dialect/TTIR/IR/TTIROpsAttrs.td b/include/ttmlir/Dialect/TTIR/IR/TTIROpsAttrs.td
new file mode 100644
index 000000000..60943af26
--- /dev/null
+++ b/include/ttmlir/Dialect/TTIR/IR/TTIROpsAttrs.td
@@ -0,0 +1,44 @@
+// SPDX-FileCopyrightText: (c) 2024 Tenstorrent AI ULC
+//
+// SPDX-License-Identifier: Apache-2.0
+
+#ifndef TTMLIR_TTIR_ATTRS_TD
+#define TTMLIR_TTIR_ATTRS_TD
+
+include "mlir/IR/AttrTypeBase.td"
+include "ttmlir/Dialect/TTIR/IR/TTIRBase.td"
+
+def TTIR_ConvolutionLayoutAttr : AttrDef<TTIR_Dialect, "ConvolutionLayout"> {
+  let mnemonic = "convolution_layout";
+  let summary = "Structure of dimension information for convolution op";
+  let description = [{
+    Holds the layout information for the input activation, weights, and output.
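+
+    For example, an NCHW input / OIHW kernel / NCHW output configuration
+    (the layout exercised by the tests in this change) is written as:
+
+    ```mlir
+    #ttir<convolution_layout input_batch = 0, input_feature = 1, input_spatial_dimensions = 2x3, kernel_output_feature = 0, kernel_input_feature = 1, kernel_spatial_dimensions = 2x3, output_batch = 0, output_feature = 1, output_spatial_dimensions = 2x3>
+    ```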
+  }];
+
+  let parameters = (ins
+    "int64_t":$inputBatchDimension,
+    "int64_t":$inputFeatureDimension,
+    ArrayRefParameter<"int64_t">:$inputSpatialDimensions,
+
+    "int64_t":$kernelOutputFeatureDimension,
+    "int64_t":$kernelInputFeatureDimension,
+    ArrayRefParameter<"int64_t">:$kernelSpatialDimensions,
+
+    "int64_t":$outputBatchDimension,
+    "int64_t":$outputFeatureDimension,
+    ArrayRefParameter<"int64_t">:$outputSpatialDimensions
+  );
+
+  let assemblyFormat = [{
+    `input_batch` `=` $inputBatchDimension `,`
+    `input_feature` `=` $inputFeatureDimension `,`
+    `input_spatial_dimensions` `=` custom<DimensionList>($inputSpatialDimensions) `,`
+    `kernel_output_feature` `=` $kernelOutputFeatureDimension `,`
+    `kernel_input_feature` `=` $kernelInputFeatureDimension `,`
+    `kernel_spatial_dimensions` `=` custom<DimensionList>($kernelSpatialDimensions) `,`
+    `output_batch` `=` $outputBatchDimension `,`
+    `output_feature` `=` $outputFeatureDimension `,`
+    `output_spatial_dimensions` `=` custom<DimensionList>($outputSpatialDimensions)
+  }];
+}
+
+#endif // TTMLIR_TTIR_ATTRS_TD
diff --git a/lib/Conversion/StableHLOToTTIR/StableHLOToTTIRPatterns.cpp b/lib/Conversion/StableHLOToTTIR/StableHLOToTTIRPatterns.cpp
index d41650933..4cb2c3efa 100644
--- a/lib/Conversion/StableHLOToTTIR/StableHLOToTTIRPatterns.cpp
+++ b/lib/Conversion/StableHLOToTTIR/StableHLOToTTIRPatterns.cpp
@@ -373,46 +373,28 @@ class StableHLOToTTIRConvolutionOpConversionPattern
     tensor::EmptyOp outputTensor = rewriter.create<tensor::EmptyOp>(
         srcOp.getLoc(), outputType.getShape(), outputType.getElementType());
 
-    std::vector<int64_t> strides =
-        adaptor.getWindowStrides().value_or(ArrayRef<int64_t>({1, 1})).vec();
-    IntegerAttr stride_height_attr =
-        rewriter.getSI32IntegerAttr(static_cast<int32_t>(strides[0]));
-    IntegerAttr stride_width_attr =
-        rewriter.getSI32IntegerAttr(static_cast<int32_t>(strides[1]));
-
-    std::vector<int64_t> dilation =
-        adaptor.getLhsDilation().value_or(ArrayRef<int64_t>({1, 1})).vec();
-
-    IntegerAttr dilation_height_attr =
-        rewriter.getSI32IntegerAttr(static_cast<int32_t>(dilation[0]));
-    IntegerAttr dilation_width_attr =
-        rewriter.getSI32IntegerAttr(static_cast<int32_t>(dilation[1]));
-
-    IntegerAttr groups_attr = rewriter.getSI32IntegerAttr(
-        static_cast<int32_t>(adaptor.getFeatureGroupCount()));
-
-    std::vector<int32_t> padding;
-    if (!adaptor.getPadding().has_value()) {
-      padding = {0, 0, 0, 0};
-    } else {
-      for (auto iter = adaptor.getPadding()->value_begin<int64_t>();
-           iter < adaptor.getPadding()->value_end<int64_t>(); iter++) {
-        padding.push_back(static_cast<int32_t>(*iter));
-      }
-    }
-
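+    // stablehlo.convolution already carries batch/feature/spatial dimension
+    // numbers (e.g. [b, f, 0, 1]x[o, i, 0, 1]->[b, f, 0, 1] for an NCHW/OIHW
+    // convolution), so they transfer field-for-field onto the TTIR
+    // ConvolutionLayoutAttr constructed below.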
+    auto dimNums = adaptor.getDimensionNumbers();
+    rewriter.replaceOpWithNewOp<mlir::tt::ttir::ConvolutionOp>(
         srcOp, outputType, adaptor.getLhs(), adaptor.getRhs(),
-        mlir::Value(nullptr), outputTensor, stride_height_attr,
-        stride_width_attr, dilation_height_attr, dilation_width_attr,
-        groups_attr, rewriter.getSI32IntegerAttr(padding[0]),
-        rewriter.getSI32IntegerAttr(padding[1]),
-        rewriter.getSI32IntegerAttr(padding[2]),
-        rewriter.getSI32IntegerAttr(padding[3]),
+        mlir::Value(nullptr), outputTensor, adaptor.getWindowStridesAttr(),
+        adaptor.getPaddingAttr(), adaptor.getLhsDilationAttr(),
+        adaptor.getRhsDilationAttr(), adaptor.getWindowReversalAttr(),
+        mlir::tt::ttir::ConvolutionLayoutAttr::get(
+            getContext(), dimNums.getInputBatchDimension(),
+            dimNums.getInputFeatureDimension(),
+            dimNums.getInputSpatialDimensions(),
+            dimNums.getKernelOutputFeatureDimension(),
+            dimNums.getKernelInputFeatureDimension(),
+            dimNums.getKernelSpatialDimensions(),
+            dimNums.getOutputBatchDimension(),
+            dimNums.getOutputFeatureDimension(),
+            dimNums.getOutputSpatialDimensions()),
+        adaptor.getFeatureGroupCountAttr(), adaptor.getBatchGroupCountAttr(),
         rewriter.getArrayAttr(
             SmallVector<Attribute>(adaptor.getOperands().size() + 1,
                                    rewriter.getAttr<OperandConstraintAttr>(
                                        OperandConstraint::AnyDeviceTile))));
+
     return success();
   }
 };
diff --git a/lib/Conversion/TTIRToTTIRDecomposition/TTIRToTTIRDecomposition.cpp b/lib/Conversion/TTIRToTTIRDecomposition/TTIRToTTIRDecomposition.cpp
index b52571862..d361fce1f 100644
--- a/lib/Conversion/TTIRToTTIRDecomposition/TTIRToTTIRDecomposition.cpp
+++ b/lib/Conversion/TTIRToTTIRDecomposition/TTIRToTTIRDecomposition.cpp
@@ -74,10 +74,339 @@ struct IndexToSliceConversionPattern
   }
 };
 
+//===----------------------------------------------------------------------===//
+// Convolution passes
+//===----------------------------------------------------------------------===//
+
+using TransposeDims = std::tuple<int64_t, int64_t>;
+
+template <uint32_t NDims>
+using PaddingMatrix = std::array<std::array<int64_t, 2>, NDims>;
+
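+// Unpacks a flattened padding attribute into one (low, high) pair per spatial
+// dimension, most-significant dimension first. For example,
+// dense<[[1, 2], [3, 4]]> flattens to {1, 2, 3, 4} and becomes
+// {{1, 2}, {3, 4}}.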
+template <uint32_t NDims>
+static PaddingMatrix<NDims> getPaddingMatrix(DenseIntElementsAttr paddingAttr) {
+  PaddingMatrix<NDims> paddingMatrix;
+  std::vector<int64_t> paddingFlattened(paddingAttr.value_begin<int64_t>(),
+                                        paddingAttr.value_end<int64_t>());
+
+  for (uint32_t i = 0; i < 2 * NDims; i += 2) {
+    paddingMatrix[i / 2] = {paddingFlattened[i], paddingFlattened[i + 1]};
+  }
+  return paddingMatrix;
+}
+
+/*
+ * The following functions are used to generate the transpose operations
+ * needed to convert a convolution operation to the specific op definition
+ * of a ConvNdOp for any N spatial dimensions.
+ *
+ * All convolutions have a batch and a feature dimension, and the kernel has
+ * input and output feature dimensions. The spatial dimensions are
+ * represented by non-negative integers.
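+ *
+ * For example, an NCHW input is encoded as [BATCH, FEATURE, 0, 1]. To reach
+ * the NHWC layout [BATCH, 0, 1, FEATURE] expected below, the generators emit
+ * the swap sequence (1, 2) then (2, 3).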
+ */
+enum ConvolutionDimension { BATCH = -1, FEATURE = -2, INVALID_DIM = -3 };
+
+enum ConvolutionKernelDimension {
+  INPUT_FEATURES = -1,
+  OUTPUT_FEATURES = -2,
+  INVALID_KERNEL_DIM = -3
+};
+
+static tensor::EmptyOp generateTransposeDPSOutput(Value input, int64_t dim0,
+                                                  int64_t dim1,
+                                                  PatternRewriter &rewriter) {
+  auto input_type = mlir::cast<RankedTensorType>(input.getType());
+  auto output_shape = input_type.getShape().vec();
+  std::swap(output_shape[dim0], output_shape[dim1]);
+
+  auto output_type = RankedTensorType::get(
+      output_shape, input_type.getElementType(), input_type.getEncoding());
+
+  return rewriter.create<tensor::EmptyOp>(input.getLoc(), output_shape,
+                                          output_type.getElementType());
+}
+
+static ttir::TransposeOp
+generateTranspose(Value input, int64_t dim0, int64_t dim1,
+                  PatternRewriter &rewriter,
+                  ::mlir::ArrayAttr operandConstraints) {
+  auto input_type = mlir::cast<RankedTensorType>(input.getType());
+  auto output_shape = input_type.getShape().vec();
+  std::swap(output_shape[dim0], output_shape[dim1]);
+
+  auto dim0_attr = rewriter.getSI32IntegerAttr(dim0);
+  auto dim1_attr = rewriter.getSI32IntegerAttr(dim1);
+
+  auto dps_output = generateTransposeDPSOutput(input, dim0, dim1, rewriter);
+  return rewriter.create<ttir::TransposeOp>(
+      input.getLoc(), dps_output.getType(), input, dps_output, dim0_attr,
+      dim1_attr, operandConstraints);
+}
+
+static std::vector<TransposeDims> generateKernelTransposeIndices(
+    ttir::ConvolutionOp op,
+    const std::vector<int64_t> ttnn_convolution_kernel_layout) {
+  std::vector<TransposeDims> transpose_indices;
+
+  std::vector<int64_t> kernel_layout(
+      ttnn_convolution_kernel_layout.size(),
+      ConvolutionKernelDimension::INVALID_KERNEL_DIM);
+  kernel_layout[op.getConvolutionLayout().getKernelOutputFeatureDimension()] =
+      ConvolutionKernelDimension::OUTPUT_FEATURES;
+  kernel_layout[op.getConvolutionLayout().getKernelInputFeatureDimension()] =
+      ConvolutionKernelDimension::INPUT_FEATURES;
+
+  int64_t spatial_count = 0;
+  for (int64_t spatial_dim :
+       op.getConvolutionLayout().getKernelSpatialDimensions()) {
+    kernel_layout[spatial_dim] = spatial_count;
+    spatial_count++;
+  }
+
+  const std::vector<int64_t> desired_kernel_layout =
+      ttnn_convolution_kernel_layout;
+  for (int64_t i = 0; i < static_cast<int64_t>(kernel_layout.size()); i++) {
+    if (kernel_layout[i] != desired_kernel_layout[i]) {
+      int64_t dim0 = i;
+      int64_t dim1 = std::find(kernel_layout.begin(), kernel_layout.end(),
+                               desired_kernel_layout[i]) -
+                     kernel_layout.begin();
+      transpose_indices.push_back(std::make_tuple(dim0, dim1));
+      std::swap(kernel_layout[dim0], kernel_layout[dim1]);
+    }
+  }
+
+  return transpose_indices;
+}
+
+static std::vector<TransposeDims> generateInputTransposeIndices(
+    ttir::ConvolutionOp op,
+    const std::vector<int64_t> ttnn_convolution_layout) {
+  std::vector<TransposeDims> transpose_indices;
+
+  std::vector<int64_t> input_layout(ttnn_convolution_layout.size(),
+                                    ConvolutionDimension::INVALID_DIM);
+  input_layout[op.getConvolutionLayout().getInputBatchDimension()] =
+      ConvolutionDimension::BATCH;
+  input_layout[op.getConvolutionLayout().getInputFeatureDimension()] =
+      ConvolutionDimension::FEATURE;
+
+  int64_t spatial_count = 0;
+  for (int64_t spatial_dim :
+       op.getConvolutionLayout().getInputSpatialDimensions()) {
+    input_layout[spatial_dim] = spatial_count;
+    spatial_count++;
+  }
+
+  const std::vector<int64_t> desired_input_layout = ttnn_convolution_layout;
+  for (int64_t i = 0; i < static_cast<int64_t>(input_layout.size()); i++) {
+    if (input_layout[i] != desired_input_layout[i]) {
+      int64_t dim0 = i;
+      int64_t dim1 = std::find(input_layout.begin(), input_layout.end(),
+                               desired_input_layout[i]) -
+                     input_layout.begin();
+      transpose_indices.push_back(std::make_tuple(dim0, dim1));
+      std::swap(input_layout[dim0], input_layout[dim1]);
+    }
+  }
+
+  return transpose_indices;
+}
+
+/**
+ * Although this function is mostly a clone of generateInputTransposeIndices,
+ * it differs in one way: if the original convolution op had the same input
+ * and output layout, this function generates the same transposes that were
+ * applied to the input, but in reverse order. This makes it easier to
+ * optimize away the inserted transposes.
+ */
+static std::vector<TransposeDims> generateOutputTransposeIndices(
+    ttir::ConvolutionOp op,
+    const std::vector<int64_t> ttnn_convolution_layout) {
+  std::vector<TransposeDims> transpose_indices;
+
+  std::vector<int64_t> desired_output_layout(ttnn_convolution_layout.size(),
+                                             ConvolutionDimension::INVALID_DIM);
+  desired_output_layout[op.getConvolutionLayout().getOutputBatchDimension()] =
+      ConvolutionDimension::BATCH;
+  desired_output_layout[op.getConvolutionLayout().getOutputFeatureDimension()] =
+      ConvolutionDimension::FEATURE;
+
+  int64_t spatial_count = 0;
+  for (int64_t spatial_dim :
+       op.getConvolutionLayout().getOutputSpatialDimensions()) {
+    desired_output_layout[spatial_dim] = spatial_count;
+    spatial_count++;
+  }
+
+  std::vector<int64_t> output_layout = ttnn_convolution_layout;
+
+  for (int64_t i = static_cast<int64_t>(desired_output_layout.size()) - 1;
+       i >= 0; i--) {
+    if (desired_output_layout[i] != output_layout[i]) {
+      int64_t dim0 = i;
+      int64_t dim1 = std::find(output_layout.begin(), output_layout.end(),
+                               desired_output_layout[i]) -
+                     output_layout.begin();
+      transpose_indices.push_back(std::make_tuple(dim0, dim1));
+      std::swap(output_layout[dim0], output_layout[dim1]);
+    }
+  }
+
+  return transpose_indices;
+}
+
+static Value
+generateTransposeSequence(Value input, PatternRewriter &rewriter,
+                          std::vector<TransposeDims> transpose_indices,
+                          ::mlir::ArrayAttr operandConstraints) {
+  for (auto [dim0, dim1] : transpose_indices) {
+    input = generateTranspose(input, dim0, dim1, rewriter, operandConstraints)
+                .getResult();
+  }
+
+  return input;
+}
+
+struct ConvolutionToConv2dPattern
+    : public OpConversionPattern<ttir::ConvolutionOp> {
+public:
+  using OpConversionPattern<ttir::ConvolutionOp>::OpConversionPattern;
+
+  constexpr static uint32_t numSpatialDims = 2;
+  constexpr static uint32_t SPATIAL_DIM_HEIGHT = 0;
+  constexpr static uint32_t SPATIAL_DIM_WIDTH = 1;
+
+  // NHWC
+  const std::vector<int64_t> conv2d_layout = {
+      ConvolutionDimension::BATCH, SPATIAL_DIM_HEIGHT, SPATIAL_DIM_WIDTH,
+      ConvolutionDimension::FEATURE};
+  // OIHW
+  const std::vector<int64_t> conv2d_kernel_layout = {
+      ConvolutionKernelDimension::OUTPUT_FEATURES,
+      ConvolutionKernelDimension::INPUT_FEATURES, SPATIAL_DIM_HEIGHT,
+      SPATIAL_DIM_WIDTH};
+
+  LogicalResult isConv2d(ttir::ConvolutionOp op) const {
+    // Conv2d has exactly 2 spatial dimensions.
+    assert(op.getConvolutionLayout().getInputSpatialDimensions().size() ==
+               op.getConvolutionLayout().getOutputSpatialDimensions().size() &&
+           "Convolution input, output, and kernel must have the same number "
+           "of spatial dimensions");
+    assert(op.getConvolutionLayout().getInputSpatialDimensions().size() ==
+               op.getConvolutionLayout().getKernelSpatialDimensions().size() &&
+           "Convolution input, output, and kernel must have the same number "
+           "of spatial dimensions");
+
+    if (op.getConvolutionLayout().getInputSpatialDimensions().size() !=
+        numSpatialDims) {
+      return failure();
+    }
+
+    // Not currently supporting window reversal
+    std::vector<bool> window_reversal(op.getWindowReversal().begin(),
+                                      op.getWindowReversal().end());
+    for (bool reversed : window_reversal) {
+      if (reversed) {
+        return failure();
+      }
+    }
+
+    // Not currently supporting batch groups
+    if (op.getBatchGroupCount() != 1) {
+      return failure();
+    }
+
+    return success();
+  }
+
+  LogicalResult
+  matchAndRewrite(ttir::ConvolutionOp op, OpAdaptor adaptor,
+                  ConversionPatternRewriter &rewriter) const override {
+    if (failed(isConv2d(op))) {
+      return failure();
+    }
+
+    auto stride_height_attr = rewriter.getSI32IntegerAttr(
+        adaptor.getWindowStrides()[SPATIAL_DIM_HEIGHT]);
+    auto stride_width_attr = rewriter.getSI32IntegerAttr(
+        adaptor.getWindowStrides()[SPATIAL_DIM_WIDTH]);
+    auto dilation_height_attr = rewriter.getSI32IntegerAttr(
+        adaptor.getWeightDilation()[SPATIAL_DIM_HEIGHT]);
+    auto dilation_width_attr = rewriter.getSI32IntegerAttr(
+        adaptor.getWeightDilation()[SPATIAL_DIM_WIDTH]);
+
+    // Padding is a list of 2-tuples ordered most-significant spatial
+    // dimension first. For Conv2d the most significant spatial dimension is
+    // the height, followed by the width.
+    auto padding_matrix =
+        getPaddingMatrix<numSpatialDims>(adaptor.getPadding());
+    auto padding_top_attr =
+        rewriter.getSI32IntegerAttr(padding_matrix[SPATIAL_DIM_HEIGHT][0]);
+    auto padding_bottom_attr =
+        rewriter.getSI32IntegerAttr(padding_matrix[SPATIAL_DIM_HEIGHT][1]);
+    auto padding_left_attr =
+        rewriter.getSI32IntegerAttr(padding_matrix[SPATIAL_DIM_WIDTH][0]);
+    auto padding_right_attr =
+        rewriter.getSI32IntegerAttr(padding_matrix[SPATIAL_DIM_WIDTH][1]);
+
+    auto groups_attr =
+        rewriter.getSI32IntegerAttr(adaptor.getFeatureGroupCount());
+
+    auto output_shape = op.getResult().getType().getShape().vec();
+    std::vector<int64_t> new_output_shape = {
+        output_shape[adaptor.getConvolutionLayout().getOutputBatchDimension()],
+        output_shape[adaptor.getConvolutionLayout()
+                         .getOutputSpatialDimensions()[SPATIAL_DIM_HEIGHT]],
+        output_shape[adaptor.getConvolutionLayout()
+                         .getOutputSpatialDimensions()[SPATIAL_DIM_WIDTH]],
+        output_shape[adaptor.getConvolutionLayout()
+                         .getOutputFeatureDimension()]};
+
+    auto inputType =
+        mlir::cast<RankedTensorType>(adaptor.getInput().getType());
+    auto outputType =
+        inputType.cloneWith(new_output_shape, inputType.getElementType());
+
+    auto convDPSOutput = rewriter.create<tensor::EmptyOp>(
+        adaptor.getInput().getLoc(), new_output_shape,
+        outputType.getElementType());
+
+    auto input_transpose_indices =
+        generateInputTransposeIndices(op, conv2d_layout);
+    Value input = generateTransposeSequence(adaptor.getInput(), rewriter,
+                                            input_transpose_indices,
+                                            adaptor.getOperandConstraints());
+
+    auto kernel_transpose_indices =
+        generateKernelTransposeIndices(op, conv2d_kernel_layout);
+    Value weight = generateTransposeSequence(adaptor.getWeight(), rewriter,
+                                             kernel_transpose_indices,
+                                             adaptor.getOperandConstraints());
+
+    ttir::Conv2dOp new_conv = rewriter.create<ttir::Conv2dOp>(
+        op.getLoc(), outputType, input, weight, adaptor.getBias(),
+        convDPSOutput, stride_height_attr, stride_width_attr,
+        dilation_height_attr, dilation_width_attr, groups_attr,
+        padding_left_attr, padding_right_attr, padding_top_attr,
+        padding_bottom_attr, adaptor.getOperandConstraints());
+
+    auto output_transpose_indices =
+        generateOutputTransposeIndices(op, conv2d_layout);
+    Value output = generateTransposeSequence(new_conv.getResult(), rewriter,
+                                             output_transpose_indices,
+                                             adaptor.getOperandConstraints());
+
+    rewriter.replaceOp(op, output);
+
+    return success();
+  }
+};
+
 void populateTTIRToTTIRDecompositionPatterns(MLIRContext *ctx,
                                              RewritePatternSet &patterns,
                                              TypeConverter &typeConverter) {
   patterns.add<IndexToSliceConversionPattern>(typeConverter, ctx);
+  patterns.add<ConvolutionToConv2dPattern>(typeConverter, ctx);
 }
 
 } // namespace mlir::tt
diff --git a/lib/Conversion/TTIRToTTIRDecomposition/TTIRToTTIRDecompositionPass.cpp b/lib/Conversion/TTIRToTTIRDecomposition/TTIRToTTIRDecompositionPass.cpp
index 9a25856b0..e621e6b28 100644
--- a/lib/Conversion/TTIRToTTIRDecomposition/TTIRToTTIRDecompositionPass.cpp
+++ b/lib/Conversion/TTIRToTTIRDecomposition/TTIRToTTIRDecompositionPass.cpp
@@ -16,6 +16,7 @@
 #include "ttmlir/Dialect/TTNN/IR/TTNNOps.h"
 #include <mlir/Dialect/Func/IR/FuncOps.h>
 #include <mlir/Dialect/Tensor/IR/Tensor.h>
+#include <mlir/IR/BuiltinDialect.h>
 
 using namespace mlir;
 using namespace mlir::tt;
@@ -35,8 +36,18 @@ struct TTIRToTTIRDecompositionPass
   void runOnOperation() final {
     mlir::ConversionTarget target(getContext());
     target.addLegalDialect<ttir::TTIRDialect>();
+    target.addLegalDialect<mlir::func::FuncDialect>(); // we wish to keep
+                                                       // func.func and
+                                                       // func.call as legal ops
+    target.addLegalDialect<mlir::BuiltinDialect>(); // this contains the
+                                                    // "module" op, which is
+                                                    // necessary
+    target.addLegalOp<tensor::EmptyOp>(); // DPS operands are created with
+                                          // tensor::EmptyOp
+
+    // These are the ops we intend to remove entirely with this pass
     target.addIllegalOp<ttir::IndexOp>();
+    target.addIllegalOp<ttir::ConvolutionOp>();
 
     TypeConverter typeConverter;
     // All types map 1:1.
diff --git a/lib/Conversion/TTIRToTTNN/TTIRToTTNN.cpp b/lib/Conversion/TTIRToTTNN/TTIRToTTNN.cpp
index 6391d48e9..a873e0338 100644
--- a/lib/Conversion/TTIRToTTNN/TTIRToTTNN.cpp
+++ b/lib/Conversion/TTIRToTTNN/TTIRToTTNN.cpp
@@ -560,6 +560,30 @@ class Conv2dOpConversionPattern : public OpConversionPattern<ttir::Conv2dOp> {
 public:
   using OpConversionPattern<ttir::Conv2dOp>::OpConversionPattern;
 
+  ttnn::ReshapeOp generateReshape(ttir::Conv2dOp op, Value input,
+                                  ArrayRef<int64_t> newShape,
+                                  PatternRewriter &rewriter) const {
+    auto inputType = mlir::cast<RankedTensorType>(input.getType());
+    auto outputType =
+        inputType.cloneWith(newShape, inputType.getElementType());
+
+    std::vector<int32_t> newShapeI32(newShape.begin(), newShape.end());
+    return rewriter.create<ttnn::ReshapeOp>(
+        input.getLoc(), outputType, input,
+        rewriter.getI32ArrayAttr(newShapeI32));
+  }
+
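+  // ttnn.conv2d consumes its input flattened to <1x1x(N*H*W)xC>, e.g. a
+  // 1x128x128x32 NHWC tensor becomes 1x1x16384x32; the 4D output shape is
+  // restored with a reshape after the conv.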
+  ttnn::ReshapeOp generateNHWFlatten(ttir::Conv2dOp op, Value input,
+                                     PatternRewriter &rewriter) const {
+    std::vector<int64_t> shape =
+        mlir::cast<RankedTensorType>(input.getType()).getShape().vec();
+
+    assert(shape.size() == 4 && "Must have 4-dim tensor as conv2d input");
+
+    std::vector<int64_t> newShape = {1, 1, shape[0] * shape[1] * shape[2],
+                                     shape[3]};
+    return generateReshape(op, input, newShape, rewriter);
+  }
+
   LogicalResult
   matchAndRewrite(ttir::Conv2dOp op, OpAdaptor adaptor,
                   ConversionPatternRewriter &rewriter) const override {
@@ -611,13 +635,37 @@ class Conv2dOpConversionPattern : public OpConversionPattern<ttir::Conv2dOp> {
     auto dilation_width =
         rewriter.getI32IntegerAttr(adaptor.getDilationWidth());
     auto groups = rewriter.getI32IntegerAttr(adaptor.getGroups());
-    rewriter.replaceOpWithNewOp<ttnn::Conv2dOp>(
-        op, this->getTypeConverter()->convertType(op.getType()),
-        adaptor.getInput(), adaptor.getWeight(), adaptor.getBias(),
-        adaptor.getOutput(), device, in_channels, out_channels, batch_size,
-        input_height, input_width, kernel_height, kernel_width, stride_height,
-        stride_width, padding_height, padding_width, dilation_height,
-        dilation_width, groups);
+
+    std::vector<int64_t> flattenedInputShape = {
+        1, 1, input_shape[0] * input_shape[1] * input_shape[2],
+        input_shape[3]};
+    Value flattenedInput = generateNHWFlatten(op, adaptor.getInput(), rewriter);
+
+    std::vector<int64_t> flattenedOutputShape = {
+        1, 1, output_shape[0] * output_shape[1] * output_shape[2],
+        output_shape[3]};
+
+    output_ty = mlir::cast<RankedTensorType>(getTypeConverter()->convertType(
+        output_ty.cloneWith(flattenedOutputShape,
+                            output_ty.getElementType())));
+
+    // Using a tensor::EmptyOp so that the rewriter for EmptyOp can handle the
+    // attribute determination
+    auto convDPSOutput = rewriter.replaceOpWithNewOp<tensor::EmptyOp>(
+        adaptor.getOutput().getDefiningOp(), flattenedOutputShape,
+        output_ty.getElementType());
+
+    // Must set the type to the output type to maintain the layout attributes
+    convDPSOutput.getResult().setType(output_ty);
+
+    ttnn::Conv2dOp new_conv = rewriter.create<ttnn::Conv2dOp>(
+        op.getLoc(), output_ty, flattenedInput, adaptor.getWeight(),
+        adaptor.getBias(), convDPSOutput, device, in_channels, out_channels,
+        batch_size, input_height, input_width, kernel_height, kernel_width,
+        stride_height, stride_width, padding_height, padding_width,
+        dilation_height, dilation_width, groups);
+
+    Value output = generateReshape(op, new_conv, output_shape, rewriter);
+
+    rewriter.replaceOp(op, output);
     return success();
   }
 };
diff --git a/lib/Dialect/TTIR/IR/TTIRDialect.cpp b/lib/Dialect/TTIR/IR/TTIRDialect.cpp
index 46ec9bac2..73d259ea3 100644
--- a/lib/Dialect/TTIR/IR/TTIRDialect.cpp
+++ b/lib/Dialect/TTIR/IR/TTIRDialect.cpp
@@ -8,6 +8,11 @@
 #include "mlir/InitAllDialects.h"
 #include "mlir/Transforms/InliningUtils.h"
 #include "ttmlir/Dialect/TTIR/IR/TTIROps.h"
+#include "llvm/ADT/StringSet.h"
+#include "llvm/ADT/TypeSwitch.h"
+
+#define GET_ATTRDEF_CLASSES
+#include "ttmlir/Dialect/TTIR/IR/TTIROpsAttrs.cpp.inc"
 
 using namespace mlir;
 using namespace mlir::tt::ttir;
@@ -59,4 +64,8 @@ void TTIRDialect::initialize() {
 #include "ttmlir/Dialect/TTIR/IR/TTIROps.cpp.inc"
       >();
   addInterfaces<TTIRInlinerInterface>();
+  addAttributes<
+#define GET_ATTRDEF_LIST
+#include "ttmlir/Dialect/TTIR/IR/TTIROpsAttrs.cpp.inc"
+      >();
 }
diff --git a/lib/Dialect/TTIR/IR/TTIROps.cpp b/lib/Dialect/TTIR/IR/TTIROps.cpp
index c28bff26e..3ae2a7bad 100644
--- a/lib/Dialect/TTIR/IR/TTIROps.cpp
+++ b/lib/Dialect/TTIR/IR/TTIROps.cpp
@@ -62,6 +62,54 @@ ::mlir::LogicalResult mlir::tt::ttir::Conv2dOp::verify() {
   return success();
 }
 
+//===----------------------------------------------------------------------===//
+// ConvolutionOp
+//===----------------------------------------------------------------------===//
+
+::mlir::LogicalResult mlir::tt::ttir::ConvolutionOp::verify() {
+  if (getConvolutionLayout().getInputSpatialDimensions().size() !=
+      getConvolutionLayout().getOutputSpatialDimensions().size()) {
+    return emitOpError("Convolution input, output, and kernel must have the "
+                       "same number of spatial dimensions");
+  }
+  if (getConvolutionLayout().getInputSpatialDimensions().size() !=
+      getConvolutionLayout().getKernelSpatialDimensions().size()) {
+    return emitOpError("Convolution input, output, and kernel must have the "
+                       "same number of spatial dimensions");
+  }
+
+  // Subtract 2 from the rank so as not to count the batch and feature
+  // dimensions
+  if (getInput().getType().getRank() - 2 !=
+      (int64_t)getConvolutionLayout().getInputSpatialDimensions().size()) {
+    return emitOpError("Input tensor must have the same number of spatial "
+                       "dimensions as specified in the ConvolutionLayout");
+  }
+
+  if (getWeight().getType().getRank() - 2 !=
+      (int64_t)getConvolutionLayout().getKernelSpatialDimensions().size()) {
+    return emitOpError("Weight tensor must have the same number of spatial "
+                       "dimensions as specified in the ConvolutionLayout");
+  }
+
+  std::optional<::mlir::RankedTensorType> biasType =
+      getBias().getImpl() ? std::make_optional(getBias().getType())
+                          : std::nullopt;
+
+  if (biasType.has_value()) {
+    if (biasType->getRank() != 4) {
+      return emitOpError("Bias must be a 4D tensor");
+    }
+  }
+
+  if (getWindowStrides().size() !=
+      getConvolutionLayout().getInputSpatialDimensions().size()) {
+    return emitOpError("Window strides must have the same number of elements "
+                       "as the spatial dimensions of the input tensor");
+  }
+
+  return success();
+}
+
 //===----------------------------------------------------------------------===//
 // MaxPool2dOp
 //===----------------------------------------------------------------------===//
diff --git a/runtime/lib/ttnn/operations/conv/conv2d.cpp b/runtime/lib/ttnn/operations/conv/conv2d.cpp
index 75e398350..31d922ac0 100644
--- a/runtime/lib/ttnn/operations/conv/conv2d.cpp
+++ b/runtime/lib/ttnn/operations/conv/conv2d.cpp
@@ -7,6 +7,7 @@
 #include "tt/runtime/detail/ttnn.h"
 #include "tt/runtime/ttnn/operations/utils.h"
 #include "ttmlir/Target/TTNN/program_generated.h"
+#include "ttnn/types.hpp"
 
 namespace tt::runtime::ttnn::operations::conv {
 void run(const ::tt::target::ttnn::Conv2dOp *op, ProgramContext &context) {
@@ -26,6 +27,7 @@ void run(const ::tt::target::ttnn::Conv2dOp *op, ProgramContext &context) {
   auto config = ::ttnn::operations::conv::conv2d::Conv2dConfig();
   config.dtype = utils::getDataType(op->input());
   config.weights_dtype = utils::getDataType(op->weight());
+  ::ttnn::MemoryConfig outMemConfig = utils::createMemoryConfig(op->out());
   ::ttnn::Tensor out =
       std::get<0>(::ttnn::operations::conv::conv2d::conv2d<::ttnn::Device>(
           input, weight, &device, op->in_channels(), op->out_channels(),
@@ -34,7 +36,7 @@ void run(const ::tt::target::ttnn::Conv2dOp *op, ProgramContext &context) {
           {op->stride_height(), op->stride_width()},
           {op->padding_height(), op->padding_width()},
           {op->dilation_height(), op->dilation_width()}, op->groups(), bias,
-          config));
+          config, outMemConfig));
   tensorPool.insert_or_assign(op->out()->global_id(), out);
 }
 } // namespace tt::runtime::ttnn::operations::conv
diff --git a/test/ttmlir/Conversion/StableHLOToTTIR/conv2d_op.mlir b/test/ttmlir/Conversion/StableHLOToTTIR/conv2d_op.mlir
index f2d708e82..ce4a6f656 100644
--- a/test/ttmlir/Conversion/StableHLOToTTIR/conv2d_op.mlir
+++ b/test/ttmlir/Conversion/StableHLOToTTIR/conv2d_op.mlir
@@ -7,16 +7,13 @@ module @jit_convolution attributes {} {
             window = {
               stride = [1, 1],
               pad = [[1, 1], [1, 1]],
-              lhs_dilate = [1, 1],
-              rhs_dilate = [1, 1],
-              reverse = [0, 0]
             } {
           feature_group_count = 1 : i64,
           batch_group_count = 1 : i64,
           precision_config = [#stablehlo<precision DEFAULT>, #stablehlo<precision DEFAULT>]
         } : (tensor<1x128x128x32xf32>, tensor<64x32x3x3xf32>) -> tensor<1x128x128x64xf32>
     // CHECK: %[[C:.*]] = tensor.empty[[C:.*]]
-    // CHECK: %[[C:.*]] = "ttir.conv2d"[[C:.*]]
+    // CHECK: %[[C:.*]] = "ttir.convolution"[[C:.*]]
     return %0 : tensor<1x128x128x64xf32>
   }
 }
diff --git a/test/ttmlir/Dialect/TTIR/convolution/convolution_tests_negative.mlir b/test/ttmlir/Dialect/TTIR/convolution/convolution_tests_negative.mlir
new file mode 100644
index 000000000..c400e938a
--- /dev/null
+++ b/test/ttmlir/Dialect/TTIR/convolution/convolution_tests_negative.mlir
@@ -0,0 +1,155 @@
+// RUN: not ttmlir-opt --split-input-file %s 2>&1 | FileCheck %s
+#any_device_tile = #tt.operand_constraint<dram|l1|tile|any_device_tile>
+
+module @jit_convolution_bad_spatial_dimensions {
+  func.func public @test_illegal_convolution(%arg0: tensor<1x3x100x100xbf16>, %arg1: tensor<7x3x3x3xbf16>) -> tensor<1x7x100x100xbf16> {
+    %0 = tensor.empty() : tensor<1x7x100x100xbf16>
+    // CHECK: error: 'ttir.convolution' op Convolution input, output, and kernel must have the same number of spatial dimensions
+    %1 = "ttir.convolution"(%arg0, %arg1, %0) <{
+      batch_group_count = 1 : i64,
+      convolution_layout = #ttir<convolution_layout input_batch = 0, input_feature = 1, input_spatial_dimensions = 2x3, kernel_output_feature = 0, kernel_input_feature = 1, kernel_spatial_dimensions = 2x3, output_batch = 0, output_feature = 1, output_spatial_dimensions = 2>,
+      feature_group_count = 1 : i64,
+      input_dilation = array<i64: 1, 1>,
+      operand_constraints = [#any_device_tile, #any_device_tile, #any_device_tile],
+      padding = dense<1> : tensor<2x2xi64>,
+      weight_dilation = array<i64: 1, 1>,
+      window_reversal = array<i1: false, false>,
+      window_strides = array<i64: 1, 1>
+    }> : (tensor<1x3x100x100xbf16>, tensor<7x3x3x3xbf16>, tensor<1x7x100x100xbf16>) -> tensor<1x7x100x100xbf16>
+    return %1 : tensor<1x7x100x100xbf16>
+  }
+}
+
+// -----
+#any_device_tile = #tt.operand_constraint<dram|l1|tile|any_device_tile>
+module @jit_convolution_bad_stride_dimensions {
+  func.func public @test_illegal_convolution(%arg0: tensor<1x3x100x100xbf16>, %arg1: tensor<7x3x3x3xbf16>) -> tensor<1x7x100x100xbf16> {
+    %0 = tensor.empty() : tensor<1x7x100x100xbf16>
+    // CHECK: error: 'ttir.convolution' op Window strides must have the same number of elements as the spatial dimensions of the input tensor
+    %1 = "ttir.convolution"(%arg0, %arg1, %0) <{
+      batch_group_count = 1 : i64,
+      convolution_layout = #ttir<convolution_layout input_batch = 0, input_feature = 1, input_spatial_dimensions = 2x3, kernel_output_feature = 0, kernel_input_feature = 1, kernel_spatial_dimensions = 2x3, output_batch = 0, output_feature = 1, output_spatial_dimensions = 2x3>,
+      feature_group_count = 1 : i64,
+      input_dilation = array<i64: 1, 1>,
+      operand_constraints = [#any_device_tile, #any_device_tile, #any_device_tile],
+      padding = dense<1> : tensor<2x2xi64>,
+      weight_dilation = array<i64: 1, 1>,
+      window_reversal = array<i1: false, false>,
+      window_strides = array<i64: 1, 1, 1>
+    }> : (tensor<1x3x100x100xbf16>, tensor<7x3x3x3xbf16>, tensor<1x7x100x100xbf16>) -> tensor<1x7x100x100xbf16>
+    return %1 : tensor<1x7x100x100xbf16>
+  }
+}
+
+// -----
+#any_device_tile = #tt.operand_constraint<dram|l1|tile|any_device_tile>
+module @jit_convolution_bad_input_tensor {
+  func.func public @test_illegal_convolution(%arg0: tensor<1x3x100x100x100xbf16>, %arg1: tensor<7x3x3x3xbf16>) -> tensor<1x7x100x100xbf16> {
+    %0 = tensor.empty() : tensor<1x7x100x100xbf16>
+    // CHECK: error: 'ttir.convolution' op Input tensor must have the same number of spatial dimensions as specified in the ConvolutionLayout
+    %1 = "ttir.convolution"(%arg0, %arg1, %0) <{
+      batch_group_count = 1 : i64,
+      convolution_layout = #ttir<convolution_layout input_batch = 0, input_feature = 1, input_spatial_dimensions = 2x3, kernel_output_feature = 0, kernel_input_feature = 1, kernel_spatial_dimensions = 2x3, output_batch = 0, output_feature = 1, output_spatial_dimensions = 2x3>,
+      feature_group_count = 1 : i64,
+      input_dilation = array<i64: 1, 1>,
+      operand_constraints = [#any_device_tile, #any_device_tile, #any_device_tile],
+      padding = dense<1> : tensor<2x2xi64>,
+      weight_dilation = array<i64: 1, 1>,
+      window_reversal = array<i1: false, false>,
+      window_strides = array<i64: 1, 1>
+    }> : (tensor<1x3x100x100x100xbf16>, tensor<7x3x3x3xbf16>, tensor<1x7x100x100xbf16>) -> tensor<1x7x100x100xbf16>
+    return %1 : tensor<1x7x100x100xbf16>
+  }
+}
+
+// -----
+#any_device_tile = #tt.operand_constraint<dram|l1|tile|any_device_tile>
+module @jit_convolution_bad_weight_tensor {
+  func.func public @test_illegal_convolution(%arg0: tensor<1x3x100x100xbf16>, %arg1: tensor<20x7x3x3x3xbf16>) -> tensor<1x7x100x100xbf16> {
+    %0 = tensor.empty() : tensor<1x7x100x100xbf16>
+    // CHECK: error: 'ttir.convolution' op Weight tensor must have the same number of spatial dimensions as specified in the ConvolutionLayout
+    %1 = "ttir.convolution"(%arg0, %arg1, %0) <{
+      batch_group_count = 1 : i64,
+      convolution_layout = #ttir<convolution_layout input_batch = 0, input_feature = 1, input_spatial_dimensions = 2x3, kernel_output_feature = 0, kernel_input_feature = 1, kernel_spatial_dimensions = 2x3, output_batch = 0, output_feature = 1, output_spatial_dimensions = 2x3>,
+      feature_group_count = 1 : i64,
+      input_dilation = array<i64: 1, 1>,
+      operand_constraints = [#any_device_tile, #any_device_tile, #any_device_tile],
+      padding = dense<1> : tensor<2x2xi64>,
+      weight_dilation = array<i64: 1, 1>,
+      window_reversal = array<i1: false, false>,
+      window_strides = array<i64: 1, 1>
+    }> : (tensor<1x3x100x100xbf16>, tensor<20x7x3x3x3xbf16>, tensor<1x7x100x100xbf16>) -> tensor<1x7x100x100xbf16>
+    return %1 : tensor<1x7x100x100xbf16>
+  }
+}
+
+// -----
+#any_device_tile = #tt.operand_constraint<dram|l1|tile|any_device_tile>
+module @jit_convolution_bad_bias_tensor {
+  func.func public @test_illegal_convolution(%arg0: tensor<1x3x100x100xbf16>, %arg1: tensor<7x3x3x3xbf16>, %arg2: tensor<1x1x7xbf16>) -> tensor<1x7x100x100xbf16> {
+    %0 = tensor.empty() : tensor<1x7x100x100xbf16>
+    // CHECK: error: 'ttir.convolution' op Bias must be a 4D tensor
+    %1 = "ttir.convolution"(%arg0, %arg1, %arg2, %0) <{
+      batch_group_count = 1 : i64,
+      convolution_layout = #ttir<convolution_layout input_batch = 0, input_feature = 1, input_spatial_dimensions = 2x3, kernel_output_feature = 0, kernel_input_feature = 1, kernel_spatial_dimensions = 2x3, output_batch = 0, output_feature = 1, output_spatial_dimensions = 2x3>,
+      feature_group_count = 1 : i64,
+      input_dilation = array<i64: 1, 1>,
+      operand_constraints = [#any_device_tile, #any_device_tile, #any_device_tile],
+      padding = dense<1> : tensor<2x2xi64>,
+      weight_dilation = array<i64: 1, 1>,
+      window_reversal = array<i1: false, false>,
+      window_strides = array<i64: 1, 1>
+    }> : (tensor<1x3x100x100xbf16>, tensor<7x3x3x3xbf16>, tensor<1x1x7xbf16>, tensor<1x7x100x100xbf16>) -> tensor<1x7x100x100xbf16>
+    return %1 : tensor<1x7x100x100xbf16>
+  }
+}
diff --git a/test/ttmlir/Dialect/TTNN/convolution/complex_conv_channel_first.mlir b/test/ttmlir/Dialect/TTNN/convolution/complex_conv_channel_first.mlir
new file mode 100644
index 000000000..1a146ef0d
--- /dev/null
+++ b/test/ttmlir/Dialect/TTNN/convolution/complex_conv_channel_first.mlir
@@ -0,0 +1,34 @@
+// RUN: ttmlir-opt --ttir-to-ttnn-backend-pipeline %s | FileCheck %s
+#any_device_tile = #tt.operand_constraint<dram|l1|tile|any_device_tile>
+module @jit_convolution {
+  func.func public @test_NCHW_IOHW_to_NHWC_OIHW_conv2d(%arg0: tensor<1x3x100x100xbf16>, %arg1: tensor<7x3x3x3xbf16>) -> tensor<1x7x100x100xbf16> {
+    %0 = tensor.empty() : tensor<1x7x100x100xbf16>
+    // CHECK: %[[C:.*]] = "ttnn.transpose"[[C:.*]]
+    // CHECK: %[[C:.*]] = "ttnn.transpose"[[C:.*]]
+    // CHECK: %[[C:.*]] = "ttnn.conv2d"[[C:.*]]
+    %1 = "ttir.convolution"(%arg0, %arg1, %0) <{
+      batch_group_count = 1 : i64,
+      convolution_layout = #ttir<convolution_layout input_batch = 0, input_feature = 1, input_spatial_dimensions = 2x3, kernel_output_feature = 0, kernel_input_feature = 1, kernel_spatial_dimensions = 2x3, output_batch = 0, output_feature = 1, output_spatial_dimensions = 2x3>,
+      feature_group_count = 1 : i64,
+      input_dilation = array<i64: 1, 1>,
+      operand_constraints = [#any_device_tile, #any_device_tile, #any_device_tile],
+      padding = dense<1> : tensor<2x2xi64>,
+      weight_dilation = array<i64: 1, 1>,
+      window_reversal = array<i1: false, false>,
+      window_strides = array<i64: 1, 1>
+    }> : (tensor<1x3x100x100xbf16>, tensor<7x3x3x3xbf16>, tensor<1x7x100x100xbf16>) -> tensor<1x7x100x100xbf16>
+    // CHECK: %[[C:.*]] = "ttnn.transpose"[[C:.*]]
+    // CHECK: %[[C:.*]] = "ttnn.transpose"[[C:.*]]
+    return %1 : tensor<1x7x100x100xbf16>
+  }
+}
diff --git a/test/ttmlir/Dialect/TTNN/simple_conv.mlir b/test/ttmlir/Dialect/TTNN/convolution/simple_conv.mlir
similarity index 100%
rename from test/ttmlir/Dialect/TTNN/simple_conv.mlir
rename to test/ttmlir/Dialect/TTNN/convolution/simple_conv.mlir
diff --git a/test/ttmlir/Silicon/TTNN/complex_conv_channel_first.mlir b/test/ttmlir/Silicon/TTNN/complex_conv_channel_first.mlir
new file mode 100644
index 000000000..3dca895c8
--- /dev/null
+++ b/test/ttmlir/Silicon/TTNN/complex_conv_channel_first.mlir
@@ -0,0 +1,36 @@
+// RUN: ttmlir-opt --ttir-to-ttnn-backend-pipeline="system-desc-path=%system_desc_path%" %s > %t.mlir
+// RUN: FileCheck %s --input-file=%t.mlir
+// RUN: ttmlir-translate --ttnn-to-flatbuffer %t.mlir > %t.ttnn
+#any_device_tile = #tt.operand_constraint<dram|l1|tile|any_device_tile>
+module @jit_convolution {
+  func.func public @test_NCHW_IOHW_to_NHWC_OIHW_conv2d(%arg0: tensor<1x3x100x100xbf16>, %arg1: tensor<7x3x3x3xbf16>) -> tensor<1x7x100x100xbf16> {
+    %0 = tensor.empty() : tensor<1x7x100x100xbf16>
+    // CHECK: %[[C:.*]] = "ttnn.transpose"[[C:.*]]
+    // CHECK: %[[C:.*]] = "ttnn.transpose"[[C:.*]]
+    // CHECK: %[[C:.*]] = "ttnn.conv2d"[[C:.*]]
+    %1 = "ttir.convolution"(%arg0, %arg1, %0) <{
+      batch_group_count = 1 : i64,
+      convolution_layout = #ttir<convolution_layout input_batch = 0, input_feature = 1, input_spatial_dimensions = 2x3, kernel_output_feature = 0, kernel_input_feature = 1, kernel_spatial_dimensions = 2x3, output_batch = 0, output_feature = 1, output_spatial_dimensions = 2x3>,
+      feature_group_count = 1 : i64,
+      input_dilation = array<i64: 1, 1>,
+      operand_constraints = [#any_device_tile, #any_device_tile, #any_device_tile],
+      padding = dense<1> : tensor<2x2xi64>,
+      weight_dilation = array<i64: 1, 1>,
+      window_reversal = array<i1: false, false>,
+      window_strides = array<i64: 1, 1>
+    }> : (tensor<1x3x100x100xbf16>, tensor<7x3x3x3xbf16>, tensor<1x7x100x100xbf16>) -> tensor<1x7x100x100xbf16>
+    // CHECK: %[[C:.*]] = "ttnn.transpose"[[C:.*]]
+    // CHECK: %[[C:.*]] = "ttnn.transpose"[[C:.*]]
+    return %1 : tensor<1x7x100x100xbf16>
+  }
+}