Skip to content

Commit d168e37

Browse files
asraa and copybara-github
authored and committed
Drop unit dimensions in tensor_ext.rotate and tensor_ext.rotate_and_reduce.
This allows rotation operations to be run on 1-D tensors.

PiperOrigin-RevId: 800635444
1 parent 00832e9 commit d168e37

File tree

6 files changed

+194
-39
lines changed

6 files changed

+194
-39
lines changed

lib/Transforms/ConvertToCiphertextSemantics/BUILD

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -16,6 +16,7 @@ cc_library(
1616
":pass_inc_gen",
1717
"@heir//lib/Dialect/Secret/IR:SecretPatterns",
1818
"@heir//lib/Dialect/TensorExt/IR:Dialect",
19+
"@heir//lib/Transforms/DropUnitDims",
1920
"@heir//lib/Utils",
2021
"@heir//lib/Utils:AffineMapUtils",
2122
"@heir//lib/Utils:AttributeUtils",

lib/Transforms/ConvertToCiphertextSemantics/ConvertToCiphertextSemantics.cpp

Lines changed: 100 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -16,6 +16,7 @@
1616
#include "lib/Dialect/TensorExt/IR/TensorExtOps.h"
1717
#include "lib/Transforms/ConvertToCiphertextSemantics/AssignLayout.h"
1818
#include "lib/Transforms/ConvertToCiphertextSemantics/TypeConversion.h"
19+
#include "lib/Transforms/DropUnitDims/DropUnitDims.h"
1920
#include "lib/Utils/AffineMapUtils.h"
2021
#include "lib/Utils/AttributeUtils.h"
2122
#include "lib/Utils/ContextAwareConversionUtils.h"
@@ -27,6 +28,7 @@
2728
#include "lib/Utils/Utils.h"
2829
#include "llvm/include/llvm/ADT/ArrayRef.h" // from @llvm-project
2930
#include "llvm/include/llvm/ADT/STLExtras.h" // from @llvm-project
31+
#include "llvm/include/llvm/ADT/SmallVector.h" // from @llvm-project
3032
#include "llvm/include/llvm/ADT/StringExtras.h" // from @llvm-project
3133
#include "llvm/include/llvm/Support/Debug.h" // from @llvm-project
3234
#include "llvm/include/llvm/Support/raw_ostream.h" // from @llvm-project
@@ -47,13 +49,13 @@
4749
#include "mlir/include/mlir/IR/BuiltinTypeInterfaces.h" // from @llvm-project
4850
#include "mlir/include/mlir/IR/BuiltinTypes.h" // from @llvm-project
4951
#include "mlir/include/mlir/IR/ImplicitLocOpBuilder.h" // from @llvm-project
52+
#include "mlir/include/mlir/IR/OpDefinition.h" // from @llvm-project
5053
#include "mlir/include/mlir/IR/OperationSupport.h" // from @llvm-project
5154
#include "mlir/include/mlir/IR/PatternMatch.h" // from @llvm-project
5255
#include "mlir/include/mlir/Support/LLVM.h" // from @llvm-project
5356
#include "mlir/include/mlir/Support/LogicalResult.h" // from @llvm-project
5457
#include "mlir/include/mlir/Transforms/DialectConversion.h" // from @llvm-project
5558
#include "mlir/include/mlir/Transforms/GreedyPatternRewriteDriver.h" // from @llvm-project
56-
#include "mlir/include/mlir/Transforms/WalkPatternRewriteDriver.h" // from @llvm-project
5759

5860
#define DEBUG_TYPE "convert-to-ciphertext-semantics"
5961

@@ -1357,7 +1359,6 @@ class ConvertExpandShape
13571359
if (!sourceLayout) {
13581360
return op.emitError() << "failed to fetch new layout attribute for input";
13591361
}
1360-
op.dump();
13611362

13621363
if (resultType != srcType) {
13631364
return rewriter.notifyMatchFailure(
@@ -1385,6 +1386,99 @@ class ConvertExpandShape
13851386
}
13861387
};
13871388

1389+
// Rewrites a tensor_ext.rotate whose input tensor has unit dimensions so that
// it operates on the collapsed (unit-dim-free) tensor, then expands the
// rotated result back to the original output type. This lets rotation ops be
// lowered as effectively 1-D operations.
struct DropRotateUnitDims : OpRewritePattern<tensor_ext::RotateOp> {
  using OpRewritePattern<tensor_ext::RotateOp>::OpRewritePattern;

  LogicalResult matchAndRewrite(tensor_ext::RotateOp rotateOp,
                                PatternRewriter& rewriter) const override {
    SmallVector<int64_t> unitDims = getUnitDims(rotateOp.getTensor().getType());
    if (unitDims.empty()) {
      LLVM_DEBUG(llvm::dbgs() << "no unit dims to drop");
      return failure();
    }

    // Collapse the sole operand, rotate on the collapsed tensor, and expand
    // the result back to the original shape.
    Value collapsed =
        collapseOperands(rewriter, {rotateOp.getTensor()}, unitDims)[0];
    auto newRotate = tensor_ext::RotateOp::create(
        rewriter, rotateOp.getLoc(), collapsed, rotateOp.getShift());
    Value expanded = expandResult(rewriter, newRotate.getResult(),
                                  rotateOp.getOutput().getType(), unitDims);
    rewriter.replaceOp(rotateOp, expanded);
    return success();
  }
};
1412+
1413+
struct DropRotateAndReduceUnitDims
1414+
: OpRewritePattern<tensor_ext::RotateAndReduceOp> {
1415+
using OpRewritePattern<tensor_ext::RotateAndReduceOp>::OpRewritePattern;
1416+
1417+
LogicalResult matchAndRewrite(tensor_ext::RotateAndReduceOp rotateOp,
1418+
PatternRewriter& rewriter) const override {
1419+
SmallVector<int64_t> operandUnitDims =
1420+
getUnitDims(rotateOp.getTensor().getType());
1421+
if (operandUnitDims.empty()) {
1422+
LLVM_DEBUG(llvm::dbgs() << "no unit dims to drop");
1423+
return failure();
1424+
}
1425+
1426+
SmallVector<Value> collapsedOperands =
1427+
collapseOperands(rewriter, {rotateOp.getTensor()}, operandUnitDims);
1428+
1429+
auto collapsedOp = tensor_ext::RotateAndReduceOp::create(
1430+
rewriter, rotateOp.getLoc(), collapsedOperands[0],
1431+
rotateOp.getPlaintexts(), rotateOp.getPeriod(), rotateOp.getSteps());
1432+
rewriter.replaceOp(rotateOp, expandResult(rewriter, collapsedOp.getResult(),
1433+
rotateOp.getOutput().getType(),
1434+
operandUnitDims));
1435+
return success();
1436+
}
1437+
};
1438+
1439+
// Drops unit dimensions from single-result elementwise ops whose operands and
// result all share one ranked tensor type: every operand is collapsed, the op
// is recreated (same name and attributes) on the collapsed type, and the
// result is expanded back to the original shape.
struct DropElementwiseUnitDims : OpTraitRewritePattern<OpTrait::Elementwise> {
  explicit DropElementwiseUnitDims(MLIRContext* context)
      : OpTraitRewritePattern(context) {}

  LogicalResult matchAndRewrite(mlir::Operation* op,
                                PatternRewriter& rewriter) const override {
    // Only handle ops with at least one operand, exactly one result, and a
    // single shared type across all operands and results.
    if (op->getNumOperands() == 0 || op->getNumResults() != 1) {
      return failure();
    }
    SmallVector<Type> allTypes = llvm::to_vector(op->getOperandTypes());
    allTypes.append(op->getResultTypes().begin(), op->getResultTypes().end());
    if (!llvm::all_equal(allTypes)) {
      return failure();
    }

    auto tensorType = dyn_cast<RankedTensorType>(op->getOperand(0).getType());
    if (!tensorType) {
      return failure();
    }

    SmallVector<int64_t> unitDims = getUnitDims(tensorType);
    if (unitDims.empty()) {
      LLVM_DEBUG(llvm::dbgs() << "no unit dims to drop");
      return failure();
    }

    SmallVector<Value> collapsed = collapseOperands(
        rewriter, llvm::to_vector(op->getOperands()), unitDims);

    // Recreate the op generically on the collapsed operands; the collapsed
    // result type equals the collapsed operand type since all types match.
    OperationState state(op->getLoc(), op->getName().getStringRef(), collapsed,
                         collapsed[0].getType(), op->getAttrs(),
                         op->getSuccessors());
    Operation* newOp = rewriter.create(state);

    rewriter.replaceOp(
        op, expandResult(rewriter, newOp->getResults()[0],
                         cast<RankedTensorType>(op->getResult(0).getType()),
                         unitDims));
    return success();
  }
};
1481+
13881482
struct ConvertToCiphertextSemantics
13891483
: impl::ConvertToCiphertextSemanticsBase<ConvertToCiphertextSemantics> {
13901484
using ConvertToCiphertextSemanticsBase::ConvertToCiphertextSemanticsBase;
@@ -1425,6 +1519,10 @@ struct ConvertToCiphertextSemantics
14251519
// Note ConvertAssignLayout generates tensor.concat
14261520
RewritePatternSet cleanupPatterns2(context);
14271521
tensor::populateDecomposeTensorConcatPatterns(cleanupPatterns2);
1522+
// Drop unit dimensions for tensor_ext ops that require 1-D tensors (i.e.
1523+
// rotation ops) and elementwise ops.
1524+
cleanupPatterns2.add<DropRotateUnitDims, DropRotateAndReduceUnitDims,
1525+
DropElementwiseUnitDims>(context);
14281526
// Folding here will remove any unrealized conversion cast ops that were
14291527
// inserted to persist new layouts.
14301528
if (failed(applyPatternsGreedily(module, std::move(cleanupPatterns2)))) {

lib/Transforms/DropUnitDims/DropUnitDims.cpp

Lines changed: 35 additions & 35 deletions
Original file line numberDiff line numberDiff line change
@@ -37,21 +37,30 @@ namespace heir {
3737

3838
namespace {
3939

40-
/// Collapse the given `value` so that the type matches the type of
41-
/// `origOutput`.
42-
static Value collapseValue(RewriterBase& rewriter, Location loc, Value operand,
43-
ArrayRef<int64_t> targetShape,
44-
ArrayRef<ReassociationIndices> reassociation) {
40+
// Collapses `operand` to `targetShape` via tensor.collapse_shape with the
// given reassociation, preserving the element type.
Value collapseValue(RewriterBase& rewriter, Location loc, Value operand,
                    ArrayRef<int64_t> targetShape,
                    ArrayRef<ReassociationIndices> reassociation) {
  auto elementType =
      cast<RankedTensorType>(operand.getType()).getElementType();
  auto collapsedType = RankedTensorType::get(targetShape, elementType);
  return tensor::CollapseShapeOp::create(rewriter, loc, collapsedType, operand,
                                         reassociation);
}
5149

52-
/// Returns a collapsed `val` where the collapsing occurs at dims in positions.
53-
static Value collapseDimsAt(PatternRewriter& rewriter, Value val,
54-
ArrayRef<int64_t> positions) {
50+
} // namespace
51+
52+
// Returns the indices of all dimensions of `type` with static size 1.
SmallVector<int64_t> getUnitDims(ShapedType type) {
  SmallVector<int64_t> result;
  for (int64_t dim = 0, rank = type.getRank(); dim < rank; ++dim) {
    if (type.getDimSize(dim) == 1) result.push_back(dim);
  }
  return result;
}
61+
62+
Value collapseDimsAt(PatternRewriter& rewriter, Value val,
63+
ArrayRef<int64_t> positions) {
5564
auto valType = cast<ShapedType>(val.getType());
5665
SmallVector<int64_t> collapsedShape(valType.getShape());
5766
for (int64_t pos : llvm::reverse(positions)) {
@@ -62,7 +71,22 @@ static Value collapseDimsAt(PatternRewriter& rewriter, Value val,
6271
getReassociationForReshapeAtDim(valType.getRank(), positions));
6372
}
6473

65-
} // namespace
74+
/// Collapse all collapsible operands.
75+
SmallVector<Value> collapseOperands(PatternRewriter& rewriter,
76+
ArrayRef<Value> operands,
77+
ArrayRef<int64_t> collapseDims) {
78+
return llvm::map_to_vector(operands, [&](auto operand) {
79+
return collapseDimsAt(rewriter, operand, collapseDims);
80+
});
81+
}
82+
83+
/// Expand result tensor.
84+
Value expandResult(PatternRewriter& rewriter, Value result,
85+
RankedTensorType expandedType, SmallVector<int64_t> dims) {
86+
return tensor::ExpandShapeOp::create(
87+
rewriter, result.getLoc(), expandedType, result,
88+
getReassociationForReshapeAtDim(expandedType.getRank(), dims));
89+
}
6690

6791
// Drop unit dims on linalg.map operations that perform a single elementwise
6892
// operation. This will only drop batch dims (leading unit dimensions). This
@@ -72,24 +96,6 @@ static Value collapseDimsAt(PatternRewriter& rewriter, Value val,
7296
struct ReduceLinalgMap : OpRewritePattern<linalg::MapOp> {
7397
using OpRewritePattern<linalg::MapOp>::OpRewritePattern;
7498

75-
/// Collapse all collapsible operands.
76-
SmallVector<Value> collapseOperands(PatternRewriter& rewriter,
77-
ArrayRef<Value> operands,
78-
ArrayRef<int64_t> collapseDims) const {
79-
return llvm::map_to_vector(operands, [&](auto operand) {
80-
return collapseDimsAt(rewriter, operand, collapseDims);
81-
});
82-
}
83-
84-
/// Expand result tensor.
85-
Value expandResult(PatternRewriter& rewriter, Value result,
86-
RankedTensorType expandedType,
87-
SmallVector<int64_t> dims) const {
88-
return tensor::ExpandShapeOp::create(
89-
rewriter, result.getLoc(), expandedType, result,
90-
getReassociationForReshapeAtDim(expandedType.getRank(), dims));
91-
}
92-
9399
LogicalResult matchAndRewrite(linalg::MapOp mapOp,
94100
PatternRewriter& rewriter) const override {
95101
if (mapOp.hasUserDefinedMaps()) {
@@ -114,14 +120,8 @@ struct ReduceLinalgMap : OpRewritePattern<linalg::MapOp> {
114120

115121
// Check for unit dims in the output shape. A map op requires all inputs and
116122
// outputs have the same shape.
117-
auto outputShape = mapOp.getInit().getType().getShape();
118-
SmallVector<int64_t> operandUnitDims;
119-
for (int64_t i = 0; i < outputShape.size(); ++i) {
120-
if (outputShape[i] == 1) {
121-
operandUnitDims.push_back(i);
122-
}
123-
}
124-
123+
SmallVector<int64_t> operandUnitDims =
124+
getUnitDims(mapOp.getInit().getType());
125125
if (operandUnitDims.empty()) {
126126
LLVM_DEBUG(llvm::dbgs() << "no unit dims to drop");
127127
return failure();

lib/Transforms/DropUnitDims/DropUnitDims.h

Lines changed: 21 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,7 +1,11 @@
11
#ifndef LIB_TRANSFORMS_DROPUNITDIMS_DROPUNITDIMS_H_
22
#define LIB_TRANSFORMS_DROPUNITDIMS_DROPUNITDIMS_H_
33

4-
#include "mlir/include/mlir/Pass/Pass.h" // from @llvm-project
4+
#include "mlir/include/mlir/Dialect/Arith/Utils/Utils.h" // from @llvm-project
5+
#include "mlir/include/mlir/IR/MLIRContext.h" // from @llvm-project
6+
#include "mlir/include/mlir/IR/PatternMatch.h" // from @llvm-project
7+
#include "mlir/include/mlir/Pass/Pass.h" // from @llvm-project
8+
#include "mlir/include/mlir/Support/LLVM.h" // from @llvm-project
59

610
namespace mlir {
711
namespace heir {
@@ -12,6 +16,22 @@ namespace heir {
1216
#define GEN_PASS_REGISTRATION
1317
#include "lib/Transforms/DropUnitDims/DropUnitDims.h.inc"
1418

19+
// Returns a list of unit dims of a type
20+
SmallVector<int64_t> getUnitDims(ShapedType type);
21+
22+
/// Returns a collapsed `val` where the collapsing occurs at dims in positions.
23+
Value collapseDimsAt(PatternRewriter& rewriter, Value val,
24+
ArrayRef<int64_t> positions);
25+
26+
/// Collapse all collapsible operands.
27+
SmallVector<Value> collapseOperands(PatternRewriter& rewriter,
28+
ArrayRef<Value> operands,
29+
ArrayRef<int64_t> collapseDims);
30+
31+
/// Expand result tensor.
32+
Value expandResult(PatternRewriter& rewriter, Value result,
33+
RankedTensorType expandedType, SmallVector<int64_t> dims);
34+
1535
} // namespace heir
1636
} // namespace mlir
1737

tests/Transforms/convert_to_ciphertext_semantics/collapse_shape.mlir

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -34,7 +34,8 @@ module {
3434
%1 = tensor_ext.assign_layout %cst {layout = #new_layout2, tensor_ext.layout = #new_layout2} : tensor<512xf32>
3535
// CHECK: secret.generic
3636
// CHECK-NEXT: ^body(%[[input0:.*]]: tensor<1x1024xf32>)
37-
// CHECK: tensor_ext.rotate_and_reduce %[[input0]]
37+
// CHECK: %[[collapsed:.*]] = tensor.collapse_shape %[[input0]]
38+
// CHECK: tensor_ext.rotate_and_reduce %[[collapsed]]
3839
%7 = secret.generic(%arg4: !secret.secret<tensor<1x784xf32>> {tensor_ext.layout = #new_layout5}) {
3940
^body(%input0: tensor<1x784xf32>):
4041
%collapsed = tensor.collapse_shape %input0 [[0, 1]] {tensor_ext.layout = #new_layout6} : tensor<1x784xf32> into tensor<784xf32>
Lines changed: 35 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,35 @@
1+
// RUN: heir-opt %s --convert-to-ciphertext-semantics --split-input-file | FileCheck %s
2+
3+
#kernel = #secret.kernel<name = "MatvecDiagonal", force = false>
4+
#new_layout1 = #tensor_ext.new_layout<"{ [i0, i1] -> [ct, slot] : (i0 - i1 + ct) mod 512 = 0 and (-i1 + ct + slot) mod 1024 = 0 and 0 <= i0 <= 511 and 0 <= i1 <= 783 and 0 <= ct <= 511 and 0 <= slot <= 1023 }">
5+
#new_layout2 = #tensor_ext.new_layout<"{ [i0] -> [ct, slot] : ct = 0 and (-i0 + slot) mod 512 = 0 and 0 <= i0 <= 511 and 0 <= slot <= 1023 }">
6+
#new_layout5 = #tensor_ext.new_layout<"{ [i0, i1] -> [ct, slot] : i0 = 0 and ct = 0 and (-i1 + slot) mod 1024 = 0 and 0 <= i1 <= 783 and 0 <= slot <= 1023 }">
7+
#new_layout6 = #tensor_ext.new_layout<"{ [i0] -> [ct, slot] : ct = 0 and (-i0 + slot) mod 1024 = 0 and 0 <= i0 <= 783 and 0 <= slot <= 1023 }">
8+
module{
9+
// CHECK: func.func @main
10+
func.func @main(%arg0: tensor<512x784xf32>, %arg1: tensor<512xf32>, %arg4: !secret.secret<tensor<1x784xf32>> {tensor_ext.layout = #new_layout5}) -> (!secret.secret<tensor<512xf32>> {jax.result_info = "result[0]", tensor_ext.layout = #new_layout2}) {
11+
%cst = arith.constant dense<0.000000e+00> : tensor<512xf32>
12+
%0 = tensor_ext.assign_layout %arg0 {layout = #new_layout1, tensor_ext.layout = #new_layout1} : tensor<512x784xf32>
13+
%1 = tensor_ext.assign_layout %cst {layout = #new_layout2, tensor_ext.layout = #new_layout2} : tensor<512xf32>
14+
%2 = tensor_ext.assign_layout %arg1 {layout = #new_layout2, tensor_ext.layout = #new_layout2} : tensor<512xf32>
15+
// CHECK: secret.generic(%[[arg2:.*]]: !secret.secret<tensor<1x1024xf32>>)
16+
// CHECK: ^body(%[[input0:.*]]: tensor<1x1024xf32>)
17+
// CHECK: %[[collapsed:.*]] = tensor.collapse_shape %[[input0]]
18+
// CHECK-SAME: tensor<1x1024xf32> into tensor<1024xf32>
19+
// CHECK: %[[v4:.*]] = tensor_ext.rotate_and_reduce %[[collapsed]]
20+
// CHECK: %[[collapsed_2:.*]] = tensor.collapse_shape
21+
// CHECK: %[[v5:.*]] = arith.addf %[[v4]], %[[collapsed_2]] : tensor<1024xf32>
22+
// CHECK: %[[v6:.*]] = tensor_ext.rotate %[[v5]], %[[c512:.*]] : tensor<1024xf32>
23+
// CHECK: %[[expanded:.*]] = tensor.expand_shape
24+
// CHECK-SAME: tensor<1024xf32> into tensor<1x1024xf32>
25+
// CHECK: secret.yield %[[expanded]]
26+
%7 = secret.generic(%arg4: !secret.secret<tensor<1x784xf32>> {tensor_ext.layout = #new_layout5}) {
27+
^body(%input0: tensor<1x784xf32>):
28+
%collapsed = tensor.collapse_shape %input0 [[0, 1]] {tensor_ext.layout = #new_layout6} : tensor<1x784xf32> into tensor<784xf32>
29+
%8 = linalg.matvec {secret.kernel = #kernel, tensor_ext.layout = #new_layout2} ins(%0, %collapsed : tensor<512x784xf32>, tensor<784xf32>) outs(%1 : tensor<512xf32>) -> tensor<512xf32>
30+
%9 = arith.addf %2, %8 {tensor_ext.layout = #new_layout2} : tensor<512xf32>
31+
secret.yield %9 : tensor<512xf32>
32+
} -> (!secret.secret<tensor<512xf32>> {tensor_ext.layout = #new_layout2})
33+
return %7 : !secret.secret<tensor<512xf32>>
34+
}
35+
}

0 commit comments

Comments (0)