Support ingesting Opset 15 Shape Op #1684

Merged on Sep 17, 2022 (12 commits)
@@ -88,6 +88,17 @@ def replaceONNXBatchNormalizationInferenceModePattern : Pattern<
//
//===----------------------------------------------------------------------===//

// Create an integer attribute holding the default start axis (0).
def GetStart: NativeCodeCall<
//"IntegerType::get($_builder, 64, IntegerType::Signed)"
"$_builder.getIntegerAttr($_builder.getIntegerType(64, true), 0)"
>;

Collaborator:

Should remove the commented-out code. Have you thought about adding a custom builder for the operation that does not take the start/end and would generate them automatically, instead of modifying each of the patterns involved with the new Shape op?

Member Author:

I did consider adding a custom builder. In all honesty, I tried and ran into some issues getting it to work.

But you make good points. I have added a NativeCodeCall to create ONNX Shape ops more succinctly:

// Create an ONNX Shape op with type.
def CreateShapeOp: NativeCodeCall<
 "$_builder.create<mlir::ONNXShapeOp>($_loc, $0, $1, IntegerAttr(), 0)"
>;

I now call this to avoid having to spell out the start and end attributes everywhere.

Collaborator:

Awesome, glad you found a way to simplify the code.
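As an aside, the custom builder the reviewer suggests could look roughly like the following. This is a hypothetical sketch following standard MLIR ODS builder conventions, not code from this PR; it mirrors the defaults used by the CreateShapeOp NativeCodeCall above.

// Hypothetical convenience builder for ONNXShapeOp (the reviewer's
// suggestion): callers pass only the result type and input, and the
// builder supplies the default start/end attributes. Sketch only.
void ONNXShapeOp::build(mlir::OpBuilder &builder, mlir::OperationState &state,
    mlir::Type resultType, mlir::Value data) {
  // end is omitted (null attribute); start defaults to axis 0.
  build(builder, state, resultType, data, /*end=*/mlir::IntegerAttr(),
      /*start=*/builder.getIntegerAttr(builder.getIntegerType(64, true), 0));
}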

def GetEnd: NativeCodeCall<
//"IntegerAttr::get(IntegerType(64, true, APInt(64, $0.getType().cast<ShapedType>().getRank(), true)))"
"$_builder.getIntegerAttr($_builder.getIntegerType(64, true), $0.getType().cast<ShapedType>().getRank())"
>;

// Get a type for a tensor that stores the shape of another tensor.
def GetShapeTypeOf: NativeCodeCall<
"RankedTensorType::get({$0.getType().cast<ShapedType>().getRank()}, $_builder.getIntegerType(64))"
@@ -112,7 +123,10 @@ def expandConstantOperandForAddOp1: Pat<
def expandConstantOperandForAddOp2: Pat<
(ONNXAddOp $x, (ONNXConstantOp:$c $_, $_, $_, $_, $_, $_, $_, $_)),
(ONNXAddOp $x, (ONNXExpandOp $c,
(ONNXShapeOp $x, (returnType (GetShapeTypeOf $x))),
(ONNXShapeOp $x,
(GetEnd $x),
(GetStart),
(returnType (GetShapeTypeOf $x))),
(returnType $x))),
[(IsUniBroadcastingFromFirstToSecond $c, $x)]
>;
@@ -124,15 +138,21 @@ def expandConstantOperandForAddOp2: Pat<
def expandConstantOperandForDivOp1: Pat<
(ONNXDivOp $x, (ONNXConstantOp:$c $_, $_, $_, $_, $_, $_, $_, $_)),
(ONNXDivOp $x, (ONNXExpandOp $c,
(ONNXShapeOp $x, (returnType (GetShapeTypeOf $x))),
(ONNXShapeOp $x,
(GetEnd $x),
(GetStart),
(returnType (GetShapeTypeOf $x))),
(returnType $x))),
[(IsUniBroadcastingFromFirstToSecond $c, $x)]
>;

def expandConstantOperandForDivOp2: Pat<
(ONNXDivOp (ONNXConstantOp:$c $_, $_, $_, $_, $_, $_, $_, $_), $x),
(ONNXDivOp (ONNXExpandOp $c,
(ONNXShapeOp $x, (returnType (GetShapeTypeOf $x))),
(ONNXShapeOp $x,
(GetEnd $x),
(GetStart),
(returnType (GetShapeTypeOf $x))),
(returnType $x)),
$x),
[(IsUniBroadcastingFromFirstToSecond $c, $x)]
@@ -151,7 +171,10 @@ def expandConstantOperandForMulOp1: Pat<
def expandConstantOperandForMulOp2: Pat<
(ONNXMulOp $x, (ONNXConstantOp:$c $_, $_, $_, $_, $_, $_, $_, $_)),
(ONNXMulOp $x, (ONNXExpandOp $c,
(ONNXShapeOp $x, (returnType (GetShapeTypeOf $x))),
(ONNXShapeOp $x,
(GetEnd $x),
(GetStart),
(returnType (GetShapeTypeOf $x))),
(returnType $x))),
[(IsUniBroadcastingFromFirstToSecond $c, $x)]
>;
@@ -163,15 +186,21 @@ def expandConstantOperandForMulOp2: Pat<
def expandConstantOperandForSubOp1: Pat<
(ONNXSubOp $x, (ONNXConstantOp:$c $_, $_, $_, $_, $_, $_, $_, $_)),
(ONNXSubOp $x, (ONNXExpandOp $c,
(ONNXShapeOp $x, (returnType (GetShapeTypeOf $x))),
(ONNXShapeOp $x,
(GetEnd $x),
(GetStart),
(returnType (GetShapeTypeOf $x))),
(returnType $x))),
[(IsUniBroadcastingFromFirstToSecond $c, $x)]
>;

def expandConstantOperandForSubOp2: Pat<
(ONNXSubOp (ONNXConstantOp:$c $_, $_, $_, $_, $_, $_, $_, $_), $x),
(ONNXSubOp (ONNXExpandOp $c,
(ONNXShapeOp $x, (returnType (GetShapeTypeOf $x))),
(ONNXShapeOp $x,
(GetEnd $x),
(GetStart),
(returnType (GetShapeTypeOf $x))),
(returnType $x)),
$x),
[(IsUniBroadcastingFromFirstToSecond $c, $x)]
4 changes: 2 additions & 2 deletions src/Builder/OpBuildTable.inc
@@ -159,7 +159,7 @@ op_dialect_version_map_["SequenceEmpty"] = {11};
op_dialect_version_map_["SequenceErase"] = {11};
op_dialect_version_map_["SequenceInsert"] = {11};
op_dialect_version_map_["SequenceLength"] = {11};
op_dialect_version_map_["Shape"] = {13};
op_dialect_version_map_["Shape"] = {15};
op_dialect_version_map_["Shrink"] = {9};
op_dialect_version_map_["Sigmoid"] = {13};
op_dialect_version_map_["Sign"] = {13};
@@ -739,7 +739,7 @@ op_dialect_top_version_map_["SequenceEmpty"] = 11;
op_dialect_top_version_map_["SequenceErase"] = 11;
op_dialect_top_version_map_["SequenceInsert"] = 11;
op_dialect_top_version_map_["SequenceLength"] = 11;
op_dialect_top_version_map_["Shape"] = 13;
op_dialect_top_version_map_["Shape"] = 15;
op_dialect_top_version_map_["Shrink"] = 9;
op_dialect_top_version_map_["Sigmoid"] = 13;
op_dialect_top_version_map_["Sign"] = 13;
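For context, these tables map each ONNX op name to the opset version(s) the frontend can ingest, so bumping "Shape" from 13 to 15 is what enables importing Opset 15 models. Below is a rough standalone sketch of the lookup the tables imply; the helper name and the shape of the API are assumptions for illustration, not onnx-mlir's actual code.

#include <map>
#include <string>
#include <vector>

// Version table as in the diff above: op name -> supported opset versions.
std::map<std::string, std::vector<int>> op_dialect_version_map_;

// Hypothetical helper: does the importer accept this op at this opset?
bool supportsOpset(const std::string &opName, int opsetVersion) {
  auto it = op_dialect_version_map_.find(opName);
  if (it == op_dialect_version_map_.end())
    return false;
  for (int version : it->second)
    if (version == opsetVersion)
      return true;
  return false;
}

int main() {
  op_dialect_version_map_["Shape"] = {15}; // was {13} before this PR
  return supportsOpset("Shape", 15) ? 0 : 1;
}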
2 changes: 1 addition & 1 deletion src/Conversion/ONNXToKrnl/Tensor/Shape.cpp
@@ -28,7 +28,7 @@ struct ONNXShapeOpLowering : public ConversionPattern {
LogicalResult matchAndRewrite(Operation *op, ArrayRef<Value> operands,
ConversionPatternRewriter &rewriter) const final {
// Get shape.
ONNXShapeOpAdaptor operandAdaptor(operands);
ONNXShapeOpAdaptor operandAdaptor(operands, op->getAttrDictionary());
ONNXShapeOp shapeOp = cast<ONNXShapeOp>(op);
Location loc = op->getLoc();
ONNXShapeOpShapeHelper shapeHelper(&shapeOp, &rewriter,
32 changes: 31 additions & 1 deletion src/Dialect/ONNX/ONNXOps.td.inc
@@ -5565,8 +5565,38 @@ def ONNXShapeOp:ONNX_Op<"Shape",
let summary = "ONNX Shape operation";
let description = [{
"Takes a tensor as input and outputs an 1D int64 tensor containing the shape of the input tensor."
"Optional attributes start and end can be used to compute a slice of the input tensor's shape."
"If start axis is omitted, the slice starts from axis 0."
"The end axis, if specified, is exclusive (and the returned value will not include the size of that axis)."
"If the end axis is omitted, the axes upto the last one will be included."
"Negative axes indicate counting back from the last axis."
"Note that axes will be clipped to the range [0, r-1], where r is the"
"rank of the input tensor if they are out-of-range (after adding r in the case of"
"negative axis). Thus, specifying any end value > r is equivalent to specifying an end"
"value of r, and specifying any start value < -r is equivalent to specifying a start"
"value of 0."
""
"For example:"
"Input tensor with shape: [2, 3, 4] "
"No attributes specified."
"Output: [2, 3, 4] "
""
"Input tensor with shape: [2, 3, 4] "
"start: -1"
"Output: [4] "
""
"Input tensor with shape: [2, 3, 4] "
"end: -1"
"Output: [2, 3]"
""
"Input tensor with shape: [2, 3, 4] "
"start: 1"
"end: 2"
"Output: [3] "
}];
let arguments = (ins AnyTypeOf<[TensorOf<[UI8]>, TensorOf<[UI16]>, TensorOf<[UI32]>, TensorOf<[UI64]>, TensorOf<[I8]>, TensorOf<[I16]>, TensorOf<[I32]>, TensorOf<[I64]>, TensorOf<[BF16]>, TensorOf<[F16]>, TensorOf<[F32]>, TensorOf<[F64]>, TensorOf<[StringType]>, TensorOf<[I1]>, TensorOf<[Complex<F32>]>, TensorOf<[Complex<F64>]>]>:$data);
let arguments = (ins AnyTypeOf<[TensorOf<[UI8]>, TensorOf<[UI16]>, TensorOf<[UI32]>, TensorOf<[UI64]>, TensorOf<[I8]>, TensorOf<[I16]>, TensorOf<[I32]>, TensorOf<[I64]>, TensorOf<[BF16]>, TensorOf<[F16]>, TensorOf<[F32]>, TensorOf<[F64]>, TensorOf<[StringType]>, TensorOf<[I1]>, TensorOf<[Complex<F32>]>, TensorOf<[Complex<F64>]>]>:$data,
OptionalAttr<SI64Attr>:$end,
DefaultValuedAttr<SI64Attr, "0">:$start);
let results = (outs TensorOf<[I64]>:$shape);
let extraClassDeclaration = [{
static int getNumberOfOperands() {
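To make the start/end semantics above concrete, here is a small standalone C++ sketch (illustrative only, not part of the PR) that implements the slice-with-clipping rules and reproduces the examples from the description:

#include <cstdint>
#include <iostream>
#include <vector>

// Clip a start/end axis to [0, rank] after resolving negative values,
// following the Opset 15 Shape spec quoted above.
int64_t normalizeAxis(int64_t value, int64_t rank) {
  if (value < 0)
    value += rank;
  if (value < 0)
    value = 0;
  if (value > rank)
    value = rank;
  return value;
}

// Slice the shape vector; assumes normalized start <= end, as the
// shape helper in this PR asserts.
std::vector<int64_t> shapeSlice(const std::vector<int64_t> &shape,
    int64_t start, int64_t end) {
  int64_t rank = static_cast<int64_t>(shape.size());
  start = normalizeAxis(start, rank);
  end = normalizeAxis(end, rank);
  return std::vector<int64_t>(shape.begin() + start, shape.begin() + end);
}

int main() {
  std::vector<int64_t> shape = {2, 3, 4};
  // No attributes: start = 0, end = rank.
  for (int64_t d : shapeSlice(shape, 0, 3)) std::cout << d << " "; // 2 3 4
  std::cout << "\n";
  for (int64_t d : shapeSlice(shape, -1, 3)) std::cout << d << " "; // 4
  std::cout << "\n";
  for (int64_t d : shapeSlice(shape, 0, -1)) std::cout << d << " "; // 2 3
  std::cout << "\n";
  for (int64_t d : shapeSlice(shape, 1, 2)) std::cout << d << " "; // 3
  std::cout << "\n";
  return 0;
}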
30 changes: 26 additions & 4 deletions src/Dialect/ONNX/ONNXOpsHelper.cpp
@@ -495,12 +495,34 @@ Value normalizeConstantOp(
}

// Create a DenseElementsAttr based on the shape of type.
DenseElementsAttr createDenseElementsAttrFromShape(
PatternRewriter &rewriter, Value value) {
DenseElementsAttr createDenseElementsAttrFromShape(PatternRewriter &rewriter,
Value value, Attribute startAttr, Attribute endAttr) {
// The start/end attributes are optional; default to the full shape below.

auto inType = value.getType().cast<ShapedType>();
auto shape = inType.getShape();
SmallVector<int64_t, 1> dims = {inType.getRank()};
SmallVector<int64_t, 4> values(shape.begin(), shape.end());
int64_t rank = inType.getRank();

int64_t start = 0;
int64_t end = rank;

if (startAttr) {
start = startAttr.cast<IntegerAttr>().getSInt();
}
if (endAttr) {
end = endAttr.cast<IntegerAttr>().getSInt();
}

// Normalize if start/end are not in (0, ..., rank)
if (start < 0) {
start = start + rank;
}
if (end < 0) {
end = end + rank;
}

SmallVector<int64_t, 1> dims = {end - start};
SmallVector<int64_t, 4> values(shape.begin() + start, shape.begin() + end);
auto tensorType = RankedTensorType::get(dims, rewriter.getIntegerType(64));
return DenseElementsAttr::get(tensorType, makeArrayRef(values));
}

Collaborator:

Would it make sense to add asserts to make sure that start and end are now inclusively in 0..rank-1 for start and 0..rank for end?

Member Author:

Good catch! This was actually wrong, because the behaviour is meant to be the following:

"Optional attributes start and end can be used to compute a slice of the input tensor's shape."
"If start axis is omitted, the slice starts from axis 0."
"The end axis, if specified, is exclusive (and the returned value will not include the size of that axis)."
"If the end axis is omitted, the axes up to the last one will be included."
"Negative axes indicate counting back from the last axis."
"Note that axes will be clipped to the range [0, r-1], where r is the"
"rank of the input tensor if they are out-of-range (after adding r in the case of"
"negative axis). Thus, specifying any end value > r is equivalent to specifying an end"
"value of r, and specifying any start value < -r is equivalent to specifying a start"
"value of 0."

I've rejigged the logic to use getDataShapeBounds, which handles the clipping. This puts the normalizing behaviour in one place, where it is handled correctly.
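To see the bug the reviewer caught, note what normalization without clipping does to out-of-range values. A standalone illustration, not PR code:

#include <cstdint>
#include <iostream>

// Mirrors the pre-review normalization: adds rank to negative values but
// never clips, so out-of-range inputs stay out of range.
int64_t normalizeNoClip(int64_t value, int64_t rank) {
  return value < 0 ? value + rank : value;
}

int main() {
  int64_t rank = 3; // e.g. a tensor of shape [2, 3, 4]
  // Per the spec, start = -5 should clip to 0 and end = 7 should clip to 3.
  std::cout << normalizeNoClip(-5, rank) << "\n"; // prints -2: invalid index
  std::cout << normalizeNoClip(7, rank) << "\n";  // prints 7: past the rank
  return 0;
}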
3 changes: 2 additions & 1 deletion src/Dialect/ONNX/ONNXOpsHelper.hpp
@@ -174,7 +174,8 @@ mlir::Value normalizeConstantOp(

// Create a DenseElementsAttr based on the shape of type.
mlir::DenseElementsAttr createDenseElementsAttrFromShape(
mlir::PatternRewriter &rewriter, mlir::Value value);
mlir::PatternRewriter &rewriter, mlir::Value value,
mlir::Attribute startAttr, mlir::Attribute endAttr);

// Create a DenseElementsAttr based on the size of type.
mlir::DenseElementsAttr createDenseElementsAttrFromSize(
10 changes: 6 additions & 4 deletions src/Dialect/ONNX/Rewrite.td
@@ -36,7 +36,7 @@ def createDenseElementsAttrFromFloatAttr : NativeCodeCall<

// Create a DenseElementsAttr from the shape of the type of a value.
def createDenseElementsAttrFromShape : NativeCodeCall<
"onnx_mlir::createDenseElementsAttrFromShape($_builder, $0)">;
"onnx_mlir::createDenseElementsAttrFromShape($_builder, $0, $1, $2)">;

// Create a DenseElementsAttr from the size of the type of a value.
def createDenseElementsAttrFromSize : NativeCodeCall<
@@ -531,7 +531,9 @@ def SwapReshapeMatMulPattern: Pattern<
// TODO: Support dynamic dimensions.
(ONNXMatMulOp:$res2 (ONNXReshapeOp:$res1 $A, $_, $az), $B),
[(ONNXReshapeOp (ONNXMatMulOp $A, $B, (returnType (GetReturnTypeForMatMulOpND2D $A, $B))),
(ONNXConstantOpFromDenseAttr (createDenseElementsAttrFromShape $res2)), $az)],
(ONNXConstantOpFromDenseAttr
(createDenseElementsAttrFromShape $res2, (GetNullAttr), (GetNullAttr))
), $az)],
[(HasRankGT<2> $A), (HasRankOf<2> $res1), (HasRankOf<2> $B), // A is reshaped to 2D.
(HaveSameLastDim $A, $res1), // The last dim of A is unchanged by reshape.
(IsStaticShapeTensor:$res2) // $res2 has static dims in order to create ReshapeOp.
Expand Down Expand Up @@ -719,9 +721,9 @@ def RewriteBatchNormInferenceModeConvPattern2: Pat<

// TODO: this rule may need to be updated once ShapeOp has start/end.
def ShapeToConstantPattern: Pat<
(ONNXShapeOp $A),
(ONNXShapeOp $A, $end, $start),
(ONNXConstantOp
(GetNullAttr), (createDenseElementsAttrFromShape $A),
(GetNullAttr), (createDenseElementsAttrFromShape $A, $start, $end),
(GetNullFloatAttr), (GetNullArrayAttr), (GetNullIntegerAttr),
(GetNullArrayAttr), (GetNullStringAttr), (GetNullArrayAttr)
),
69 changes: 47 additions & 22 deletions src/Dialect/ONNX/ShapeInference/Shape.cpp
@@ -9,60 +9,85 @@
//===----------------------------------------------------------------------===//

#include "src/Dialect/ONNX/ShapeInference/ONNXShapeHelper.hpp"
#include <tuple>
#include <utility>

using namespace mlir;

namespace onnx_mlir {

namespace {

// If start axis is omitted, the slice starts from axis 0.
// The end axis, if specified, is exclusive (and the returned value will not
// include the size of that axis). If the end axis is omitted, the axes upto the
// last one will be included. Negative axes indicate counting back from the last
// axis. Note that axes will be clipped to the range [0, r-1], where r is the
// rank of the input tensor if they are out-of-range (after adding r in the case
// of negative axis). Thus, specifying any end value > r is equivalent to
// specifying an end value of r, and specifying any start value < -r is
// equivalent to specifying a start value of 0.
int64_t normalize(int64_t value, int64_t rank) {
if (value < 0)
value += rank;

if (value < 0)
value = 0;

if (value > rank)
value = rank;

return value;
}

// Compute a slice of the input tensor's shape. The slice starts from axis 0.
// The axes upto the last one will be included. Negative axes indicate counting
// The axes up to the last one will be included. Negative axes indicate counting
// back from the last axis.
static std::pair<int64_t, int64_t> getDataShapeBounds(
std::pair<int64_t, int64_t> getDataShapeBounds(
ONNXShapeOpAdaptor &operandAdaptor) {
Value data = operandAdaptor.data();
MemRefBoundsIndexCapture dataBounds(data);
int64_t dataRank = dataBounds.getRank();
int64_t rank = dataBounds.getRank();

// Compute the normalized start/end. Negative value means counting
// dimensions from the back.
int64_t normalizedStart = 0;
int64_t normalizedEnd = dataRank;

if (normalizedStart < 0)
normalizedStart += dataRank;
if (normalizedEnd < 0)
normalizedEnd += dataRank;
int64_t start = operandAdaptor.start();
int64_t end = rank;
if (operandAdaptor.end().has_value()) {
end = operandAdaptor.end().value();
}

return std::make_pair(normalizedStart, normalizedEnd);
return std::make_pair(normalize(start, rank), normalize(end, rank));
}

} // namespace

LogicalResult ONNXShapeOpShapeHelper::computeShape(
ONNXShapeOpAdaptor operandAdaptor) {
Value data = operandAdaptor.data();
MemRefBoundsIndexCapture dataBounds(data);
int64_t dataRank = dataBounds.getRank();
std::pair<int64_t, int64_t> bounds = getDataShapeBounds(operandAdaptor);

if (bounds.first < 0 || bounds.first > dataRank)
return op->emitError("start value is out of bound");
if (bounds.second < 0 || bounds.second > dataRank)
return op->emitError("end value is out of bound");
int64_t start;
int64_t end;
std::tie(start, end) = getDataShapeBounds(operandAdaptor);

// Output is the actual number of values (1D)
dimsForOutput().emplace_back(LiteralIndexExpr(bounds.second - bounds.first));
dimsForOutput().emplace_back(LiteralIndexExpr(end - start));

return success();
}

// Compute the data selected by the Shape operator.
DimsExpr computeSelectedData(ONNXShapeOpAdaptor &operandAdaptor) {
MemRefBoundsIndexCapture dataBounds(operandAdaptor.data());
std::pair<int64_t, int64_t> bounds = getDataShapeBounds(operandAdaptor);
assert(bounds.first >= 0 && bounds.first <= bounds.second &&
bounds.second <= (int64_t)dataBounds.getRank() && "Unexpected bounds");
int64_t start;
int64_t end;
std::tie(start, end) = getDataShapeBounds(operandAdaptor);
assert(start >= 0 && start <= end && end <= (int64_t)dataBounds.getRank() &&
"Unexpected bounds");

DimsExpr selectedData;
for (int64_t i = bounds.first; i < bounds.second; ++i)
for (int64_t i = start; i < end; ++i)
selectedData.emplace_back(dataBounds.getDim(i));

return selectedData;