Make sure that RankedTensorType casting is valid.

abattery · tensorflower-gardener · commit 670cf675ea98 · 2020-11-27T03:21:46.000-08:00
PiperOrigin-RevId: 344509898
Change-Id: I7053148588a93e60099605f7a90419a1f14a0667
diff --git a/tensorflow/compiler/mlir/lite/tests/prepare-composite-functions-tf.mlir b/tensorflow/compiler/mlir/lite/tests/prepare-composite-functions-tf.mlir
@@ -153,6 +153,30 @@ func @layernormalizedlstmcellsimple(%arg0: tensor<1x?xf32>, %arg1: tensor<3x4xf3
 
 // -----
 
+module{
+
+// expected-warning @+1 {{we cannot fuse this lstm func because all the inputs have not ranked tensor type.}}
+func @lstmcellsimple(%arg0: tensor<*xf32>, %arg1: tensor<*xf32>, %arg2: tensor<*xf32>, %arg3: tensor<*xf32>, %arg4: tensor<*xf32>) -> tensor<*xf32> attributes  {tf._implements = "LSTMCellSimple", tf._reference = "mlir"} {
+    %0 = "tf.BatchMatMulV2"(%arg3, %arg1) {adj_x = false, adj_y = false} : (tensor<*xf32>, tensor<*xf32>) -> tensor<*xf32>
+    %1 = constant dense<[[2.3, 3.4, 4.5, 5.5]]> : tensor<1x4xf32>
+    %2 = "tf.Add"(%0, %1) : (tensor<*xf32>, tensor<1x4xf32>) -> tensor<*xf32>
+    %3 = tensor_cast %2 : tensor<*xf32> to tensor<*xf32>
+    return %3 : tensor<*xf32>
+}
+
+// expected-warning @+1 {{we cannot fuse this lstm func because all the inputs have not ranked tensor type.}}
+func @layernormalizedlstmcellsimple(%arg0: tensor<*xf32>, %arg1: tensor<*xf32>, %arg2: tensor<*xf32>, %arg3: tensor<*xf32>, %arg4: tensor<*xf32>) -> tensor<*xf32> attributes  {tf._implements = "LayerNormalizedLstmCellSimple", tf._reference = "mlir"} {
+    %0 = "tf.BatchMatMulV2"(%arg3, %arg1) {adj_x = false, adj_y = false} : (tensor<*xf32>, tensor<*xf32>) -> tensor<*xf32>
+    %1 = constant dense<[[2.3, 3.4, 4.5, 5.5]]> : tensor<1x4xf32>
+    %2 = "tf.Add"(%0, %1) : (tensor<*xf32>, tensor<1x4xf32>) -> tensor<*xf32>
+    %3 = tensor_cast %2 : tensor<*xf32> to tensor<*xf32>
+    return %3 : tensor<*xf32>
+}
+
+}
+
+// -----
+
 module {
 func @inference_standard_lstm_time_major(%arg0: tensor<?x8x8xf32>, %arg1: tensor<8x10xf32>, %arg2: tensor<8x10xf32>, %arg3: tensor<8x40xf32>, %arg4: tensor<10x40xf32>, %arg5: tensor<40xf32>) -> (tensor<8x10xf32>, tensor<?x8x10xf32>, tensor<8x10xf32>, tensor<8x10xf32>, tensor<f32>) attributes {tf._input_shapes = ["tfshape$dim { size: -1 } dim { size: 8 } dim { size: 8 }", "tfshape$dim { size: 8 } dim { size: 10 }", "tfshape$dim { size: 8 } dim { size: 10 }", "tfshape$unknown_rank: true", "tfshape$unknown_rank: false", "tfshape$unknown_rank: false"], tf.api_implements = "lstm_b4e9f0e7-ac55-42bc-8ef2-8496419a608c", tf.api_preferred_device = "CPU", tf.go_backwards = false, tf.time_major = true} {
   %0 = "tf.BatchMatMulV2"(%arg0, %arg3) {adj_x = false, adj_y = false} : (tensor<?x8x8xf32>, tensor<8x40xf32>) -> tensor<?x8x40xf32>
diff --git a/tensorflow/compiler/mlir/lite/tests/prepare-tf.mlir b/tensorflow/compiler/mlir/lite/tests/prepare-tf.mlir
@@ -485,6 +485,18 @@ func @StridedSliceEllipsisMaskAfter(%arg0: tensor<21x15x7xf32>) -> tensor<5x15x7
   // CHECK: %[[STRIDED_SLICE:.*]] = "tf.StridedSlice"(%arg0, %[[CST]], %[[CST]], %[[CST_0]]) {begin_mask = 6 : i64, ellipsis_mask = 0 : i64, end_mask = 6 : i64, new_axis_mask = 0 : i64, shrink_axis_mask = 0 : i64} : (tensor<21x15x7xf32>, tensor<3xi32>, tensor<3xi32>, tensor<3xi32>) -> tensor<5x15x7xf32>
 }
 
+// CHECK-LABEL: @NoStridedSliceEllipsisMask
+func @NoStridedSliceEllipsisMask(%arg0: tensor<*xf32>) -> tensor<21x15x2xf32> {
+  %cst = constant dense<0> : tensor<2xi32>
+  %cst_0 = constant dense<1> : tensor<2xi32>
+  %0 = "tf.StridedSlice"(%arg0, %cst, %cst, %cst_0) {begin_mask = 0 : i64, ellipsis_mask = 1 : i64, end_mask = 0 : i64, new_axis_mask = 0 : i64, shrink_axis_mask = 0 : i64} : (tensor<*xf32>, tensor<2xi32>, tensor<2xi32>, tensor<2xi32>) -> tensor<21x15x2xf32>
+  return %0 : tensor<21x15x2xf32>
+
+  // CHECK: %[[CST:.*]] = constant dense<0> : tensor<2xi32>
+  // CHECK: %[[CST_0:.*]] = constant dense<1> : tensor<2xi32>
+  // CHECK: %[[STRIDED_SLICE:.*]] = "tf.StridedSlice"(%arg0, %[[CST]], %[[CST]], %[[CST_0]]) {begin_mask = 0 : i64, ellipsis_mask = 1 : i64, end_mask = 0 : i64, new_axis_mask = 0 : i64, shrink_axis_mask = 0 : i64} : (tensor<*xf32>, tensor<2xi32>, tensor<2xi32>, tensor<2xi32>) -> tensor<21x15x2xf32>
+}
+
 // CHECK-LABEL: @NoPadStridedSliceNonNewAxisMask
 func @NoPadStridedSliceNonNewAxisMask(%arg0: tensor<1x2x3x1xf32>) -> tensor<1x2x3x1xf32> {
   %cst = constant dense<0> : tensor<4xi32>
diff --git a/tensorflow/compiler/mlir/lite/transforms/prepare_composite_functions_tf.cc b/tensorflow/compiler/mlir/lite/transforms/prepare_composite_functions_tf.cc
@@ -125,6 +125,117 @@ class PrepareCompositeFunctionsPass
   void runOnOperation() override;
 };
 
+LogicalResult CheckFusableLayerNormalizedLstmCellSimple(FuncOp lstm_func) {
+  for (int i = 0; i < 5; ++i) {  // Fusable only if args 0-4 are all ranked.
+    auto input = lstm_func.getArgument(i);  // NOTE(review): assumes >= 5 args.
+    auto input_type = input.getType().dyn_cast_or_null<RankedTensorType>();
+    if (!input_type) {  // Null cast result: the type is not a RankedTensorType.
+      lstm_func.emitWarning(
+          "we cannot fuse this lstm func because all the inputs have not "
+          "ranked tensor type.");
+      return failure();
+    }
+  }
+
+  return success();
+}
+
+LogicalResult CheckFusableLstmCellSimple(FuncOp lstm_func) {
+  for (int i = 0; i < 4; ++i) {  // Fusable only if args 0-3 are all ranked.
+    auto input = lstm_func.getArgument(i);  // NOTE(review): assumes >= 4 args.
+    auto input_type = input.getType().dyn_cast_or_null<RankedTensorType>();
+    if (!input_type) {  // Null cast result: the type is not a RankedTensorType.
+      lstm_func.emitWarning(
+          "we cannot fuse this lstm func because all the inputs have not "
+          "ranked tensor type.");
+      return failure();
+    }
+  }
+
+  return success();
+}
+
+LogicalResult CheckOutputConsumer(
+    Operation* call_op, int expected_num_outputs,
+    llvm::DenseSet<int> expected_consumer_indices) {
+  const int num_results = call_op->getNumResults();  // Must match exactly.
+  if (num_results != expected_num_outputs) return failure();
+
+  for (int i = 0; i < expected_num_outputs; ++i) {  // Scan every result.
+    auto it = expected_consumer_indices.find(i);
+    if (it == expected_consumer_indices.end()) {
+      // Result i is not an expected consumer index, so it must have no uses.
+      if (!call_op->getResult(i).use_empty()) return failure();
+    }
+  }
+  return success();
+}
+
+LogicalResult CheckFusableKerasLstm(FuncOp lstm_func, ModuleOp module) {
+  for (auto func : module.getOps<FuncOp>()) {  // Check calls to lstm_func.
+    if (func == lstm_func) continue;
+    auto result = func.walk([&](CallOpInterface op) {
+      if (dyn_cast_or_null<FuncOp>(op.resolveCallable()) == lstm_func) {
+        // resolveCallable() may yield null, hence dyn_cast_or_null above.
+        // A Keras LSTM call has 5 outputs; only outputs 0 and 1 may have
+        // consumers, otherwise the call cannot be fused.
+        if (failed(CheckOutputConsumer(op.getOperation(), 5, {0, 1})))
+          return WalkResult::interrupt();
+      }
+      return WalkResult::advance();
+    });
+
+    if (result.wasInterrupted()) return failure();
+  }
+
+  // The batch size must be known in advance for the LSTM fusion. It is treated
+  // as known when the two initial-state inputs (indices 1 & 2) have static
+  // shapes. All six inputs must be ranked tensors, and the weight, recurrent
+  // kernel, and bias (indices 3-5) must have static shapes as well.
+  for (int i = 0; i < 6; ++i) {
+    auto input = lstm_func.getArgument(i);  // NOTE(review): assumes >= 6 args.
+    auto input_type = input.getType().dyn_cast_or_null<RankedTensorType>();
+    if (!input_type) {
+      lstm_func.emitWarning(
+          "we cannot fuse this lstm func because all the inputs have not "
+          "ranked tensor type.");
+      return failure();
+    }
+    switch (i) {
+      case 1:  // output_init_state
+      case 2:  // hidden_init_state
+        if (!input_type.hasStaticShape()) {
+          lstm_func.emitWarning(
+              "we cannot fuse this lstm func because the batch size is not "
+              "fixed, please consider setting fixed batch size like "
+              "https://github.com/tensorflow/tensorflow/blob/master/tensorflow/"
+              "lite/examples/experimental_new_converter/"
+              "Keras_LSTM_fusion_Codelab.ipynb");
+          return failure();
+        }
+        break;
+      case 3:  // weight
+      case 4:  // recurrent_kernel
+      case 5:  // bias
+        if (!input_type.hasStaticShape()) {
+          lstm_func.emitWarning(
+              "we cannot fuse this lstm func because the weight & bias are not "
+              "fixed, please consider setting fixed batch size like "
+              "https://github.com/tensorflow/tensorflow/blob/master/tensorflow/"
+              "lite/examples/experimental_new_converter/"
+              "Keras_LSTM_fusion_Codelab.ipynb");
+          return failure();
+        }
+        break;
+      default:
+        // Input 0 only needs to be a ranked tensor; nothing more to check.
+        break;
+    }
+  }
+
+  return success();
+}
+
 void PrepareCompositeFunctionsPass::ConvertTFImplements(FuncOp func,
                                                         StringAttr attr) {
   if (attr.getValue() == "embedding_matmul") {
@@ -138,13 +249,19 @@ void PrepareCompositeFunctionsPass::ConvertTFImplements(FuncOp func,
     }
     convert_embedded_lookup.RewriteFunc();
   } else if (attr.getValue() == mlir::TFL::kLstmCellSimple) {
+    // Check if the lstm cell simple can be fused, if not, we just don't do
+    // anything.
+    if (failed(CheckFusableLstmCellSimple(func))) return;
     func.eraseBody();
     func.addEntryBlock();
     ConvertLSTMCellSimpleToFusedLSTM convert_lstm_cell_simple(func);
     if (failed(convert_lstm_cell_simple.RewriteFunc())) {
       return signalPassFailure();
     }
   } else if (attr.getValue() == mlir::TFL::kLayerNormalizedLstmCellSimple) {
+    // Check if the layer normalized lstm cell simple can be fused, if not, we
+    // just don't do anything.
+    if (failed(CheckFusableLayerNormalizedLstmCellSimple(func))) return;
     func.eraseBody();
     func.addEntryBlock();
     ConvertLayerNormalizedLSTMCellSimpleToFusedLSTM
@@ -181,59 +298,6 @@ void PrepareCompositeFunctionsPass::ConvertTFImplementsWithAttributes(
   }
 }
 
-LogicalResult CheckOutputConsumer(
-    Operation* call_op, int expected_num_outputs,
-    llvm::DenseSet<int> expected_consumer_indices) {
-  const int num_results = call_op->getNumResults();
-  if (num_results != expected_num_outputs) return failure();
-
-  for (int i = 0; i < expected_num_outputs; ++i) {
-    auto it = expected_consumer_indices.find(i);
-    if (it == expected_consumer_indices.end()) {
-      // Unexpected consumer.
-      if (!call_op->getResult(i).use_empty()) return failure();
-    }
-  }
-  return success();
-}
-
-LogicalResult CheckFusableKerasLstm(FuncOp lstm_func, ModuleOp module) {
-  for (auto func : module.getOps<FuncOp>()) {
-    if (func == lstm_func) continue;
-    auto result = func.walk([&](CallOpInterface op) {
-      if (dyn_cast<FuncOp>(op.resolveCallable()) == lstm_func) {
-        // Keras LSTM have 5 outputs.
-        // We should make sure only the first or the second output are
-        // consumed.
-        if (failed(CheckOutputConsumer(op.getOperation(), 5, {0, 1})))
-          return WalkResult::interrupt();
-      }
-      return WalkResult::advance();
-    });
-
-    if (result.wasInterrupted()) return failure();
-  }
-
-  // We should know the batch size in advance for the lstm fusion.
-  // A good indicator of batch size is both cell state and input state have
-  // fixed shape. (indices 1 & 2).
-  for (int i = 1; i < 3; ++i) {
-    auto input = lstm_func.getArgument(i);
-    auto input_type = input.getType().dyn_cast_or_null<RankedTensorType>();
-    if (!input_type || !input_type.hasStaticShape()) {
-      lstm_func.emitWarning(
-          "we cannot fuse this lstm func because the batch size is not fixed, "
-          "please consider setting fixed batch size like "
-          "https://github.com/tensorflow/tensorflow/blob/master/tensorflow/"
-          "lite/examples/experimental_new_converter/"
-          "Keras_LSTM_fusion_Codelab.ipynb");
-      return failure();
-    }
-  }
-
-  return success();
-}
-
 void PrepareCompositeFunctionsPass::ConvertTFAPIImplements(FuncOp func,
                                                            StringAttr attr,
                                                            ModuleOp module) {
diff --git a/tensorflow/compiler/mlir/lite/transforms/prepare_tf.cc b/tensorflow/compiler/mlir/lite/transforms/prepare_tf.cc
@@ -526,6 +526,7 @@ struct ConvertTFStridedSlice : public RewritePattern {
 
     // Insert a new reshape op.
     Value original_input = strided_slice_op.input();
+    // TODO(b/174267775): Make sure that the input type has ranked tensor type.
     RankedTensorType original_input_type =
         original_input.getType().cast<RankedTensorType>();
     const ArrayRef<int64_t> &original_input_shape =
@@ -619,7 +620,10 @@ struct ConvertTFStridedSlice : public RewritePattern {
     }
 
     Value input = strided_slice_op.input();
-    RankedTensorType input_type = input.getType().cast<RankedTensorType>();
+    RankedTensorType input_type = input.getType().dyn_cast<RankedTensorType>();
+    if (!input_type) {
+      return failure();
+    }
     const ArrayRef<int64_t> input_shape = input_type.getShape();
 
     const int input_size = input_shape.size();