Update tf.While/tf.WhileRegion shape inference to support different operand and result shapes.

andyly · tensorflower-gardener · commit 3c572a3c5587 · 2020-11-25T08:22:12.000-08:00
tf.While/tf.WhileRegion support shapes that change in each iteration of the loop body. That case can currently be detected via the `shape_invariant` attribute, and special handling is necessary for refining shapes and propagating handle types.

PiperOrigin-RevId: 344255608
Change-Id: Ibcca0c48b7fd6e305a2b38b9261dfcbcb03815ba
diff --git a/tensorflow/compiler/mlir/tensorflow/tests/shape_inference.mlir b/tensorflow/compiler/mlir/tensorflow/tests/shape_inference.mlir
@@ -622,4 +622,99 @@ module attributes {tf.versions = {bad_consumers = [], min_consumer = 0 : i32, pr
     }
     return %0 : tensor<*xi32>
   }
+
+  // Test that a While with `shape_invariant` set only propagates operand
+  // handle types (not operand shapes) into results and functions/regions.
+  // CHECK-LABEL: func @while_shape_invariant_propagate
+  // CHECK-SAME: ({{%.+}}: tensor<4xf32>, {{%.+}}: tensor<!tf.resource<tensor<4xf32>>>, {{%.+}}: tensor<!tf.resource<tensor<8xf32>>>, {{%.+}}: tensor<1xi32>)
+  // CHECK-SAME: -> (tensor<*xf32>, tensor<*x!tf.resource<tensor<4xf32>>>, tensor<!tf.resource<tensor<8xf32>>>, tensor<?xi32>, tensor<*xf32>, tensor<*x!tf.resource<tensor<4xf32>>>, tensor<!tf.resource<tensor<8xf32>>>, tensor<?xi32>)
+  func @while_shape_invariant_propagate(%arg0: tensor<4xf32>, %arg1: tensor<!tf.resource<tensor<4xf32>>>, %arg2: tensor<!tf.resource<tensor<8xf32>>>, %arg3: tensor<1xi32>) -> (tensor<*xf32>, tensor<*x!tf.resource>, tensor<!tf.resource>, tensor<?xi32>, tensor<*xf32>, tensor<*x!tf.resource>, tensor<!tf.resource>, tensor<?xi32>) {
+    // CHECK: "tf.While"
+    // CHECK-SAME: (tensor<4xf32>, tensor<!tf.resource<tensor<4xf32>>>, tensor<!tf.resource<tensor<8xf32>>>, tensor<1xi32>)
+    // CHECK-SAME: -> (tensor<*xf32>, tensor<*x!tf.resource<tensor<4xf32>>>, tensor<!tf.resource<tensor<8xf32>>>, tensor<?xi32>)
+    %0:4 = "tf.While"(%arg0, %arg1, %arg2, %arg3) {cond = @while_shape_invariant_func_propagate, body = @while_shape_invariant_body_func_propagate, is_stateless = false, shape_invariant} : (tensor<4xf32>, tensor<!tf.resource<tensor<4xf32>>>, tensor<!tf.resource<tensor<8xf32>>>, tensor<1xi32>) -> (tensor<*xf32>, tensor<*x!tf.resource>, tensor<!tf.resource>, tensor<?xi32>)
+
+    // CHECK: "tf.WhileRegion"
+    %1:4 = "tf.WhileRegion"(%arg0, %arg1, %arg2, %arg3) ( {
+    // CHECK-NEXT: ^{{.+}}({{%.+}}: tensor<*xf32>, {{%.+}}: tensor<*x!tf.resource<tensor<4xf32>>>, {{%.+}}: tensor<!tf.resource<tensor<8xf32>>>, {{%.+}}: tensor<?xi32>):
+    ^cond(%carg0: tensor<*xf32>, %carg1: tensor<*x!tf.resource>, %carg2: tensor<!tf.resource>, %carg3: tensor<?xi32>):
+      %2 = "tf.Const"() {value = dense<true> : tensor<i1>} : () -> tensor<i1>
+      "tf.Yield"(%2) : (tensor<i1>) -> ()
+    }, {
+    // CHECK: ^{{.+}}({{%.+}}: tensor<*xf32>, {{%.+}}: tensor<*x!tf.resource<tensor<4xf32>>>, {{%.+}}: tensor<!tf.resource<tensor<8xf32>>>, {{%.+}}: tensor<?xi32>):
+    ^body(%barg0: tensor<*xf32>, %barg1: tensor<*x!tf.resource>, %barg2: tensor<!tf.resource>, %barg3: tensor<?xi32>):
+      %2 = "tf.SomeOp"(%barg3) : (tensor<?xi32>) -> tensor<?xi32>
+      // CHECK: "tf.Yield"
+      // CHECK-SAME: (tensor<*xf32>, tensor<*x!tf.resource<tensor<4xf32>>>, tensor<!tf.resource<tensor<8xf32>>>, tensor<?xi32>) -> ()
+      "tf.Yield"(%barg0, %barg1, %barg2, %2) : (tensor<*xf32>, tensor<*x!tf.resource>, tensor<!tf.resource>, tensor<?xi32>) -> ()
+    // CHECK-NEXT: shape_invariant
+    // CHECK-SAME: (tensor<4xf32>, tensor<!tf.resource<tensor<4xf32>>>, tensor<!tf.resource<tensor<8xf32>>>, tensor<1xi32>)
+    // CHECK-SAME: -> (tensor<*xf32>, tensor<*x!tf.resource<tensor<4xf32>>>, tensor<!tf.resource<tensor<8xf32>>>, tensor<?xi32>)
+    }) {is_stateless = false, shape_invariant} : (tensor<4xf32>, tensor<!tf.resource<tensor<4xf32>>>, tensor<!tf.resource<tensor<8xf32>>>, tensor<1xi32>) -> (tensor<*xf32>, tensor<*x!tf.resource>, tensor<!tf.resource>, tensor<?xi32>)
+
+    return %0#0, %0#1, %0#2, %0#3, %1#0, %1#1, %1#2, %1#3 : tensor<*xf32>, tensor<*x!tf.resource>, tensor<!tf.resource>, tensor<?xi32>, tensor<*xf32>, tensor<*x!tf.resource>, tensor<!tf.resource>, tensor<?xi32>
+  }
+
+  // CHECK-LABEL: func @while_shape_invariant_func_propagate
+  // CHECK-SAME: ({{%.+}}: tensor<*xf32>, {{%.+}}: tensor<*x!tf.resource<tensor<4xf32>>>, {{%.+}}: tensor<!tf.resource<tensor<8xf32>>>, {{%.+}}: tensor<?xi32>)
+  // CHECK-SAME: -> tensor<i1>
+  func @while_shape_invariant_func_propagate(%arg0: tensor<*xf32>, %arg1: tensor<*x!tf.resource>, %arg2: tensor<!tf.resource>, %arg3: tensor<?xi32>) -> tensor<i1> {
+    %0 = "tf.Const"() {value = dense<true> : tensor<i1>} : () -> tensor<i1>
+    return %0 : tensor<i1>
+  }
+
+  // CHECK-LABEL: func @while_shape_invariant_body_func_propagate
+  // CHECK-SAME: ({{%.+}}: tensor<*xf32>, {{%.+}}: tensor<*x!tf.resource<tensor<4xf32>>>, {{%.+}}: tensor<!tf.resource<tensor<8xf32>>>, {{%.+}}: tensor<?xi32>)
+  // CHECK-SAME: -> (tensor<*xf32>, tensor<*x!tf.resource<tensor<4xf32>>>, tensor<!tf.resource<tensor<8xf32>>>, tensor<?xi32>)
+  func @while_shape_invariant_body_func_propagate(%arg0: tensor<*xf32>, %arg1: tensor<*x!tf.resource>, %arg2: tensor<!tf.resource>, %arg3: tensor<?xi32>) -> (tensor<*xf32>, tensor<*x!tf.resource>, tensor<!tf.resource>, tensor<?xi32>) {
+    %0 = "tf.SomeOp"(%arg3) : (tensor<?xi32>) -> tensor<?xi32>
+    return %arg0, %arg1, %arg2, %0 : tensor<*xf32>, tensor<*x!tf.resource>, tensor<!tf.resource>, tensor<?xi32>
+  }
+
+  // Test shape invariant While with result type refinement.
+  // CHECK-LABEL: func @while_shape_invariant_refine
+  // CHECK-SAME: ({{%.+}}: tensor<2xi32>, {{%.+}}: tensor<8xf32>, {{%.+}}: tensor<?xi1>)
+  // CHECK-SAME: -> (tensor<2xi32>, tensor<8xf32>, tensor<?xi1>, tensor<2xi32>, tensor<8xf32>, tensor<?xi1>)
+  func @while_shape_invariant_refine(%arg0: tensor<2xi32>, %arg1: tensor<8xf32>, %arg2: tensor<?xi1>) -> (tensor<?xi32>, tensor<*xf32>, tensor<*xi1>, tensor<?xi32>, tensor<*xf32>, tensor<*xi1>) {
+    // CHECK: "tf.While"
+    // CHECK-SAME: (tensor<2xi32>, tensor<8xf32>, tensor<?xi1>)
+    // CHECK-SAME: -> (tensor<2xi32>, tensor<8xf32>, tensor<?xi1>)
+    %0:3 = "tf.While"(%arg0, %arg1, %arg2) {cond = @while_shape_invariant_func_refine, body = @while_shape_invariant_body_func_refine, is_stateless = false, shape_invariant} : (tensor<2xi32>, tensor<8xf32>, tensor<?xi1>) -> (tensor<?xi32>, tensor<*xf32>, tensor<*xi1>)
+
+    // CHECK: "tf.WhileRegion"
+    %1:3 = "tf.WhileRegion"(%arg0, %arg1, %arg2) ( {
+    // CHECK-NEXT: ^{{.+}}({{%.+}}: tensor<2xi32>, {{%.+}}: tensor<8xf32>, {{%.+}}: tensor<?xi1>):
+    ^cond(%carg0: tensor<2xi32>, %carg1: tensor<8xf32>, %carg2: tensor<?xi1>):
+      %2 = "tf.Const"() {value = dense<true> : tensor<i1>} : () -> tensor<i1>
+      "tf.Yield"(%2) : (tensor<i1>) -> ()
+    }, {
+    // CHECK: ^{{.+}}({{%.+}}: tensor<2xi32>, {{%.+}}: tensor<8xf32>, {{%.+}}: tensor<?xi1>):
+    ^body(%barg0: tensor<2xi32>, %barg1: tensor<8xf32>, %barg2: tensor<?xi1>):
+      %2:3 = "tf.IdentityN"(%barg0, %barg1, %barg2) : (tensor<2xi32>, tensor<8xf32>, tensor<?xi1>) -> (tensor<?xi32>, tensor<*xf32>, tensor<*xi1>)
+      // CHECK: "tf.Yield"
+      // CHECK-SAME: (tensor<2xi32>, tensor<8xf32>, tensor<?xi1>) -> ()
+      "tf.Yield"(%2#0, %2#1, %2#2) : (tensor<?xi32>, tensor<*xf32>, tensor<*xi1>) -> ()
+    // CHECK-NEXT: shape_invariant
+    // CHECK-SAME: (tensor<2xi32>, tensor<8xf32>, tensor<?xi1>)
+    // CHECK-SAME: -> (tensor<2xi32>, tensor<8xf32>, tensor<?xi1>)
+    }) {is_stateless = false, shape_invariant} : (tensor<2xi32>, tensor<8xf32>, tensor<?xi1>) -> (tensor<?xi32>, tensor<*xf32>, tensor<*xi1>)
+
+    return %0#0, %0#1, %0#2, %1#0, %1#1, %1#2 : tensor<?xi32>, tensor<*xf32>, tensor<*xi1>, tensor<?xi32>, tensor<*xf32>, tensor<*xi1>
+  }
+
+  // CHECK-LABEL: func @while_shape_invariant_func_refine
+  // CHECK-SAME: ({{%.+}}: tensor<2xi32>, {{%.+}}: tensor<8xf32>, {{%.+}}: tensor<?xi1>)
+  // CHECK-SAME: -> tensor<i1>
+  func @while_shape_invariant_func_refine(%arg0: tensor<2xi32>, %arg1: tensor<8xf32>, %arg2: tensor<?xi1>) -> tensor<i1> {
+    %0 = "tf.Const"() {value = dense<true> : tensor<i1>} : () -> tensor<i1>
+    return %0 : tensor<i1>
+  }
+
+  // CHECK-LABEL: func @while_shape_invariant_body_func_refine
+  // CHECK-SAME: ({{%.+}}: tensor<2xi32>, {{%.+}}: tensor<8xf32>, {{%.+}}: tensor<?xi1>)
+  // CHECK-SAME: -> (tensor<2xi32>, tensor<8xf32>, tensor<?xi1>)
+  func @while_shape_invariant_body_func_refine(%arg0: tensor<2xi32>, %arg1: tensor<8xf32>, %arg2: tensor<?xi1>) -> (tensor<?xi32>, tensor<*xf32>, tensor<*xi1>) {
+    %0:3 = "tf.IdentityN"(%arg0, %arg1, %arg2) : (tensor<2xi32>, tensor<8xf32>, tensor<?xi1>) -> (tensor<?xi32>, tensor<*xf32>, tensor<*xi1>)
+    return %0#0, %0#1, %0#2 : tensor<?xi32>, tensor<*xf32>, tensor<*xi1>
+  }
 }
diff --git a/tensorflow/compiler/mlir/tensorflow/transforms/shape_inference.cc b/tensorflow/compiler/mlir/tensorflow/transforms/shape_inference.cc
@@ -279,6 +279,16 @@ class ShapeInference {
     results_[value_port] = value;
   }
 
+  // Infers result types of tf.While/tf.WhileRegion from its operands and the
+  // result types of its body (`body_result_types`). If the `shape_invariant`
+  // attribute is not set, operand shapes are propagated to result shapes. If
+  // it is set, an operand type is used as the result type only when the
+  // associated body result type matches it (does not change per loop
+  // iteration); otherwise only handle types are propagated to the result type,
+  // so a result whose shape differs from its operand is not wrongly changed.
+  template <typename WhileOpTy>
+  bool InferShapeForWhile(WhileOpTy op, TypeRange body_result_types);
+
   // Performs shape inference on the provided op and return true if the type of
   // at least one result has been changed.
   // A tf.Cast() is inserted for any uses that isn't in the TensorFlow dialect.
@@ -298,16 +308,17 @@ class ShapeInference {
   //   1) They are never reused, ie. having a single use in module.
   //   2) Their input types match those of their parent ops (excluding inputs
   //      like predicate).
-  LogicalResult PropagateShapeToFunctions(
-      ModuleOp module, Operation::operand_type_range input_types,
-      ArrayRef<FuncOp> functions, int64_t max_iteration);
+  LogicalResult PropagateShapeToFunctions(ModuleOp module,
+                                          TypeRange input_types,
+                                          ArrayRef<FuncOp> functions,
+                                          int64_t max_iteration);
 
   // Propagates shapes to regions given the shapes of the inputs of the regions.
   // All regions provided in `regions` are assumed to have inputs of type
   // `input_types`.
-  LogicalResult PropagateShapeToRegions(
-      Operation::operand_type_range input_types, ArrayRef<Region*> regions,
-      int64_t max_iteration);
+  LogicalResult PropagateShapeToRegions(TypeRange input_types,
+                                        ArrayRef<Region*> regions,
+                                        int64_t max_iteration);
 
   // Shape propagation for call/control flow ops.
   LogicalResult PropagateShapeIntoAttachedFunctions(Operation* op,
@@ -757,15 +768,58 @@ bool ShapeInference::InferShapeForNonTFDialectOperation(Operation* op) {
   return false;
 }
 
+// Returns the operand's handle type if it has subtypes and `result_type` has
+// none; otherwise (including non-handle types) `result_type`'s element type.
+Type GetElementTypeFromOperand(TensorType operand_type,
+                               TensorType result_type) {
+  Type result_element = result_type.getElementType();
+  auto operand_handle =
+      operand_type.getElementType().dyn_cast<TensorFlowTypeWithSubtype>();
+  auto result_handle = result_element.dyn_cast<TensorFlowTypeWithSubtype>();
+  if (!operand_handle || !result_handle ||
+      operand_handle.GetSubtypes().empty() ||
+      !result_handle.GetSubtypes().empty())
+    return result_element;
+  return operand_handle;
+}
+
+template <typename WhileOpTy>
+bool ShapeInference::InferShapeForWhile(WhileOpTy op,
+                                        TypeRange body_result_types) {
+  // Without `shape_invariant`, operands are passed through to the results.
+  if (!op.shape_invariant())
+    return RefineTypeForPassThroughOperands(op, op.input(), op.output());
+
+  bool any_refined = false;
+  for (auto item :
+       zip(op.input().getTypes(), op.output(), body_result_types)) {
+    auto input_type = std::get<0>(item).template cast<TensorType>();
+    Value output = std::get<1>(item);
+    auto yielded_type = std::get<2>(item).template cast<TensorType>();
+    // An operand type the body returns unchanged is used as the result type.
+    Type refined = input_type;
+    if (input_type != yielded_type) {
+      // Otherwise keep the result shape and only refine its element type.
+      auto output_type = output.getType().cast<TensorType>();
+      Type element_type = GetElementTypeFromOperand(input_type, output_type);
+      if (output_type.hasRank())
+        refined = RankedTensorType::get(output_type.getShape(), element_type);
+      else
+        refined = UnrankedTensorType::get(element_type);
+    }
+    any_refined |= RefineResultType(op, output, refined);
+  }
+  return any_refined;
+}
+
 bool ShapeInference::InferShapeForSingleOperation(Operation* op) {
   LLVM_DEBUG(op->print(llvm::dbgs() << "InferShapeForSingleOperation for ");
              llvm::dbgs() << "\n");
   assert(tf_dialect_ == op->getDialect());
   // The shape function of these ops sometimes does not propagate subtypes
   // (handle shapes) for resource and variant types. We use a simple passthrough
   // to make sure they are preserved in the output.
-  if (isa<TF::IdentityOp, TF::IdentityNOp, TF::ZerosLikeOp, TF::WhileOp,
-          TF::WhileRegionOp>(op)) {
+  if (isa<TF::IdentityOp, TF::IdentityNOp, TF::ZerosLikeOp>(op)) {
     return RefineTypeForPassThroughOperands(op, op->getOperands(),
                                             op->getResults());
   }
@@ -799,6 +853,15 @@ bool ShapeInference::InferShapeForSingleOperation(Operation* op) {
   if (auto if_region = dyn_cast<IfRegionOp>(op))
     return InferShapeForIfRegion(if_region);
 
+  if (auto while_op = dyn_cast<WhileOp>(op))
+    return InferShapeForWhile(while_op,
+                              while_op.body_function().getType().getResults());
+
+  if (auto while_region = dyn_cast<WhileRegionOp>(op))
+    return InferShapeForWhile(
+        while_region,
+        while_region.body().front().getTerminator()->getOperandTypes());
+
   // Return operand as a constant attribute.
   auto operand_as_constant_fn = [&](Value operand) {
     ValuePort vp(operand);
@@ -851,8 +914,8 @@ bool ShapeInference::InferShapeForSingleOperation(Operation* op) {
 }
 
 LogicalResult ShapeInference::PropagateShapeToFunctions(
-    ModuleOp module, Operation::operand_type_range input_types,
-    ArrayRef<FuncOp> functions, int64_t max_iteration) {
+    ModuleOp module, TypeRange input_types, ArrayRef<FuncOp> functions,
+    int64_t max_iteration) {
   bool all_succeeded = true;
   // If shape propagation fails for one function, return failure, but do not
   // early exit and attempt to propagate shapes for all provided functions to
@@ -885,9 +948,9 @@ LogicalResult ShapeInference::PropagateShapeToFunctions(
   return success(all_succeeded);
 }
 
-LogicalResult ShapeInference::PropagateShapeToRegions(
-    Operation::operand_type_range input_types, ArrayRef<Region*> regions,
-    int64_t max_iteration) {
+LogicalResult ShapeInference::PropagateShapeToRegions(TypeRange input_types,
+                                                      ArrayRef<Region*> regions,
+                                                      int64_t max_iteration) {
   DCOMMENT("\tPropagating shapes to regions");
   bool all_succeeded = true;
   // If shape propagation fails for one region, return failure, but do not
@@ -965,23 +1028,68 @@ void ShapeInference::PropagateConstantFromCallee(CallOpInterface call_op,
   }
 }
 
+// Computes the types to propagate into the functions/regions of a shape
+// invariant tf.While/tf.WhileRegion. An operand type that equals its result
+// type is used as is. Otherwise the function/region argument type is kept,
+// but with the handle type from the operand type.
+// TODO(b/174145518): Support more granular shape refining of different shaped
+// operands and results (e.g. if rank does not change or only some dimensions
+// change).
+llvm::SmallVector<Type, 4> GetWhileCompatibleTypes(
+    TypeRange operand_types, TypeRange result_types,
+    TypeRange region_argument_types) {
+  llvm::SmallVector<Type, 4> compatible_types;
+  compatible_types.reserve(operand_types.size());
+  for (auto types :
+       llvm::zip(operand_types, result_types, region_argument_types)) {
+    Type operand_type = std::get<0>(types);
+    // Same operand and result type: propagate it unchanged.
+    if (operand_type == std::get<1>(types)) {
+      compatible_types.push_back(operand_type);
+      continue;
+    }
+    // Types differ: keep the shape of the function/region argument and only
+    // pick its element type via GetElementTypeFromOperand.
+    auto argument_type = std::get<2>(types).cast<TensorType>();
+    Type element_type = GetElementTypeFromOperand(
+        operand_type.cast<TensorType>(), argument_type);
+    if (argument_type.hasRank())
+      compatible_types.push_back(
+          RankedTensorType::get(argument_type.getShape(), element_type));
+    else
+      compatible_types.push_back(UnrankedTensorType::get(element_type));
+  }
+  return compatible_types;
+}
+
 LogicalResult ShapeInference::PropagateShapeIntoAttachedFunctions(
     Operation* op, int64_t max_iteration) {
   ModuleOp module = op->getParentOfType<ModuleOp>();
   if (auto if_op = dyn_cast<TF::IfOp>(op)) {
     DCOMMENT("Propagating shapes into If");
     return PropagateShapeToFunctions(
-        module, drop_begin(if_op.getOperandTypes(), 1),
+        module, if_op.input().getTypes(),
         {if_op.then_function(), if_op.else_function()}, max_iteration);
   } else if (auto case_op = dyn_cast<TF::CaseOp>(op)) {
     SmallVector<FuncOp, 4> branches;
     case_op.get_branch_functions(branches);
-    return PropagateShapeToFunctions(module,
-                                     drop_begin(case_op.getOperandTypes(), 1),
+    return PropagateShapeToFunctions(module, case_op.input().getTypes(),
                                      branches, max_iteration);
   } else if (auto while_op = dyn_cast<TF::WhileOp>(op)) {
+    // If `shape_invariant` is set, operand shapes cannot be simply propagated
+    // to result shapes as the op may have different intermediate shapes (such
+    // While ops can have different result shapes from operand shapes).
+    // Compatible shapes must be determined before propagating them.
+    if (while_op.shape_invariant()) {
+      auto compatible_types = GetWhileCompatibleTypes(
+          while_op.input().getTypes(), while_op.output().getTypes(),
+          while_op.body_function().getType().getInputs());
+      return PropagateShapeToFunctions(
+          module, compatible_types,
+          {while_op.cond_function(), while_op.body_function()}, max_iteration);
+    }
     return PropagateShapeToFunctions(
-        module, while_op.getOperandTypes(),
+        module, while_op.input().getTypes(),
         {while_op.cond_function(), while_op.body_function()}, max_iteration);
   } else if (auto call_op = dyn_cast<CallOpInterface>(op)) {
     if (auto func = dyn_cast<FuncOp>(call_op.resolveCallable())) {
@@ -1004,7 +1112,19 @@ LogicalResult ShapeInference::PropagateShapeIntoAttachedFunctions(
 LogicalResult ShapeInference::PropagateShapeIntoAttachedRegions(
     Operation* op, int64_t max_iteration) {
   if (auto while_op = dyn_cast<TF::WhileRegionOp>(op)) {
-    return PropagateShapeToRegions(while_op.getOperandTypes(),
+    // If `shape_invariant` is set, operand shapes cannot be simply propagated
+    // to result shapes as the op may have different intermediate shapes (such
+    // While ops can have different result shapes from operand shapes).
+    // Compatible shapes must be determined before propagating them.
+    if (while_op.shape_invariant()) {
+      auto compatible_types = GetWhileCompatibleTypes(
+          while_op.input().getTypes(), while_op.output().getTypes(),
+          while_op.body().getArgumentTypes());
+      return PropagateShapeToRegions(compatible_types,
+                                     {&while_op.cond(), &while_op.body()},
+                                     max_iteration);
+    }
+    return PropagateShapeToRegions(while_op.input().getTypes(),
                                    {&while_op.cond(), &while_op.body()},
                                    max_iteration);
   }