@@ -77,6 +77,51 @@ class SoftmaxOp : public XlaOpKernel {
 REGISTER_XLA_OP("Softmax", SoftmaxOp);
 REGISTER_XLA_OP("LogSoftmax", SoftmaxOp);

+std::pair<xla::ComputationDataHandle, xla::ComputationDataHandle>
+CrossEntropyWithLogits(XlaOpKernelContext* ctx, DataType type,
+                       const xla::ComputationDataHandle& logits,
+                       const xla::ComputationDataHandle& labels) {
+  const xla::Computation& max_func = *ctx->GetOrCreateMax(type);
+  const xla::Computation& add_func = *ctx->GetOrCreateAdd(type);
+
+  const int kBatchDim = 0;
+  const int kClassDim = 1;
+
+  xla::ComputationBuilder* b = ctx->builder();
+  // Find the max in each batch, resulting in a tensor of shape [batch]
+  auto logits_max =
+      b->Reduce(logits, XlaHelpers::MinValue(b, type), max_func, {kClassDim});
+
+  // Subtract the max in batch b from every element in batch b.
+  // Broadcasts along the batch dimension.
+  auto shifted_logits = b->Sub(logits, logits_max, {kBatchDim});
+
+  // exp(logits - max_logits)
+  auto exp_shifted_logits = b->Exp(shifted_logits);
+
+  // sum_{class} (exp(logits - max_logits))
+  auto sum_exp = b->Reduce(exp_shifted_logits, XlaHelpers::Zero(b, type),
+                           add_func, {kClassDim});
+
+  // log(sum(exp(logits - max_logits)))
+  auto log_sum_exp = b->Log(sum_exp);
+
+  // sum(-labels *
+  //     ((logits - max_logits) - log(sum(exp(logits - max_logits)))))
+  // along classes
+  // (The subtraction broadcasts along the batch dimension.)
+  xla::ComputationDataHandle loss = b->Reduce(
+      b->Mul(b->Neg(labels), b->Sub(shifted_logits, log_sum_exp, {kBatchDim})),
+      XlaHelpers::Zero(b, type), add_func, {kClassDim});
+
+  // backprop: prob - labels, where
+  //   prob = exp(logits - max_logits) / sum(exp(logits - max_logits))
+  // (where the division broadcasts along the batch dimension)
+  xla::ComputationDataHandle backprop =
+      b->Sub(b->Div(exp_shifted_logits, sum_exp, {kBatchDim}), labels);
+  return {loss, backprop};
+}
+
 class SoftmaxXentWithLogitsOp : public XlaOpKernel {
  public:
   explicit SoftmaxXentWithLogitsOp(OpKernelConstruction* ctx)
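(Aside, not part of the commit: for readers following the math rather than the XLA builder calls, below is a minimal standalone sketch in plain C++ of the same numerically stable computation that CrossEntropyWithLogits builds above: shift each row by its max, take log-sum-exp, then loss = sum(-labels * (shifted_logits - log_sum_exp)) per row and backprop = softmax - labels. All names and values are purely illustrative.)

#include <algorithm>
#include <cmath>
#include <cstdio>
#include <vector>

int main() {
  const int batch = 2, classes = 3;
  std::vector<std::vector<double>> logits = {{1.0, 2.0, 3.0}, {0.5, 0.5, 0.5}};
  std::vector<std::vector<double>> labels = {{0.0, 0.0, 1.0}, {0.0, 1.0, 0.0}};

  for (int b = 0; b < batch; ++b) {
    // Max over classes, used to shift logits for numerical stability.
    double max_logit = logits[b][0];
    for (double x : logits[b]) max_logit = std::max(max_logit, x);

    // sum(exp(logits - max_logits)) and its log.
    double sum_exp = 0.0;
    for (double x : logits[b]) sum_exp += std::exp(x - max_logit);
    double log_sum_exp = std::log(sum_exp);

    // loss = sum(-labels * ((logits - max_logits) - log_sum_exp)) over classes
    // backprop = exp(logits - max_logits) / sum_exp - labels
    double loss = 0.0;
    for (int c = 0; c < classes; ++c) {
      double shifted = logits[b][c] - max_logit;
      loss += -labels[b][c] * (shifted - log_sum_exp);
      double backprop = std::exp(shifted) / sum_exp - labels[b][c];
      std::printf("backprop[%d][%d] = %f\n", b, c, backprop);
    }
    std::printf("loss[%d] = %f\n", b, loss);
  }
  return 0;
}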
@@ -88,65 +133,95 @@ class SoftmaxXentWithLogitsOp : public XlaOpKernel {
     OP_REQUIRES(ctx, logits_shape.IsSameSize(labels_shape),
                 errors::InvalidArgument(
                     "logits and labels must be same size: logits_size=",
-                    logits_shape.DebugString(), " labels_size=",
-                    labels_shape.DebugString()));
+                    logits_shape.DebugString(),
+                    " labels_size=", labels_shape.DebugString()));
     OP_REQUIRES(ctx, TensorShapeUtils::IsMatrix(logits_shape),
                 errors::InvalidArgument("logits must be 2-dimensional"));
     // As we already tested that both inputs have the same shape no need to
     // check that "labels" is a matrix too.

-    // loss is 1-D (one per example), and size is batch_size.
-
-    const int kBatchDim = 0;
-    const int kClassDim = 1;
-
     const DataType type = input_type(0);
-    xla::ComputationBuilder* b = ctx->builder();
     auto logits = ctx->Input(0);
     auto labels = ctx->Input(1);

-    const xla::Computation& max_func = *ctx->GetOrCreateMax(type);
-    const xla::Computation& add_func = *ctx->GetOrCreateAdd(type);
-
-    // Find the max in each batch, resulting in a tensor of shape [batch]
-    auto logits_max =
-        b->Reduce(logits, XlaHelpers::MinValue(b, type), max_func, {kClassDim});
-
-    // Subtract the max in batch b from every element in batch b.
-    // Broadcasts along the batch dimension.
-    auto shifted_logits = b->Sub(logits, logits_max, {kBatchDim});
-
-    // exp(logits - max_logits)
-    auto exp_shifted_logits = b->Exp(shifted_logits);
-
-    // sum_{class} (exp(logits - max_logits))
-    auto sum_exp = b->Reduce(exp_shifted_logits, XlaHelpers::Zero(b, type),
-                             add_func, {kClassDim});
-
-    // log(sum(exp(logits - max_logits)))
-    auto log_sum_exp = b->Log(sum_exp);
+    xla::ComputationDataHandle loss, backprop;
+    std::tie(loss, backprop) =
+        CrossEntropyWithLogits(ctx, type, logits, labels);
+    ctx->SetOutput(0, loss);
+    ctx->SetOutput(1, backprop);
+  }
+};

-    // sum(-labels *
-    //     ((logits - max_logits) - log(sum(exp(logits - max_logits)))))
-    // along classes
-    // (The subtraction broadcasts along the batch dimension.)
-    xla::ComputationDataHandle loss =
-        b->Reduce(b->Mul(b->Neg(labels),
-                         b->Sub(shifted_logits, log_sum_exp, {kBatchDim})),
-                  XlaHelpers::Zero(b, type), add_func, {kClassDim});
+REGISTER_XLA_OP("SoftmaxCrossEntropyWithLogits", SoftmaxXentWithLogitsOp);

-    // backprop: prob - labels, where
-    //   prob = exp(logits - max_logits) / sum(exp(logits - max_logits))
-    // (where the division broadcasts along the batch dimension)
-    xla::ComputationDataHandle backprop =
-        b->Sub(b->Div(exp_shifted_logits, sum_exp, {kBatchDim}), labels);
+class SparseSoftmaxXentWithLogitsOp : public XlaOpKernel {
+ public:
+  explicit SparseSoftmaxXentWithLogitsOp(OpKernelConstruction* ctx)
+      : XlaOpKernel(ctx) {}

+  void Compile(XlaOpKernelContext* ctx) override {
+    const TensorShape logits_shape = ctx->InputShape(0);
+    const TensorShape labels_shape = ctx->InputShape(1);
+    OP_REQUIRES(ctx, TensorShapeUtils::IsMatrix(logits_shape),
+                errors::InvalidArgument("logits must be 2-D, but got shape ",
+                                        logits_shape.DebugString()));
+    OP_REQUIRES(ctx, TensorShapeUtils::IsVector(labels_shape),
+                errors::InvalidArgument("labels must be 1-D, but got shape ",
+                                        labels_shape.DebugString()));
+    OP_REQUIRES(ctx, logits_shape.dim_size(0) == labels_shape.dim_size(0),
+                errors::InvalidArgument(
+                    "logits and labels must have the same first dimension, "
+                    "got logits shape ",
+                    logits_shape.DebugString(), " and labels shape ",
+                    labels_shape.DebugString()));
+    OP_REQUIRES(ctx, logits_shape.dim_size(1) > 0,
+                errors::InvalidArgument(
+                    "Must have at least one class, but got logits shape ",
+                    logits_shape.DebugString()));
+
+    int64 batch_size = logits_shape.dim_size(0);
+    int64 depth = logits_shape.dim_size(1);
+
+    DataType logits_type = input_type(0);
+    DataType indices_type = input_type(1);
+
+    xla::ComputationDataHandle indices = ctx->Input(1);
+
+    xla::ComputationBuilder* builder = ctx->builder();
+    xla::ComputationDataHandle labels;
+    OP_REQUIRES_OK(ctx,
+                   XlaHelpers::OneHot(
+                       builder, depth, /*axis=*/1, input_type(1), labels_shape,
+                       indices, XlaHelpers::One(builder, logits_type),
+                       XlaHelpers::Zero(builder, logits_type), &labels));
+
+    // If any of the indices are out of range, we must populate the labels with
+    // NaNs to obey the interface contract of
+    // tf.nn.sparse_softmax_cross_entropy_with_logits.
+    // Builds a vector of {batch_size} that is 0 if the index is in range, or
+    // NaN otherwise; then add that vector to the labels to force out-of-range
+    // values to NaNs.
+    xla::ComputationDataHandle nan_or_zero = builder->Select(
+        builder->LogicalAnd(
+            builder->Le(XlaHelpers::Zero(builder, indices_type), indices),
+            builder->Lt(indices, XlaHelpers::IntegerLiteral(
+                                     builder, indices_type, depth))),
+        builder->Broadcast(XlaHelpers::Zero(builder, logits_type),
+                           {batch_size}),
+        builder->Broadcast(XlaHelpers::FloatLiteral(builder, logits_type, NAN),
+                           {batch_size}));
+    labels = builder->Add(labels, nan_or_zero, {0});
+
+    xla::ComputationDataHandle loss, backprop;
+    std::tie(loss, backprop) =
+        CrossEntropyWithLogits(ctx, logits_type, ctx->Input(0), labels);
     ctx->SetOutput(0, loss);
     ctx->SetOutput(1, backprop);
   }
 };

-REGISTER_XLA_OP("SoftmaxCrossEntropyWithLogits", SoftmaxXentWithLogitsOp);
+REGISTER_XLA_OP("SparseSoftmaxCrossEntropyWithLogits",
+                SparseSoftmaxXentWithLogitsOp);

 }  // namespace
 }  // namespace tensorflow
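(Aside, not part of the commit: a plain-C++ sketch of how SparseSoftmaxXentWithLogitsOp prepares its dense labels. The sparse indices are one-hot encoded, and every row whose index falls outside [0, depth) is forced to NaN by adding a per-example NaN-or-zero vector, mirroring the contract of tf.nn.sparse_softmax_cross_entropy_with_logits. Names and values below are made up for illustration.)

#include <cmath>
#include <cstdio>
#include <vector>

int main() {
  const int batch_size = 3, depth = 4;
  std::vector<long long> indices = {2, 7, 0};  // 7 is out of range

  // One-hot labels: labels[b][c] = 1 if indices[b] == c, else 0.
  std::vector<std::vector<double>> labels(batch_size,
                                          std::vector<double>(depth, 0.0));
  for (int b = 0; b < batch_size; ++b) {
    if (indices[b] >= 0 && indices[b] < depth) labels[b][indices[b]] = 1.0;
  }

  // nan_or_zero[b] is 0 for a valid index and NaN otherwise; adding it
  // along the batch dimension poisons out-of-range rows with NaNs.
  for (int b = 0; b < batch_size; ++b) {
    double nan_or_zero = (indices[b] >= 0 && indices[b] < depth) ? 0.0 : NAN;
    for (int c = 0; c < depth; ++c) labels[b][c] += nan_or_zero;
  }

  for (int b = 0; b < batch_size; ++b) {
    for (int c = 0; c < depth; ++c) std::printf("%g ", labels[b][c]);
    std::printf("\n");
  }
  return 0;
}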