// Copyright 2020 TensorFlow Authors
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

#if defined(_WIN32)
#define XLA_API __declspec(dllexport)
#else
#define XLA_API __attribute__((__visibility__("default")))
#endif

| 21 | +#include "xla_tensor_wrapper.h" |
| 22 | + |
| 23 | +#include "absl/container/flat_hash_set.h" |
| 24 | +#include "tensorflow/compiler/tf2xla/xla_tensor/helpers.h" |
| 25 | +#include "tensorflow/compiler/tf2xla/xla_tensor/ir.h" |
| 26 | +#include "tensorflow/compiler/tf2xla/xla_tensor/lowering_context.h" |
| 27 | + |
using swift_xla::XLATensor;
using swift_xla::ir::LoweringContext;
using swift_xla::ir::Node;
using swift_xla::ir::NodePtr;
using swift_xla::ir::OpList;
using swift_xla::ir::Output;
using swift_xla::ir::Value;
using swift_xla::ir::XlaOpVector;

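// Builds the tuple shape whose elements are the shapes of the given IR
// values; used below as the result shape of the functional while node.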
xla::Shape ShapeOfXlaOpList(absl::Span<const Value> ops) {
  xla::Shape result;
  result.set_element_type(xla::TUPLE);
  result.mutable_tuple_shapes()->reserve(ops.size());
  for (const auto& op : ops) {
    xla::ShapeUtil::AppendShapeToTuple(op.shape(), &result);
  }
  TF_DCHECK_OK(xla::ShapeUtil::ValidateShapeWithOptionalLayout(result));
  return result;
}

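// Finds the values computed outside the loop that the loop body implicitly
// captures. It works in three passes over the use-def graph: (1) walk
// backwards from the loop results, recording reverse edges; (2) propagate a
// "depends on a placeholder" bit forwards from the placeholders along those
// reverse edges; (3) walk backwards from the results again, cutting the
// search at nodes that do not depend on any placeholder. Those cut points
// are exactly the extra inputs that must be threaded into the loop.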
struct ExtraInputDiscovery {
  // TODO: Color nodes while building the graph; the current search can be
  // O(n^2) in the number of for loops.
  void BackRefVisit(const Output& v, const Node* node = nullptr) {
    auto& state = state_map[v.node];
    if (!state.visited) {
      state.visited = true;
      work_list.push_back(v.node);
    }
    if (node) state.refs.push_back(node);
  }
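  // Marks a node as (transitively) depending on a placeholder and queues it
  // for forward propagation along the recorded back-references.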
  void PlaceholderVisit(const Node* node) {
    auto& state = state_map[node];
    if (!state.depends_on_placeholder) {
      state.depends_on_placeholder = true;
      work_list.push_back(node);
    }
  }
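  // Pass 1: drains the work list, visiting each node's operands so that every
  // node reachable from the results records its referencing nodes.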
  void WorkListBackRefVisit() {
    while (!work_list.empty()) {
      const Node* node = work_list.back();
      work_list.pop_back();
      for (const auto& value : node->operands()) {
        BackRefVisit(value, node);
      }
    }
  }
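  // Pass 2: drains the work list, propagating depends_on_placeholder to every
  // node that references a placeholder-dependent node.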
  void WorkListPlaceholderVisit() {
    while (!work_list.empty()) {
      const Node* node = work_list.back();
      work_list.pop_back();
      for (auto* ref : state_map[node].refs) {
        PlaceholderVisit(ref);
      }
    }
  }
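  // Pass 3: a value whose producer does not depend on any placeholder is
  // computed entirely outside the loop, so record it as an extra input;
  // placeholder-dependent producers are searched recursively.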
  void BackRefVisitExtraSearch(const Output& v, const NodePtr& n) {
    auto& state = state_map[v.node];
    if (!state.visited_looking_for_extras) {
      state.visited_looking_for_extras = true;
      if (state.depends_on_placeholder) {
        work_list.push_back(v.node);
      } else {
        results.push_back(Value(n, v.index));
      }
    }
  }
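  // Drains the work list for pass 3, walking operands alongside their owning
  // NodePtrs so each recorded extra input keeps a strong reference to its
  // producer.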
  void WorkListBackRefVisitExtraSearch() {
    while (!work_list.empty()) {
      const Node* node = work_list.back();
      work_list.pop_back();
      const auto& operands = node->operands();
      const auto& node_ptrs = node->operand_nodes();
      for (size_t i = 0; i < operands.size(); ++i) {
        BackRefVisitExtraSearch(operands[i], node_ptrs[i]);
      }
    }
  }
  struct State {
    State() {}
    // Has been fully visited if true and work_list.empty().
    bool visited = false;
    bool depends_on_placeholder = false;
    bool visited_looking_for_extras = false;
    std::vector<const Node*> refs;
  };
  std::vector<const Node*> work_list;
  absl::flat_hash_map<const Node*, State> state_map;
  std::vector<Value> results;
};

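// Runs the three passes described above and returns the values the loop body
// captures from the enclosing graph.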
| 119 | +std::vector<Value> DiscoverExtraInputs(absl::Span<const Value> results, |
| 120 | + const Value& index_placeholder, |
| 121 | + absl::Span<const Value> placeholders) { |
| 122 | + ExtraInputDiscovery state; |
| 123 | + for (auto& result : results) { |
| 124 | + state.BackRefVisit(result); |
| 125 | + } |
| 126 | + state.WorkListBackRefVisit(); |
| 127 | + for (auto& placeholder : placeholders) { |
| 128 | + state.PlaceholderVisit(placeholder.node.get()); |
| 129 | + } |
| 130 | + state.PlaceholderVisit(index_placeholder.node.get()); |
| 131 | + state.WorkListPlaceholderVisit(); |
| 132 | + for (auto& result : results) { |
| 133 | + state.BackRefVisitExtraSearch(result, result.node); |
| 134 | + } |
| 135 | + state.WorkListBackRefVisitExtraSearch(); |
| 136 | + return std::move(state.results); |
| 137 | +} |
| 138 | + |
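// IR node for a functional while loop. Its operands are laid out as
// [initial values..., trip count n, extra captured inputs...], and it lowers
// to an xla::While whose carried tuple holds the loop-carried values, the
// induction variable, the trip count, and the extra inputs.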
class XLAFunctionalWhileNode : public swift_xla::ir::Node {
 public:
  static std::vector<Value> BuildArgs(absl::Span<const Value> initial,
                                      const Value& n,
                                      absl::Span<const Value> extras) {
    std::vector<Value> out(initial.begin(), initial.end());
    out.push_back(n);
    out.insert(out.end(), extras.begin(), extras.end());
    return out;
  }
  static xla::hash_t HashOfResults(absl::Span<const Value> results) {
    xla::hash_t hash = 0;
    for (auto& result : results) {
      hash = xla::util::HashCombine(hash, result.hash());
    }
    return hash;
  }
  XLAFunctionalWhileNode(absl::Span<const Value> initial, const Value& n,
                         const Value& index_placeholder,
                         absl::Span<const Value> placeholders,
                         absl::Span<const Value> results)
      : Node(swift_xla::ir::OpKind(at::aten::functional_while),
             BuildArgs(
                 initial, n,
                 DiscoverExtraInputs(results, index_placeholder, placeholders)),
             ShapeOfXlaOpList(results), results.size(), HashOfResults(results)),
        index_placeholder_(index_placeholder),
        placeholders_(placeholders.begin(), placeholders.end()),
        results_(results.begin(), results.end()) {}

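  // Scalar 0 and 1 constants matching the element type of `op`; used to
  // initialize and increment the loop induction variable.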
  static xla::XlaOp zeroLike(xla::XlaOp op) {
    auto* b = op.builder();
    return xla::ConstantLiteral(
        b, xla::LiteralUtil::Zero(
               swift_xla::XlaHelpers::ShapeOfXlaOp(op).element_type()));
  }

  static xla::XlaOp oneLike(xla::XlaOp op) {
    auto* b = op.builder();
    return xla::ConstantLiteral(
        b, xla::LiteralUtil::One(
               swift_xla::XlaHelpers::ShapeOfXlaOp(op).element_type()));
  }

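  // Lowers the node to xla::While. The carried tuple is laid out as:
  //   [0, last_i)        loop-carried values (one per placeholder)
  //   last_i             induction variable i, starting at 0
  //   last_i + 1         trip count n
  //   [last_i + 2, end)  extra captured inputs, threaded through unchanged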
  XlaOpVector Lower(LoweringContext* loctx) const override {
    size_t last_i = placeholders_.size();

    auto body_builder = loctx->builder()->CreateSubBuilder("loop_body");
    xla::XlaOp initial;
    {
      std::vector<xla::XlaOp> args;
      args.reserve(operands().size() + 1);
      for (size_t i = 0; i < last_i; ++i) {
        args.push_back(loctx->GetOutputOp(operand(i)));
      }
      auto tmp = loctx->GetOutputOp(operand(last_i));  // Trip count n.
      auto it = zeroLike(tmp);                         // Induction variable.
      args.push_back(it);
      args.push_back(tmp);
      for (size_t i = last_i + 1; i < operands().size(); ++i) {
        args.push_back(loctx->GetOutputOp(operand(i)));
      }

      initial = xla::Tuple(loctx->builder(), args);
    }
    xla::XlaOp body_result;
    {
      auto* b = body_builder.get();
      // Pre-mark the placeholders and the extra inputs as emitted so the body
      // lowering reads them from the loop tuple instead of re-lowering them.
      swift_xla::ir::Util::EmissionMap emap;
      for (const auto& placeholder : placeholders_) {
        emap[placeholder.node.get()] = swift_xla::ir::Util::kEmitted;
      }
      for (size_t i = last_i + 1; i < operands().size(); ++i) {
        emap[operand(i).node] = swift_xla::ir::Util::kEmitted;
      }
      emap[index_placeholder_.node.get()] = swift_xla::ir::Util::kEmitted;
      swift_xla::ir::LoweringContext body_loctx(b, loctx->device(),
                                                std::move(emap));
      auto t = xla::Parameter(
          b, 0, swift_xla::XlaHelpers::ShapeOfXlaOp(initial), "tuple");
      auto p1 = xla::GetTupleElement(t, last_i);      // Induction variable i.
      auto p2 = xla::GetTupleElement(t, last_i + 1);  // Trip count n.
      for (size_t i = 0; i < placeholders_.size(); ++i) {
        body_loctx.AssignOutputOp(placeholders_[i], xla::GetTupleElement(t, i));
      }
      for (size_t i = last_i + 1; i < operands().size(); ++i) {
        body_loctx.AssignOutputOp(operand(i), xla::GetTupleElement(t, i + 1));
      }
      body_loctx.AssignOutputOp(index_placeholder_, p1);

      // Next iteration state: the new loop-carried values, i + 1, and the
      // unchanged trip count and extra inputs.
      std::vector<xla::XlaOp> tmps;
      for (auto& result : results_) {
        tmps.push_back(body_loctx.GetOutputOp(result));
      }
      tmps.push_back(p1 + oneLike(p1));
      tmps.push_back(p2);
      for (size_t i = last_i + 1; i < operands().size(); ++i) {
        tmps.push_back(body_loctx.GetOutputOp(operand(i)));
      }
      body_result = xla::Tuple(b, tmps);
    }

    auto cond_builder = loctx->builder()->CreateSubBuilder("cond_body");
    xla::XlaOp cond_result;
    {
      auto* b = cond_builder.get();
      auto t = xla::Parameter(
          b, 0, swift_xla::XlaHelpers::ShapeOfXlaOp(initial), "tuple");
      auto p1 = xla::GetTupleElement(t, last_i);
      auto p2 = xla::GetTupleElement(t, last_i + 1);
      cond_result = xla::Lt(p1, p2);  // Continue while i < n.
    }

    auto result = xla::While(
        cond_builder->Build(cond_result).ConsumeValueOrDie(),
        body_builder->Build(body_result).ConsumeValueOrDie(), initial);

    // Only the loop-carried values are returned; i, n, and the extra inputs
    // are internal to the loop.
    std::vector<xla::XlaOp> results;
    for (size_t i = 0; i < last_i; ++i) {
      results.push_back(xla::GetTupleElement(result, i));
    }
    return ReturnOps(results, loctx);
  }

  Value index_placeholder_;
  std::vector<Value> placeholders_;
  std::vector<Value> results_;
};

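// IR node standing in for a value that is only defined inside the loop body
// (the loop state or the index). It is never lowered directly; the while
// lowering above assigns its output from the loop tuple instead.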
class XLAPlaceholderNode : public swift_xla::ir::Node {
 public:
  XLAPlaceholderNode(xla::Shape shape, int id)
      : Node(swift_xla::ir::OpKind(at::aten::placeholder), {}, shape, 1,
             xla::util::MHash(id)),
        id_(id) {}
  NodePtr Clone(OpList operands) const override {
    return swift_xla::ir::MakeNode<XLAPlaceholderNode>(shape(), id_);
  }
  XlaOpVector Lower(LoweringContext* loctx) const override {
    LOG(FATAL) << "Cannot lower placeholder: " << ToString() << " id: " << id_;
  }
  std::string ToString() const override {
    std::stringstream ss;
    ss << Node::ToString() << ", id=" << id_;
    return ss.str();
  }
  int id_;
};

| 287 | +std::vector<Value> UnpackIrValues(OpaqueXLATensorArrayRef array) { |
| 288 | + std::vector<Value> out; |
| 289 | + out.reserve(array.size); |
| 290 | + for (size_t i = 0; i < array.size; ++i) { |
| 291 | + out.push_back(array.data[i]->GetIrValue()); |
| 292 | + } |
| 293 | + return out; |
| 294 | +} |
| 295 | + |
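// C entry point: builds the functional while node and wraps each of its
// outputs in a freshly allocated XLATensor. The caller takes ownership of the
// returned array and the tensors it contains.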
OpaqueXLATensorArrayRef XLATensor_functional_while(
    OpaqueXLATensor* n, OpaqueXLATensorArrayRef initial,
    OpaqueXLATensorArrayRef placeholders, OpaqueXLATensor* indexPlaceholder,
    OpaqueXLATensorArrayRef results) {
  auto initial_ir = UnpackIrValues(initial);
  auto placeholders_ir = UnpackIrValues(placeholders);
  auto results_ir = UnpackIrValues(results);

  auto result_node = swift_xla::ir::MakeNode<XLAFunctionalWhileNode>(
      initial_ir, n->GetIrValue(), indexPlaceholder->GetIrValue(),
      placeholders_ir, results_ir);
  size_t count = results.size;
  auto opaque_tensors = new OpaqueXLATensor*[count];
  for (size_t i = 0; i < count; ++i) {
    opaque_tensors[i] = new XLATensor(
        results.data[i]->CreateFrom(swift_xla::ir::Value(result_node, i)));
  }
  return {opaque_tensors, count};
}

OpaqueXLATensor* XLATensor_makePlaceholder(OpaqueXLATensor* t, int id) {
  return new XLATensor(t->CreateFrom(
      swift_xla::ir::MakeNode<XLAPlaceholderNode>(t->shape(), id)));
}