@@ -14,13 +14,20 @@ You may obtain a copy of the License at
 limitations under the License.
 ******************************************************************************/

+using System;
+using System.Linq;
+using System.Collections.Generic;
+using util = Tensorflow.control_flow_util;
+using static Tensorflow.Binding;
+
 namespace Tensorflow.Operations.ControlFlows
 {
     /// <summary>
     /// Maintain the mapping from the loops to their grad states.
     /// </summary>
     public class ControlFlowState
     {
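+        // Maps each forward while-loop context to the GradLoopState holding its gradient state.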
+        Dictionary<ControlFlowContext, GradLoopState> _map;
         //class ControlFlowState(object):
         //  """Maintain the mapping from the loops to their grad states."""

@@ -40,51 +47,67 @@ public class ControlFlowState
         //      return self._map.get(forward_ctxt)
         //    return None

-        //  def ProcessUnusedLoopExits(self, pending_count, to_ops_set):
-        //    """Process all the "unused" loop exits.
-
-        //    The "unused" exits of the loops are added to `unused_exits`. An exit is
-        //    unused if its pending_count is 0. If there is an exit with real gradient,
-        //    all these deferred exits will enter the backprop loop with zero gradient.
-        //    Otherwise, they will enter the backprop loop with None. As an example,
-        //    people often write:
-
-        //    ```python
-        //    v1, _ = tf.while_loop(p, b, [x1, x2])
-        //    result = gradients(v1, x1)
-        //    ```
-
-        //    The exit node for x2 is not included by the betweenness analysis. But we
-        //    need to backprop x2 if x2 is involved in computing v1.
-
-        //    Args:
-        //      pending_count: The number of backprop inputs for every op.
-        //      to_ops_set: The set of ops for ys in gradients(ys, xs)
-
-        //    Returns:
-        //      The set of unused loop exits that we know at this point we need
-        //      to backprop.
-        //    """
-        //    loop_exits = []
-        //    for grad_state in self._map.values():
-        //      for y in grad_state.forward_loop_exits:
-        //        if pending_count[y.op] == 0:
-        //          grad_state.pending_exits_count -= 1
-        //          if y.op not in to_ops_set:
-        //            grad_state.unused_exits.append(y)
-        //          if grad_state.pending_exits_count == 0:
-        //            loop_exits.extend(grad_state.unused_exits)
-        //      # Need to include Enters in backprop for higher-order gradients.
-        //      for y in grad_state.forward_context.loop_enters:
-        //        if pending_count[y.op] == 0:
-        //          pending_count[y.op] = 1
-        //    return loop_exits
-
-        //  def EnterGradWhileContext(self, op, before):
-        //    """Enter the WhileContext for gradient computation."""
-        //    grad_state = self.GetGradState(op, before)
-        //    if grad_state:
-        //      grad_state.grad_context.Enter()
+        public ControlFlowState()
+        {
+            _map = new Dictionary<ControlFlowContext, GradLoopState>();
+        }
+
+        /// <summary>
+        /// Return the grad state for this op if it's in a forward loop context.
+        /// </summary>
+        /// <param name="op"></param>
+        /// <param name="before"></param>
+        /// <returns></returns>
+        public GradLoopState GetGradState(Operation op, bool before)
+        {
+            ControlFlowContext forward_ctxt = null;
+            if (before && util.IsLoopExit(op))
+            {
+                forward_ctxt = op._get_control_flow_context();
+                forward_ctxt = forward_ctxt.outer_context;
+                if (forward_ctxt != null)
+                    forward_ctxt = forward_ctxt.GetWhileContext();
+            }
+            else
+                forward_ctxt = util.GetWhileContext(op);
+            if (forward_ctxt != null)
+                return _map.get(forward_ctxt);
+            return null;
+        }
+
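+        /// <summary>
+        /// Process all the "unused" loop exits. An exit is unused if its
+        /// pending_count is 0. If there is an exit with a real gradient, all of
+        /// these deferred exits will enter the backprop loop with zero gradient;
+        /// otherwise they will enter the backprop loop with None.
+        /// </summary>
+        /// <param name="pending_count">The number of backprop inputs for every op.</param>
+        /// <param name="to_ops_set">The set of ops for ys in gradients(ys, xs).</param>
+        /// <returns>The set of unused loop exits that we know at this point we need to backprop.</returns>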
+        public Tensor[] ProcessUnusedLoopExits(Dictionary<string, int> pending_count, List<Operation> to_ops_set)
+        {
+            var loop_exits = new List<Tensor>();
+            foreach (var grad_state in _map.Values)
+            {
+                foreach (var y in grad_state.forward_loop_exits)
+                {
+                    if (!pending_count.ContainsKey(y.op.name))
+                    {
+                        grad_state.pending_exits_count -= 1;
+                        if (!to_ops_set.Contains(y.op))
+                            grad_state.unused_exits.append(y);
+                        if (grad_state.pending_exits_count == 0)
+                            loop_exits.extend(grad_state.unused_exits);
+                    }
+                }
+
+                // Need to include Enters in backprop for higher-order gradients.
+                foreach (var y in grad_state.forward_context.loop_enters)
+                {
+                    if (!pending_count.ContainsKey(y.op.name))
+                        pending_count[y.op.name] = 1;
+                }
+            }
+
+            return loop_exits.ToArray();
+        }
+
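+        /// <summary>
+        /// Enter the WhileContext for gradient computation.
+        /// </summary>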
+        public void EnterGradWhileContext(Operation op, bool before)
+        {
+            var grad_state = GetGradState(op, before);
+            if (grad_state != null)
+                grad_state.grad_context.Enter();
+        }

         //  def ExitGradWhileContext(self, op, before):
         //    """Exit the WhileContext for gradient computation."""
@@ -118,6 +141,32 @@ public class ControlFlowState
         //        if loop_exit.op not in between_ops:
         //          between_ops.add(loop_exit.op)
         //          between_op_list.append(loop_exit.op)
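+        /// <summary>
+        /// Add the grad state for the while loop that op belongs to, creating it if
+        /// it does not already exist and including all of the loop's exits in the
+        /// between-ops needed for backprop.
+        /// </summary>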
+        public void AddWhileContext(Operation op, List<Operation> between_op_list, List<Operation> between_ops)
+        {
+            var forward_ctxt = op.GetWhileContext();
+            var grad_state = _map.ContainsKey(forward_ctxt) ? _map[forward_ctxt] : null;
+            if (grad_state == null)
+            {
+                GradLoopState outer_grad_state = null;
+                var outer_forward_ctxt = forward_ctxt.outer_context;
+                if (outer_forward_ctxt != null)
+                    outer_forward_ctxt = outer_forward_ctxt.GetWhileContext();
+                if (outer_forward_ctxt != null)
+                    outer_grad_state = _map[outer_forward_ctxt];
+                grad_state = new GradLoopState(forward_ctxt, outer_grad_state);
+                _map[forward_ctxt] = grad_state;
+
+                // We need to include all exits of a loop for backprop.
+                foreach (var loop_exit in grad_state.forward_loop_exits)
+                {
+                    if (!between_ops.Contains(loop_exit.op))
+                    {
+                        between_ops.add(loop_exit.op);
+                        between_op_list.append(loop_exit.op);
+                    }
+                }
+            }
+        }

         //  def ZerosLikeForExit(self, val):
         //    """Create zeros_like gradient for a loop exit.
@@ -174,70 +223,69 @@ public class ControlFlowState
         //        result = array_ops.zeros_like(val, optimize=False)
         //    return result

-        //  def ZerosLike(self, op, index):
-        //    """Create zeros_like for the specified output of an op.
-
-        //    If op is in a while loop that is part of gradients(), this method
-        //    must be called in its grad loop context.
-
-        //    Args:
-        //      op: A tensorflow operation.
-        //      index: the index for a specific output of the op.
-
-        //    Returns:
-        //      A zero tensor of the same shape of op.outputs[index].
-        //    """
-        //    if util.IsLoopSwitch(op):
-        //      return None
-        //    if op.graph._building_function:  # pylint: disable=protected-access
-        //      # The optimization here is tricky to apply to functions
-        //      return array_ops.zeros_like(op.outputs[index])
-        //    dead_branch = util.IsSwitch(op)
-        //    forward_ctxt = _GetWhileContext(op)
-        //    grad_state = self._map.get(forward_ctxt)
-        //    if grad_state is None:
-        //      # op is not in a while loop that is part of gradients().
-        //      return ZerosLikeOutsideLoop(op, index)
-        //    op_ctxt = op._get_control_flow_context()
-        //    val = ops.convert_to_tensor(op.outputs[index], name="tensor")
-        //    shape = val.get_shape()
-        //    if shape.is_fully_defined():
-        //      # If the shape is known statically, just create a zero tensor with
-        //      # the right shape in the grad loop context.
-        //      result = constant_op.constant(0, shape=shape.dims, dtype=val.dtype)
-        //      if dead_branch:
-        //        # op is a cond switch. Guard the zero tensor with a switch.
-        //        pred = grad_state.history_map.get(op_ctxt.pred.name)
-        //        branch = op_ctxt.branch
-        //        result = _SwitchRefOrTensor(result, pred)[1 - branch]
-        //    else:
-        //      # Unknown shape so keep a history of the shape at runtime.
-        //      if dead_branch:
-        //        # Need to add a special switch to guard the value.
-        //        pred = op_ctxt.pred
-        //        branch = op_ctxt.branch
-        //        op_ctxt.outer_context.Enter()
-        //        val = _SwitchRefOrTensor(op.inputs[0], pred)[1 - branch]
-        //        zeros_shape = array_ops.shape_internal(val, optimize=False)
-        //        op_ctxt.outer_context.Exit()
-        //        val.op._set_control_flow_context(op_ctxt)
-        //        zeros_shape.op._set_control_flow_context(op_ctxt)
-        //      else:
-        //        op_ctxt.Enter()
-        //        zeros_shape = array_ops.shape_internal(val, optimize=False)
-        //        op_ctxt.Exit()
-
-        //    # Add forward accumulator for shape.
-        //    grad_state.grad_context.Exit()
-        //    history_zeros_shape = grad_state.AddForwardAccumulator(
-        //        zeros_shape, dead_branch=dead_branch)
-        //    grad_state.grad_context.Enter()
-
-        //    # Create a zero tensor with the right shape.
-        //    shape = grad_state.AddBackpropAccumulatedValue(history_zeros_shape,
-        //                                                   zeros_shape, dead_branch)
-        //    result = array_ops.zeros(shape, val.dtype)
-        //    return result
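+        /// <summary>
+        /// Create zeros_like for the specified output of an op. If op is in a while
+        /// loop that is part of gradients(), this method must be called in its grad
+        /// loop context.
+        /// </summary>
+        /// <param name="op">A tensorflow operation.</param>
+        /// <param name="index">The index for a specific output of the op.</param>
+        /// <returns>A zero tensor of the same shape as op.outputs[index].</returns>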
+        public Tensor ZerosLike(Operation op, int index)
+        {
+            if (util.IsLoopSwitch(op))
+                return null;
+            if (op.graph.building_function)
+                return array_ops.zeros_like(op.outputs[index]);
+            var dead_branch = util.IsSwitch(op);
+            var forward_ctxt = util.GetWhileContext(op);
+            var grad_state = _map.get(forward_ctxt);
+            // op is not in a while loop that is part of gradients().
+            if (grad_state == null)
+                return ZerosLikeOutsideLoop(op, index);
+            throw new NotImplementedException("ZerosLike");
+        }
+
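+        /// <summary>
+        /// Create a zeros_like gradient for the specified output of an op that is
+        /// not in a while loop being differentiated.
+        /// </summary>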
+        public Tensor ZerosLikeOutsideLoop(Operation op, int index)
+        {
+            var val = op.outputs[index];
+            if (!util.IsSwitch(op))
+            {
+                if (val.dtype == dtypes.resource)
+                    throw new NotImplementedException("ZerosLikeOutsideLoop");
+                /*return array_ops.zeros(
+                    gen_resource_variable_ops.variable_shape(val),
+                    dtype: default_gradient.get_zeros_dtype(val));*/
+                return array_ops.zeros_like(val, optimize: false);
+            }
+            else
+                throw new NotImplementedException("ZerosLikeOutsideLoop");
+        }
+
+        /// <summary>
+        /// Create zeros_like gradient for a loop exit.
+        /// </summary>
+        /// <param name="val"></param>
+        /// <returns></returns>
+        public Tensor ZerosLikeForExit(Tensor val)
+        {
+            Tensor result = null;
+            var val_shape = val.TensorShape;
+            var forward_ctxt = val.op._get_control_flow_context();
+            var outer_forward_ctxt = forward_ctxt.outer_context;
+            if (outer_forward_ctxt != null)
+                outer_forward_ctxt = outer_forward_ctxt.GetWhileContext();
+            GradLoopState outer_grad_state = null;
+            if (outer_forward_ctxt != null)
+                outer_grad_state = _map.get(outer_forward_ctxt);
+            // This is a nested loop.
+            if (outer_grad_state != null)
+            {
+                throw new NotImplementedException("ZerosLikeForExit");
+            }
+            else
+            {
+                // If the shape is known statically, just create a zero tensor
+                // with the right shape.
+                if (val_shape.is_fully_defined())
+                    result = array_ops.zeros(val_shape.dims, val.dtype);
+                else
+                    result = array_ops.zeros_like(val, optimize: false);
+            }
+            return result;
+        }

         //  def PostProcessing(self):
         //    """Perform postprocessing at the end of gradients().