Commit a8a5156

_SwitchGrad
1 parent c8a61b2 commit a8a5156

File tree

1 file changed: +74 -67 lines changed


src/TensorFlowNET.Core/Gradients/control_flow_grad.cs

Lines changed: 74 additions & 67 deletions
@@ -45,7 +45,19 @@ public static Tensor[] _SwitchGrad(Operation op, Tensor[] grads)
             switch (op_ctxt)
             {
                 case WhileContext cwhile:
-                    throw new NotImplementedException("_SwitchGrad WhileContext");
+                    {
+                        var merge_grad = grad_ctxt.grad_state.switch_map.get(op);
+                        if (merge_grad != null)
+                            throw new NotImplementedException("_SwitchGrad merge_grad != null");
+                        else if (grads[0] != null)
+                        {
+                            merge_grad = merge(new[] { grads[0], grads[0] }, name: "b_switch")[0];
+                            grad_ctxt.grad_state.switch_map[op] = merge_grad;
+                            return new Tensor[] { merge_grad, null };
+                        }
+                        else
+                            return new Tensor[] { null, null };
+                    }
                 case CondContext ccond:
                     {
                         var zero_grad = grads[1 - op_ctxt.branch];
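
A note on the new WhileContext branch above: when backprop first reaches a Switch that sits inside a while loop, only the gradient coming from the loop's Exit (grads[0]) is known; the gradient contributed by the next iteration does not exist yet. The code therefore builds merge(grads[0], grads[0]) named "b_switch" as a placeholder and caches it in grad_ctxt.grad_state.switch_map so the same Merge can be looked up again once the backprop loop body is built (the already-cached case is still left as NotImplementedException in this commit). The following is a minimal, self-contained sketch of that caching pattern; FakeOp, FakeTensor and GradForSwitch are hypothetical stand-ins, not TensorFlow.NET types.

    using System;
    using System.Collections.Generic;

    // Hypothetical stand-ins for illustration only; not the TensorFlow.NET types.
    class FakeOp { public string Name; public FakeOp(string name) { Name = name; } }
    class FakeTensor { public string Name; public FakeTensor(string name) { Name = name; } }

    static class SwitchGradSketch
    {
        // Mirrors grad_ctxt.grad_state.switch_map: one backprop Merge per forward Switch.
        static readonly Dictionary<FakeOp, FakeTensor> switch_map = new Dictionary<FakeOp, FakeTensor>();

        static FakeTensor Merge(FakeTensor a, FakeTensor b, string name)
            => new FakeTensor($"{name}({a.Name},{b.Name})");

        // First visit: build Merge(grad, grad) as a placeholder for the not-yet-built
        // next-iteration gradient and cache it. On a repeat visit the real gradient code
        // would attach the new gradient to the cached Merge (the commit above still
        // throws for that case); the sketch simply returns the cached tensor.
        public static FakeTensor GradForSwitch(FakeOp switchOp, FakeTensor exitGrad)
        {
            if (switch_map.TryGetValue(switchOp, out var cached))
                return cached;

            var mergeGrad = Merge(exitGrad, exitGrad, "b_switch");
            switch_map[switchOp] = mergeGrad;
            return mergeGrad;
        }

        static void Main()
        {
            var sw = new FakeOp("while/Switch");
            var g = GradForSwitch(sw, new FakeTensor("exit_grad"));
            Console.WriteLine(g.Name);   // prints: b_switch(exit_grad,exit_grad)
        }
    }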
@@ -74,7 +86,7 @@ public static Tensor[] _SwitchGrad(Operation op, Tensor[] grads)
         /// <param name="inputs"></param>
         /// <param name="name"></param>
         /// <returns></returns>
-        internal static Tensor[] merge(Tensor[] inputs, string name = null)
+        internal static MergeOutput merge(Tensor[] inputs, string name = null)
         {
             return tf_with(ops.name_scope(name, "Merge", inputs), scope =>
             {
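
merge now returns MergeOutput instead of Tensor[], yet the WhileContext hunk above still writes merge(...)[0], so MergeOutput evidently exposes an indexer (or similar) over the merged output and the value index. The class itself is defined elsewhere in TensorFlowNET.Core and is not part of this diff; the sketch below is only a guess at the minimal shape such a wrapper needs to keep that call site compiling, with hypothetical member names.

    // Hypothetical sketch only; the real MergeOutput lives elsewhere in the repo
    // and may expose different members. It merely has to keep merge(...)[0] legal.
    public class MergeOutputSketch
    {
        public Tensor output { get; }       // the merged tensor (index 0)
        public Tensor value_index { get; }  // which input was forwarded (index 1)

        public MergeOutputSketch(Tensor output, Tensor value_index)
        {
            this.output = output;
            this.value_index = value_index;
        }

        // Indexer so call sites such as merge(...)[0] keep working after the
        // return type change from Tensor[] to MergeOutput.
        public Tensor this[int index] => index == 0 ? output : value_index;
    }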
@@ -146,7 +158,7 @@ public static Tensor[] _MergeGrad(Operation op, Tensor[] grads)
         }

         [RegisterGradient("RefMerge")]
-        public Tensor[] _RefMergeGrad(Operation op, Tensor[] grads)
+        public static Tensor[] _RefMergeGrad(Operation op, Tensor[] grads)
         {
             return _MergeGrad(op, grads);
         }
@@ -155,43 +167,32 @@ public Tensor[] _RefMergeGrad(Operation op, Tensor[] grads)
         /// Gradients for an exit op are calculated using an Enter op.
         /// </summary>
         [RegisterGradient("Exit")]
-        public Tensor[] _ExitGrad(Operation op, Tensor[] grads)
+        public static Tensor[] _ExitGrad(Operation op, Tensor[] grads)
         {
-            throw new NotImplementedException("_ExitGrad");
-            // graph = ops.get_default_graph()
-            //# pylint: disable=protected-access
-            // op_ctxt = op._get_control_flow_context()
-            // grad_ctxt = graph._get_control_flow_context()
-            // # pylint: enable=protected-access
-            // if not grad_ctxt.back_prop:
-            //   # The flag `back_prop` is set by users to suppress gradient
-            //   # computation for this loop. If the attribute `back_prop` is false,
-            //   # no gradient computation.
-            //   return None
+            var grad = grads[0];
+            var graph = ops.get_default_graph();
+            var op_ctxt = op._get_control_flow_context();
+            var grad_ctxt = graph._get_control_flow_context() as WhileContext;
+            // The flag `back_prop` is set by users to suppress gradient
+            // computation for this loop. If the attribute `back_prop` is false,
+            // no gradient computation.
+            if (!grad_ctxt.back_prop)
+                return null;
+
+            if (op_ctxt.grad_state != null)
+                throw new TypeError("Second-order gradient for while loops not supported.");
+
+            grad_ctxt.AddName(grad.name);

-            // if op_ctxt.grad_state:
-            //   raise TypeError("Second-order gradient for while loops not supported.")
+            grad_ctxt.Enter();
+            var result = control_flow_ops._Enter(
+                grad, grad_ctxt.name, is_constant: false,
+                parallel_iterations: grad_ctxt.parallel_iterations,
+                name: "b_exit");

-            // if isinstance(grad, ops.Tensor) :
-            //   grad_ctxt.AddName(grad.name)
-            // else:
-            //   if not isinstance(grad, (ops.IndexedSlices, sparse_tensor.SparseTensor)):
-            //     raise TypeError("Type %s not supported" % type(grad))
-            //   grad_ctxt.AddName(grad.values.name)
-            //   grad_ctxt.AddName(grad.indices.name)
-            //   dense_shape = grad.dense_shape
-            //   if dense_shape is not None:
-            //     grad_ctxt.AddName(dense_shape.name)
-            // grad_ctxt.Enter()
-            // # pylint: disable=protected-access
-            // result = control_flow_ops._Enter(
-            //     grad, grad_ctxt.name, is_constant=False,
-            //     parallel_iterations=grad_ctxt.parallel_iterations,
-            //     name="b_exit")
-            // # pylint: enable=protected-access
-            // grad_ctxt.loop_enters.append(result)
-            // grad_ctxt.Exit()
-            // return result
+            grad_ctxt.loop_enters.append(result);
+            grad_ctxt.Exit();
+            return new[] { result };
         }

         /// <summary>
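
_ExitGrad is now implemented rather than throwing, and it follows the usual TensorFlow while-loop gradient construction: each forward control-flow op gets a dual op in the backprop loop, so the gradient of an Exit is an Enter (named "b_exit") into the gradient loop, guarded by the back_prop flag and the second-order check above. A small illustrative sketch of that forward-to-backprop pairing, assuming the standard TensorFlow scheme; the dictionary and names below are explanatory, not part of the library.

    using System;
    using System.Collections.Generic;

    // Illustrative only: the forward-op -> backprop-op duality that the gradient
    // functions in this file implement (standard TensorFlow while-loop scheme).
    static class WhileLoopGradDuality
    {
        static readonly Dictionary<string, string> Dual = new Dictionary<string, string>
        {
            ["Exit"] = "Enter",             // _ExitGrad builds "b_exit" via control_flow_ops._Enter
            ["Enter"] = "Exit",             // _EnterGrad calls control_flow_ops.exit for loop variables
            ["NextIteration"] = "Identity", // _NextIterationGrad passes grads straight through
            ["Switch"] = "Merge",           // _SwitchGrad builds "b_switch" via merge
            ["Merge"] = "Switch",           // _MergeGrad (unchanged in this commit) builds a Switch
        };

        static void Main()
        {
            foreach (var pair in Dual)
                Console.WriteLine($"{pair.Key,-13} -> {pair.Value}");
        }
    }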
@@ -200,15 +201,15 @@ public Tensor[] _ExitGrad(Operation op, Tensor[] grads)
         /// Note that the backprop next_iteration is added in switch grad.
         /// </summary>
         [RegisterGradient("NextIteration")]
-        public Tensor[] _NextIterationGrad(object _, Tensor[] grad)
+        public static Tensor[] _NextIterationGrad(Operation op, Tensor[] grads)
         {
-            return grad;
+            return grads;
         }

         [RegisterGradient("RefNextIteration")]
-        public Tensor[] _RefNextIterationGrad(object _, Tensor[] grad)
+        public static Tensor[] _RefNextIterationGrad(Operation op, Tensor[] grads)
         {
-            return grad;
+            return grads;
         }

         /// <summary>
@@ -218,33 +219,39 @@ public Tensor[] _RefNextIterationGrad(object _, Tensor[] grad)
         /// For loop invariants, we need to add an accumulator loop.
         /// </summary>
         [RegisterGradient("Enter")]
-        public Tensor[] _EnterGrad(Tensor op, Tensor[] grad)
+        public static Tensor[] _EnterGrad(Operation op, Tensor[] grads)
         {
-            throw new NotImplementedException("_EnterGrad");
-            // graph = ops.get_default_graph()
-            //# pylint: disable=protected-access
-            // grad_ctxt = graph._get_control_flow_context()
-            // # pylint: enable=protected-access
-            // if not grad_ctxt.back_prop:
-            //   # Skip gradient computation, if the attribute `back_prop` is false.
-            //   return grad
-            // if grad_ctxt.grad_state is None:
-            //   # Pass the gradient through if we are not in a gradient while context.
-            //   return grad
-            // if op.get_attr("is_constant"):
-            //   # Add a gradient accumulator for each loop invariant.
-            //   if isinstance(grad, ops.Tensor) :
-            //     result = grad_ctxt.AddBackpropAccumulator(op, grad)
-            //   elif isinstance(grad, ops.IndexedSlices) :
-            //     result = grad_ctxt.AddBackpropIndexedSlicesAccumulator(op, grad)
-            //   else:
-            //     # TODO(yuanbyu, lukasr): Add support for SparseTensor.
-            //     raise TypeError("Type %s not supported" % type(grad))
-            // else:
-            //   result = exit(grad)
-            // grad_ctxt.loop_exits.append(result)
-            // grad_ctxt.ExitResult([result])
-            // return result
+            Tensor result = null;
+            var grad = grads[0];
+            var graph = ops.get_default_graph();
+            var grad_ctxt = graph._get_control_flow_context() as WhileContext;
+            if (!grad_ctxt.back_prop)
+                // Skip gradient computation, if the attribute `back_prop` is false.
+                return grads;
+            if (grad_ctxt.grad_state == null)
+                // Pass the gradient through if we are not in a gradient while context.
+                return grads;
+            if (op.get_attr<bool>("is_constant"))
+            {
+                throw new NotImplementedException("_EnterGrad is_constant");
+                // Add a gradient accumulator for each loop invariant.
+                // if isinstance(grad, ops.Tensor) :
+                //   result = grad_ctxt.AddBackpropAccumulator(op, grad)
+                // elif isinstance(grad, ops.IndexedSlices) :
+                //   result = grad_ctxt.AddBackpropIndexedSlicesAccumulator(op, grad)
+                // else:
+                //   # TODO(yuanbyu, lukasr): Add support for SparseTensor.
+                //   raise TypeError("Type %s not supported" % type(grad))
+            }
+
+            else
+            {
+                result = control_flow_ops.exit(grad);
+                grad_ctxt.loop_exits.append(result);
+                grad_ctxt.ExitResult(new[] { result });
+            }
+
+            return new Tensor[] { result };
         }

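Finally, the rewritten _EnterGrad boils down to three outcomes: pass the incoming gradient through when back_prop is off or when we are not inside a gradient while-context, hit the still-unimplemented accumulator path for loop invariants (is_constant), and otherwise leave the gradient loop through control_flow_ops.exit. A compact, self-contained restatement of that decision order, using hypothetical boolean inputs in place of the real context and attribute lookups:

    using System;

    // Hypothetical restatement of the branch order in _EnterGrad; the booleans stand in
    // for grad_ctxt.back_prop, grad_ctxt.grad_state and op.get_attr<bool>("is_constant").
    enum EnterGradOutcome { PassThrough, AccumulatorNotImplemented, ExitGradientLoop }

    static class EnterGradDecision
    {
        public static EnterGradOutcome Decide(bool backProp, bool inGradWhileContext, bool isConstant)
        {
            if (!backProp)
                return EnterGradOutcome.PassThrough;               // return grads;
            if (!inGradWhileContext)
                return EnterGradOutcome.PassThrough;               // return grads;
            if (isConstant)
                return EnterGradOutcome.AccumulatorNotImplemented; // NotImplementedException today
            return EnterGradOutcome.ExitGradientLoop;              // control_flow_ops.exit(grad)
        }

        static void Main()
        {
            // Typical case: a loop variable inside a backprop-enabled gradient while-context.
            Console.WriteLine(Decide(backProp: true, inGradWhileContext: true, isConstant: false));
            // prints: ExitGradientLoop
        }
    }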