BasicLSTMCell

Oceania2018 · Oceania2018 · commit a70077bbb479 · 2019-11-23T09:21:12.000-06:00
diff --git a/src/TensorFlowNET.Core/APIs/tf.math.cs b/src/TensorFlowNET.Core/APIs/tf.math.cs
@@ -251,7 +251,7 @@ public Tensor _clip_by_value(Tensor t, Tensor clip_value_min, Tensor clip_value_
         ///    greater than <c>clip_value_max</c> are set to <c>clip_value_max</c>.
         /// </remarks>
         public Tensor clip_by_value (Tensor t, Tensor clip_value_min, Tensor clip_value_max, string name = "ClipByValue") 
-            => gen_ops.clip_by_value(t, clip_value_min, clip_value_max, name);
+            => clip_ops.clip_by_value(t, clip_value_min, clip_value_max, name);
 
         public Tensor sub(Tensor a, Tensor b) 
             => gen_math_ops.sub(a, b);
diff --git a/src/TensorFlowNET.Core/Framework/tensor_shape.cs b/src/TensorFlowNET.Core/Framework/tensor_shape.cs
@@ -24,6 +24,16 @@ public static void assert_is_compatible_with(this Tensor self, Tensor other)
             }
         }
 
+        /// <summary>Wraps axis <paramref name="index"/> of <paramref name="shape"/> in a Dimension; a negative rank yields Dimension(-1).</summary>
+        public static Dimension dimension_at_index(TensorShape shape, int index)
+        {
+            if (shape.rank < 0) return new Dimension(-1);
+            return new Dimension(shape.dims[index]);
+        }
+
+        /// <summary>Returns the <c>value</c> member of <paramref name="dimension"/>.</summary>
+        public static int dimension_value(Dimension dimension) => dimension.value;
+
         public static TensorShape as_shape(this Shape shape)
              => new TensorShape(shape.Dimensions);
     }
diff --git a/src/TensorFlowNET.Core/Operations/NnOps/BasicLSTMCell.cs b/src/TensorFlowNET.Core/Operations/NnOps/BasicLSTMCell.cs
@@ -0,0 +1,57 @@
+﻿using System;
+using System.Collections.Generic;
+using System.Linq;
+using System.Text;
+using System.Threading.Tasks;
+using static Tensorflow.Binding;
+using Tensorflow.Operations.Activation;
+using Tensorflow.Keras.Engine;
+using Tensorflow.Operations;
+
+namespace Tensorflow
+{
+    /// <summary>
+    /// Basic LSTM recurrent network cell.
+    /// The implementation is based on: http://arxiv.org/abs/1409.2329.
+    /// </summary>
+    public class BasicLSTMCell : LayerRnnCell
+    {
+        readonly int _num_units;
+        readonly float _forget_bias;
+        readonly bool _state_is_tuple;
+        readonly IActivation _activation;
+
+        /// <summary>
+        /// Initialize the basic LSTM cell.
+        /// </summary>
+        /// <param name="num_units">The number of units in the LSTM cell.</param>
+        /// <param name="forget_bias">Forget bias, stored as given; defaults to 1.0.</param>
+        /// <param name="state_is_tuple">When true, <c>state_size</c> is the pair (num_units, num_units); otherwise the single value 2 * num_units.</param>
+        /// <param name="activation">Activation to store; <c>tf.nn.tanh()</c> is used when this is null.</param>
+        /// <param name="reuse">Forwarded unchanged to the base constructor.</param>
+        /// <param name="name">Forwarded unchanged to the base constructor.</param>
+        /// <param name="dtype">Forwarded unchanged to the base constructor.</param>
+        public BasicLSTMCell(int num_units, float forget_bias = 1.0f, bool state_is_tuple = true,
+            IActivation activation = null, bool? reuse = null, string name = null,
+            TF_DataType dtype = TF_DataType.DtInvalid) : base(_reuse: reuse, name: name, dtype: dtype)
+        {
+            input_spec = new InputSpec(ndim: 2);
+            _num_units = num_units;
+            _forget_bias = forget_bias;
+            _state_is_tuple = state_is_tuple;
+
+            // No activation supplied: fall back to tanh.
+            _activation = activation ?? tf.nn.tanh();
+        }
+
+        /// <summary>
+        /// Overrides the virtual base property so calls made through the base type reach this cell.
+        /// </summary>
+        public override LSTMStateTuple state_size
+        {
+            get => _state_is_tuple
+                ? new LSTMStateTuple(_num_units, _num_units)
+                : (LSTMStateTuple)(2 * _num_units);
+        }
+    }
+}
diff --git a/src/TensorFlowNET.Core/Operations/NnOps/BasicRNNCell.cs b/src/TensorFlowNET.Core/Operations/NnOps/BasicRNNCell.cs
@@ -16,6 +16,7 @@ limitations under the License.
 
 using System;
 using Tensorflow.Keras.Engine;
+using Tensorflow.Operations;
 using static Tensorflow.Binding;
 
 namespace Tensorflow
@@ -25,7 +26,7 @@ public class BasicRnnCell : LayerRnnCell
         int _num_units;
         Func<Tensor, string, Tensor> _activation;
 
-        public override int state_size => _num_units;
+        public override LSTMStateTuple state_size => _num_units;
         public override int output_size => _num_units;
         public VariableV1 _kernel;
         string _WEIGHTS_VARIABLE_NAME = "kernel";
diff --git a/src/TensorFlowNET.Core/Operations/NnOps/LSTMStateTuple.cs b/src/TensorFlowNET.Core/Operations/NnOps/LSTMStateTuple.cs
@@ -0,0 +1,41 @@
+﻿using System;
+using System.Collections.Generic;
+using System.Text;
+
+namespace Tensorflow.Operations
+{
+    /// <summary>
+    /// Pair of integers `(c, h)`, stored in that order, that RNN and LSTM cells
+    /// use as the type of their `state_size`.
+    /// 
+    /// A single int converts implicitly into a tuple holding it as `c`, and a
+    /// tuple converts implicitly back into an int by yielding `c`; `h` has no
+    /// reader in this class.
+    /// </summary>
+    public class LSTMStateTuple
+    {
+        // The two stored components.
+        int c;
+        int h;
+
+        /// <summary>
+        /// Creates a tuple from c alone; h keeps its default value of 0.
+        /// </summary>
+        public LSTMStateTuple(int c) => this.c = c;
+
+        /// <summary>
+        /// Creates a tuple from both components.
+        /// </summary>
+        public LSTMStateTuple(int c, int h) : this(c) => this.h = h;
+
+        /// <summary>
+        /// Yields the c component of the tuple.
+        /// </summary>
+        public static implicit operator int(LSTMStateTuple tuple) => tuple.c;
+
+        /// <summary>
+        /// Wraps an int using the single-argument constructor.
+        /// </summary>
+        public static implicit operator LSTMStateTuple(int c) => new LSTMStateTuple(c);
+    }
+}
diff --git a/src/TensorFlowNET.Core/Operations/NnOps/LayerRNNCell.cs b/src/TensorFlowNET.Core/Operations/NnOps/LayerRNNCell.cs
diff --git a/src/TensorFlowNET.Core/Operations/NnOps/RNNCell.cs b/src/TensorFlowNET.Core/Operations/NnOps/RNNCell.cs
@@ -49,7 +49,7 @@ public abstract class RnnCell : Layers.Layer
         /// difference between TF and Keras RNN cell.
         /// </summary>
         protected bool _is_tf_rnn_cell = false;
-        public virtual int state_size { get; }
+        public virtual LSTMStateTuple state_size { get; }
 
         public virtual int output_size { get; }
 
diff --git a/src/TensorFlowNET.Core/Operations/NnOps/rnn.cs b/src/TensorFlowNET.Core/Operations/NnOps/rnn.cs
@@ -18,13 +18,106 @@ limitations under the License.
 using System;
 using System.Collections.Generic;
 using System.Linq;
+using Tensorflow.Framework;
 using Tensorflow.Util;
 using static Tensorflow.Binding;
 
 namespace Tensorflow.Operations
 {
-    internal class rnn
+    public class rnn
     {
+        /// <summary>
+        /// Creates a bidirectional recurrent neural network. NOTE(review): as written only the forward pass runs (cell_bw and initial_state_bw are never read) and nothing is returned.
+        /// </summary>
+        public static void static_bidirectional_rnn(BasicLSTMCell cell_fw, 
+            BasicLSTMCell cell_bw,
+            Tensor[] inputs,
+            Tensor initial_state_fw = null,
+            Tensor initial_state_bw = null,
+            TF_DataType dtype = TF_DataType.DtInvalid,
+            Tensor sequence_length = null,
+            string scope = null)
+        {
+            if (inputs == null || inputs.Length == 0)
+                throw new ValueError("inputs must not be empty");
+
+            tf_with(tf.variable_scope(scope ?? "bidirectional_rnn"), delegate
+            {
+                // Forward direction: run static_rnn on cell_fw inside the nested "fw" variable scope.
+                tf_with(tf.variable_scope("fw"), fw_scope =>
+                {
+                    static_rnn(
+                      cell_fw,
+                      inputs,
+                      initial_state_fw,
+                      dtype,
+                      sequence_length,
+                      scope: fw_scope);
+                });
+            });
+        }
+
+        public static void static_rnn(BasicLSTMCell cell,
+            Tensor[] inputs,
+            Tensor initial_state,
+            TF_DataType dtype = TF_DataType.DtInvalid,
+            Tensor sequence_length = null,
+            VariableScope scope = null)
+        {
+            // Void and incomplete as written: nothing computed below is returned, and sequence_length is never read.
+            // Intended (per the original comment): a scope whose caching device comes from the parent
+            // scope or matches the RNN's placement - NOTE(review): no caching device is set in the visible code.
+            if (scope == null)
+                tf_with(tf.variable_scope("rnn"), varscope =>
+                {
+                    throw new NotImplementedException("static_rnn"); // the scope == null path is not implemented yet
+                });
+            else
+                tf_with(tf.variable_scope(scope), varscope =>
+                {
+                    Dimension fixed_batch_size = null;
+                    Dimension batch_size = null;
+                    Tensor batch_size_tensor = null;
+
+                    // Use the first element of inputs to determine the batch dimension.
+                    var first_input = inputs[0];
+                    if (first_input.TensorShape.rank != 1)
+                    {
+                        var input_shape = first_input.TensorShape.with_rank_at_least(2);
+                        fixed_batch_size = input_shape.dims[0];
+                        var flat_inputs = nest.flatten2(inputs);
+                        foreach (var flat_input in flat_inputs)
+                        {
+                            input_shape = flat_input.TensorShape.with_rank_at_least(2);
+                            batch_size = tensor_shape.dimension_at_index(input_shape, 0);
+                            var input_size = input_shape[1];
+                            fixed_batch_size.merge_with(batch_size); // NOTE(review): the value returned by merge_with is not used
+                            foreach (var (i, size) in enumerate(input_size.dims))
+                            {
+                                if (size < 0)
+                                    throw new ValueError($"Input size (dimension {i} of inputs) must be accessible via " +
+                                        "shape inference, but saw value None.");
+                            }
+                        }
+                    }
+                    else
+                        fixed_batch_size = first_input.TensorShape.with_rank_at_least(1).dims[0];
+
+                    if (tensor_shape.dimension_value(fixed_batch_size) >= 0) // non-negative value: keep the static batch size
+                        batch_size = tensor_shape.dimension_value(fixed_batch_size);
+                    else
+                        batch_size_tensor = array_ops.shape(first_input)[0]; // otherwise take it from the shape tensor
+
+                    Tensor state = null;
+                    if (initial_state != null)
+                        state = initial_state;
+                    else
+                    {
+                        cell.get_initial_state(batch_size: batch_size_tensor, dtype: dtype); // NOTE(review): result is discarded, so state stays null; batch_size_tensor is null when the static branch above ran - confirm intent
+                    }
+                });
+        }
+
         public static (Tensor, Tensor) dynamic_rnn(RnnCell cell, Tensor inputs_tensor,
             Tensor sequence_length = null, Tensor initial_state = null, 
             TF_DataType dtype = TF_DataType.DtInvalid,
diff --git a/src/TensorFlowNET.Core/Operations/clip_ops.cs b/src/TensorFlowNET.Core/Operations/clip_ops.cs
@@ -0,0 +1,45 @@
+﻿/*****************************************************************************
+   Copyright 2018 The TensorFlow.NET Authors. All Rights Reserved.
+
+   Licensed under the Apache License, Version 2.0 (the "License");
+   you may not use this file except in compliance with the License.
+   You may obtain a copy of the License at
+
+       http://www.apache.org/licenses/LICENSE-2.0
+
+   Unless required by applicable law or agreed to in writing, software
+   distributed under the License is distributed on an "AS IS" BASIS,
+   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+   See the License for the specific language governing permissions and
+   limitations under the License.
+******************************************************************************/
+
+using System;
+using System.Collections.Generic;
+using System.Linq;
+using System.Text;
+using System.Threading.Tasks;
+using static Tensorflow.Binding;
+
+namespace Tensorflow
+{
+    public class clip_ops
+    {
+        /// <summary>
+        /// Applies math_ops.minimum with clip_value_max, then math_ops.maximum with clip_value_min.
+        /// </summary>
+        public static Tensor clip_by_value(Tensor t, Tensor clip_value_min, Tensor clip_value_max, string name = null)
+            => tf_with(ops.name_scope(name, "clip_by_value", new { t, clip_value_min, clip_value_max }), delegate
+            {
+                var input = ops.convert_to_tensor(t, name: "t");
+                // Upper bound first. The shape merge checks the result against the
+                // input shape so that broadcasting does not slip through unnoticed.
+                var capped = math_ops.minimum(input, clip_value_max);
+                _ = input.TensorShape.merge_with(capped.shape);
+                // Lower bound second, followed by the same shape check.
+                var clipped = math_ops.maximum(capped, clip_value_min, name: name);
+                _ = input.TensorShape.merge_with(clipped.shape);
+                return clipped;
+            });
+    }
+}
diff --git a/src/TensorFlowNET.Core/TensorFlow.Binding.csproj b/src/TensorFlowNET.Core/TensorFlow.Binding.csproj
@@ -1,7 +1,7 @@
 ﻿<Project Sdk="Microsoft.NET.Sdk">
 
   <PropertyGroup>
-    <TargetFrameworks>net472;netstandard2.0</TargetFrameworks>
+    <TargetFramework>netstandard2.0</TargetFramework>
     <AssemblyName>TensorFlow.NET</AssemblyName>
     <RootNamespace>Tensorflow</RootNamespace>
     <TargetTensorFlow>1.14.1</TargetTensorFlow>
diff --git a/src/TensorFlowNET.Core/Tensors/Dimension.cs b/src/TensorFlowNET.Core/Tensors/Dimension.cs
@@ -22,6 +22,12 @@ public Dimension merge_with(Dimension other)
                 return new Dimension(_value);
         }
 
+        // Lets a plain int be passed wherever a Dimension is expected.
+        public static implicit operator Dimension(int value) => new Dimension(value);
+
+        // Lets a Dimension be read as the integer it carries in its value member.
+        public static implicit operator int(Dimension dimension) => dimension.value;
+
         public override string ToString() => $"Dimension({_value})";
     }
 }
diff --git a/src/TensorFlowNET.Core/Tensors/Tensor.cs b/src/TensorFlowNET.Core/Tensors/Tensor.cs
@@ -162,9 +162,9 @@ public int[] shape
                 using (var status = new Status())
                 {
                     if (value == null)
-                        c_api.TF_GraphSetTensorShape(this.graph, this._as_tf_output(), null, -1, status);
+                        c_api.TF_GraphSetTensorShape(graph, _as_tf_output(), null, -1, status);
                     else
-                        c_api.TF_GraphSetTensorShape(this.graph, this._as_tf_output(), value.Select(Convert.ToInt64).ToArray(), value.Length, status);
+                        c_api.TF_GraphSetTensorShape(graph, _as_tf_output(), value.Select(Convert.ToInt64).ToArray(), value.Length, status);
 
                     status.Check(true);
                 }

Original file line number	Diff line number	Diff line change
`@@ -24,6 +24,16 @@ public static void assert_is_compatible_with(this Tensor self, Tensor other)`
`24`	`24`	`}`
`25`	`25`	`}`
`26`	`26`
	`27`	`+ public static Dimension dimension_at_index(TensorShape shape, int index)`
	`28`	`+ {`
	`29`	`+ return shape.rank < 0 ?`
	`30`	`+ new Dimension(-1) :`
	`31`	`+ new Dimension(shape.dims[index]);`
	`32`	`+ }`
	`33`	`+`
	`34`	`+ public static int dimension_value(Dimension dimension)`
	`35`	`+ => dimension.value;`
	`36`	`+`
`27`	`37`	`public static TensorShape as_shape(this Shape shape)`
`28`	`38`	`=> new TensorShape(shape.Dimensions);`
`29`	`39`	`}`