SciSharp
diff --git a/‎src/TensorFlowNET.Core/APIs/tf.layers.cs
Lines changed: 1 addition & 2 deletions b/‎src/TensorFlowNET.Core/APIs/tf.layers.cs
Lines changed: 1 addition & 2 deletions
diff --git a/‎src/TensorFlowNET.Core/APIs/tf.nn.cs
Lines changed: 2 additions & 2 deletions b/‎src/TensorFlowNET.Core/APIs/tf.nn.cs
Lines changed: 2 additions & 2 deletions
diff --git a/‎src/TensorFlowNET.Core/Framework/meta_graph.cs
Lines changed: 6 additions & 1 deletion b/‎src/TensorFlowNET.Core/Framework/meta_graph.cs
Lines changed: 6 additions & 1 deletion
diff --git a/‎src/TensorFlowNET.Core/Functions/c_api.function.cs
Lines changed: 16 additions & 1 deletion b/‎src/TensorFlowNET.Core/Functions/c_api.function.cs
Lines changed: 16 additions & 1 deletion
diff --git a/‎src/TensorFlowNET.Core/Gradients/math_grad.cs
Lines changed: 4 additions & 7 deletions b/‎src/TensorFlowNET.Core/Gradients/math_grad.cs
Lines changed: 4 additions & 7 deletions
diff --git a/‎src/TensorFlowNET.Core/Gradients/nn_grad.cs
Lines changed: 5 additions & 5 deletions b/‎src/TensorFlowNET.Core/Gradients/nn_grad.cs
Lines changed: 5 additions & 5 deletions
diff --git a/‎src/TensorFlowNET.Core/Graphs/Graph.cs
Lines changed: 0 additions & 6 deletions b/‎src/TensorFlowNET.Core/Graphs/Graph.cs
Lines changed: 0 additions & 6 deletions
diff --git a/‎src/TensorFlowNET.Core/Graphs/c_api.graph.cs
Lines changed: 1 addition & 1 deletion b/‎src/TensorFlowNET.Core/Graphs/c_api.graph.cs
Lines changed: 1 addition & 1 deletion
diff --git a/‎src/TensorFlowNET.Core/Keras/ArgsDefinition/TensorLikeDataAdapterArgs.cs
Lines changed: 16 additions & 0 deletions b/‎src/TensorFlowNET.Core/Keras/ArgsDefinition/TensorLikeDataAdapterArgs.cs
Lines changed: 16 additions & 0 deletions
diff --git a/‎src/TensorFlowNET.Core/Keras/Engine/DataAdapters/DataHandler.cs
Lines changed: 2 additions & 0 deletions b/‎src/TensorFlowNET.Core/Keras/Engine/DataAdapters/DataHandler.cs
Lines changed: 2 additions & 0 deletions
diff --git a/‎src/TensorFlowNET.Core/Keras/Engine/DataAdapters/TensorLikeDataAdapter.cs
Lines changed: 2 additions & 1 deletion b/‎src/TensorFlowNET.Core/Keras/Engine/DataAdapters/TensorLikeDataAdapter.cs
Lines changed: 2 additions & 1 deletion
diff --git a/‎src/TensorFlowNET.Core/Keras/Engine/Layer.State.cs
Lines changed: 21 additions & 0 deletions b/‎src/TensorFlowNET.Core/Keras/Engine/Layer.State.cs
Lines changed: 21 additions & 0 deletions
diff --git a/‎src/TensorFlowNET.Core/Keras/Engine/Model.cs
Lines changed: 33 additions & 2 deletions b/‎src/TensorFlowNET.Core/Keras/Engine/Model.cs
Lines changed: 33 additions & 2 deletions
diff --git a/‎src/TensorFlowNET.Core/Keras/Layers/Embedding.cs
Lines changed: 4 additions & 0 deletions b/‎src/TensorFlowNET.Core/Keras/Layers/Embedding.cs
Lines changed: 4 additions & 0 deletions
diff --git a/‎src/TensorFlowNET.Core/Keras/Layers/LayersApi.cs
Lines changed: 6 additions & 3 deletions b/‎src/TensorFlowNET.Core/Keras/Layers/LayersApi.cs
Lines changed: 6 additions & 3 deletions
diff --git a/‎src/TensorFlowNET.Core/Operations/Initializers/TruncatedNormal.cs
Lines changed: 3 additions & 3 deletions b/‎src/TensorFlowNET.Core/Operations/Initializers/TruncatedNormal.cs
Lines changed: 3 additions & 3 deletions
diff --git a/‎src/TensorFlowNET.Core/Operations/Operation.cs
Lines changed: 30 additions & 1 deletion b/‎src/TensorFlowNET.Core/Operations/Operation.cs
Lines changed: 30 additions & 1 deletion
@@ -193,8 +193,7 @@ public Tensor dense(Tensor inputs,
                     Name = name
                 });
 
-                throw new NotImplementedException("");
-                //return layer.apply(inputs).Item1;
+                return layer.Apply(inputs);
             }
 
             /// <summary>
 
@@ -66,8 +66,8 @@ public Tensor dropout(Tensor x, Tensor keep_prob = null, Tensor noise_shape = nu
                 Tensor keep = null;
                 if (keep_prob != null)
                     keep = 1.0f - keep_prob;
-
-                return nn_ops.dropout_v2(x, rate: rate.Value, noise_shape: noise_shape, seed: seed, name: name);
+                var rate_tensor = rate.HasValue ? tf.constant(rate.Value) : keep;
+                return nn_ops.dropout_v2(x, rate: rate_tensor, noise_shape: noise_shape, seed: seed, name: name);
             }
 
             /// <summary>
 
@@ -150,7 +150,7 @@ public static (Dictionary<string, IVariableV1>, ITensorOrOperation[]) import_sco
             var variables = graph.get_collection<IVariableV1>(tf.GraphKeys.GLOBAL_VARIABLES,
                                      scope: scope_to_prepend_to_names);
             var var_list = new Dictionary<string, IVariableV1>();
-            // variables.ForEach(v => var_list[ops.strip_name_scope(v.Name, scope_to_prepend_to_names)] = v);
+            variables.ForEach(v => var_list[ops.strip_name_scope(v.Name, scope_to_prepend_to_names)] = v);
 
             return (var_list, imported_return_elements);
         }
@@ -277,6 +277,11 @@ private static void add_collection_def(MetaGraphDef meta_graph_def,
                             var proto = x_ref_var.to_proto(export_scope);
                             col_def.BytesList.Value.Add(proto.ToByteString());
                         }
+                        else if(x is ResourceVariable x_res_var)
+                        {
+                            var proto = x_res_var.to_proto(export_scope);
+                            col_def.BytesList.Value.Add(proto.ToByteString());
+                        }
                     }
                     break;
                 case List<RefVariable> collection_list:
 
@@ -31,8 +31,23 @@ public partial class c_api
         /// <param name="output_func_def"></param>
         /// <param name="status"></param>
         [DllImport(TensorFlowLibName)]
-        public static extern void TF_FunctionToFunctionDef(IntPtr func, IntPtr output_func_def, SafeStatusHandle status);
+        public static extern void TF_FunctionToFunctionDef(IntPtr func, SafeBufferHandle output_func_def, SafeStatusHandle status);
 
+        [DllImport(TensorFlowLibName)]
+        public static extern IntPtr TF_GraphToFunction(IntPtr fn_body, string fn_name,
+            bool append_hash_to_fn_name,
+            int num_opers, IntPtr[] opers,
+            int ninputs, TF_Output[] inputs,
+            int noutputs, TF_Output[] outputs,
+            IntPtr output_names,
+            IntPtr opts,
+            string description,
+            SafeStatusHandle status);
+
+        [DllImport(TensorFlowLibName)]
+        public static extern IntPtr TF_FunctionName(IntPtr func);
 
+        [DllImport(TensorFlowLibName)]
+        public static extern void TF_GraphCopyFunction(IntPtr g, IntPtr func, IntPtr grad, SafeStatusHandle status);
     }
 }
@@ -327,8 +327,9 @@ public static Tensor[] _MeanGrad(Operation op, Tensor[] grads)
             var output_shape = op.outputs[0]._shape_tuple();
 
             Tensor result, factor_tensor;
-            if(input_shape != null &&
-                output_shape != null)
+            if(tf.executing_eagerly() 
+                && input_shape != null 
+                && output_shape != null)
             {
                 var input_size = np.prod(input_shape);
                 var output_size = np.prod(output_shape);
@@ -339,11 +340,7 @@ public static Tensor[] _MeanGrad(Operation op, Tensor[] grads)
             {
                 var input_shape_tensor = array_ops.shape(op.inputs[0]);
                 var output_shape_tensor = array_ops.shape(op.outputs[0]);
-                var factor = _safe_shape_div(math_ops.reduce_prod(input_shape_tensor), math_ops.reduce_prod(output_shape_tensor));
-                throw new NotImplementedException("");
-#pragma warning disable CS0162 // Unreachable code detected
-                factor_tensor = null;
-#pragma warning restore CS0162 // Unreachable code detected
+                factor_tensor = _safe_shape_div(math_ops.reduce_prod(input_shape_tensor), math_ops.reduce_prod(output_shape_tensor));
             }
 
             result = math_ops.truediv(sum_grad, math_ops.cast(factor_tensor, sum_grad.dtype));
 
@@ -128,10 +128,10 @@ public static Tensor[] _SparseSoftmaxCrossEntropyWithLogitsGrad(Operation op, Te
         [RegisterGradient("Conv2D")]
         public static Tensor[] _Conv2DGrad(Operation op, Tensor[] grads)
         {
-            var dilations = op.get_attr<int[]>("dilations");
-            var strides = op.get_attr<int[]>("strides");
+            var dilations = op.get_attr_list<int>("dilations");
+            var strides = op.get_attr_list<int>("strides");
             var padding = op.get_attr<string>("padding");
-            var explicit_paddings = op.get_attr<int[]>("explicit_paddings");
+            var explicit_paddings = op.get_attr_list<int>("explicit_paddings");
             var use_cudnn_on_gpu = op.get_attr<bool>("use_cudnn_on_gpu");
             var data_format = op.get_attr<string>("data_format");
             var shape = gen_array_ops.shape_n(new Tensor[] { op.inputs[0], op.inputs[1] });
@@ -287,8 +287,8 @@ public static Tensor[] _MaxPoolGrad(Operation op, Tensor[] grads)
                   op.inputs[0],
                   op.outputs[0],
                   grad,
-                  op.get_attr("ksize") as int[],
-                  op.get_attr("strides") as int[],
+                  op.get_attr_list<int>("ksize"),
+                  op.get_attr_list<int>("strides"),
                   padding: op.get_attr("padding").ToString(),
                   data_format: op.get_attr("data_format").ToString())
             };
 
@@ -293,12 +293,6 @@ public Operation create_op(string op_type, Tensor[] inputs, TF_DataType[] dtypes
 
             _create_op_helper(op, compute_device);
 
-            /*Console.Write($"create_op: {op_type} '{node_def.Name}'");
-            Console.Write($", inputs: {(inputs.Length == 0 ? "empty" : String.Join(", ", inputs.Select(x => x.name)))}");
-            Console.Write($", control_inputs: {(control_inputs.Length == 0 ? "empty" : String.Join(", ", control_inputs.Select(x => x.name)))}");
-            Console.Write($", outputs: {(op.outputs.Length == 0 ? "empty" : String.Join(", ", op.outputs.Select(x => x.name)))}");
-            Console.WriteLine();*/
-
             return op;
         }
 
 
@@ -139,7 +139,7 @@ public partial class c_api
         /// <param name="status">TF_Status*</param>
         [DllImport(TensorFlowLibName)]
         public static extern void TF_GraphToGraphDef(IntPtr graph, SafeBufferHandle output_graph_def, SafeStatusHandle status);
-        
+
         /// <summary>
         /// Returns the number of dimensions of the Tensor referenced by `output`
         /// in `graph`.
 
@@ -0,0 +1,16 @@
+using System;
+using System.Collections.Generic;
+using System.Text;
+
+namespace Tensorflow.Keras.ArgsDefinition
+{
+    /// <summary>
+    /// Settings object accepted by the <c>TensorLikeDataAdapter</c> constructor.
+    /// Every member is a plain read/write auto-property; nothing is validated here.
+    /// </summary>
+    public class TensorLikeDataAdapterArgs
+    {
+        // NOTE(review): presumably the input (feature) tensor - confirm against the adapter.
+        public Tensor X { get; set; }
+        // NOTE(review): presumably the target (label) tensor - confirm against the adapter.
+        public Tensor Y { get; set; }
+        // NOTE(review): looks like the number of samples per batch - confirm.
+        public int BatchSize { get; set; }
+        // NOTE(review): probably the number of steps (batches) to draw - confirm.
+        public int Steps { get; set; }
+        // NOTE(review): probably the number of passes over the data - confirm.
+        public int Epochs { get; set; }
+        // NOTE(review): presumably toggles shuffling of the samples - confirm.
+        public bool Shuffle { get; set; }
+    }
+}
@@ -27,7 +27,9 @@ public class DataHandler
 
         public DataHandler(DataHandlerArgs args)
         {
+            this.args = args;
 
+            var adapter_cls = new TensorLikeDataAdapter(new TensorLikeDataAdapterArgs { });
         }
     }
 }
@@ -1,6 +1,7 @@
 using System;
 using System.Collections.Generic;
 using System.Text;
+using Tensorflow.Keras.ArgsDefinition;
 using static Tensorflow.Binding;
 
 namespace Tensorflow.Keras.Engine.DataAdapters
@@ -10,7 +11,7 @@ namespace Tensorflow.Keras.Engine.DataAdapters
     /// </summary>
     public class TensorLikeDataAdapter : IDataAdapter
     {
-        public TensorLikeDataAdapter()
+        public TensorLikeDataAdapter(TensorLikeDataAdapterArgs args)
         {
             tf.data.Dataset.range(5);
         }
 
@@ -0,0 +1,21 @@
+using System;
+using System.Collections.Generic;
+using System.Text;
+
+namespace Tensorflow.Keras.Engine
+{
+    /// <summary>
+    /// Part of <c>Layer</c> that declares the trainable-state helpers.
+    /// Both helpers are stubs for now: each ends in <see cref="NotImplementedException"/>.
+    /// </summary>
+    public partial class Layer
+    {
+        // Map keyed by layer; the value type is still untyped (object).
+        Dictionary<Layer, object> trainable_state;
+
+        /// <summary>
+        /// Resets <c>trainable_state</c> to an empty dictionary and then throws,
+        /// because collecting the state is not implemented yet.
+        /// </summary>
+        /// <exception cref="NotImplementedException">Always thrown.</exception>
+        Dictionary<Layer, object> _get_trainable_state()
+        {
+            trainable_state = new Dictionary<Layer, object>();
+            throw new NotImplementedException("");
+        }
+
+        /// <summary>
+        /// Not implemented yet; always throws.
+        /// </summary>
+        /// <param name="trainable_state">
+        /// Map keyed by layer. Note that this parameter hides the field of the same name.
+        /// </param>
+        /// <exception cref="NotImplementedException">Always thrown.</exception>
+        void _set_trainable_state(Dictionary<Layer, object> trainable_state)
+        {
+            throw new NotImplementedException("");
+        }
+    }
+}
@@ -1,6 +1,7 @@
-using NumSharp;
+using static Tensorflow.Binding;
 using System;
 using Tensorflow.Keras.ArgsDefinition;
+using Tensorflow.Keras.Engine.DataAdapters;
 using Tensorflow.Keras.Losses;
 using Tensorflow.Keras.Optimizers;
 
@@ -21,6 +22,7 @@ public class Model : Layer
 #pragma warning restore CS0108 // Member hides inherited member; missing new keyword
         string loss;
         IOptimizer optimizer;
+        IVariableV1 _steps_per_execution;
 
         public Model(ModelArgs args) 
             : base(args)
@@ -37,10 +39,25 @@ public void compile(string optimizerName, string lossName)
                     break;
             }
 
+            int experimental_steps_per_execution = 1;
+            _configure_steps_per_execution(experimental_steps_per_execution);
+
+            _reset_compile_cache();
+
             loss = lossName;
             _is_compiled = true;
+        }
+
+        /// <summary>
+        /// Stores the step count in a new int64 variable and assigns it to
+        /// <c>_steps_per_execution</c>.
+        /// </summary>
+        /// <param name="steps_per_execution">Initial value for the variable.</param>
+        void _configure_steps_per_execution(int steps_per_execution)
+        {
+            // NOTE(review): OnlyFirstReplica presumably matters only under a
+            // distribution strategy - confirm.
+            _steps_per_execution = tf.Variable(steps_per_execution,
+                dtype: TF_DataType.TF_INT64,
+                aggregation: VariableAggregation.OnlyFirstReplica);
+        }
+
+        void _reset_compile_cache()
+        {
 
-            // Prepare list of loss functions, same size of model outputs.
         }
 
         public void compile(string optimizerName, ILossFunc lossName)
@@ -70,6 +87,20 @@ public Tensor predict(Tensor x,
             int workers = 1,
             bool use_multiprocessing = false)
         {
+            var data_handler = new DataHandler(new DataHandlerArgs
+            {
+                X = x,
+                BatchSize = batch_size,
+                StepsPerEpoch = steps,
+                InitialEpoch = 0,
+                Epochs = 1,
+                MaxQueueSize = max_queue_size,
+                Workers = workers,
+                UseMultiprocessing = use_multiprocessing,
+                Model = this,
+                StepsPerExecution = _steps_per_execution
+            });
+
             throw new NotImplementedException("");
         }
     }
 
@@ -14,6 +14,7 @@ You may obtain a copy of the License at
    limitations under the License.
 ******************************************************************************/
 
+using System.Linq;
 using Tensorflow.Keras.ArgsDefinition;
 using Tensorflow.Keras.Engine;
 using static Tensorflow.Binding;
@@ -44,6 +45,9 @@ public Embedding(EmbeddingArgs args)
             if (args.InputShape == null)
                 args.InputShape = args.InputLength;
 
+            if (args.BatchInputShape == null)
+                args.BatchInputShape = new int[] { args.BatchSize }.Concat(args.InputShape.dims).ToArray();
+
             embeddings_initializer = embeddings_initializer ?? tf.random_uniform_initializer;
             SupportsMasking = mask_zero;
         }
 
@@ -34,10 +34,13 @@ public Dense Dense(int units,
 
         /// <summary>
         /// Turns positive integers (indexes) into dense vectors of fixed size.
+        /// This layer can only be used as the first layer in a model.
+        /// e.g. [[4], [20]] -> [[0.25, 0.1], [0.6, -0.2]]
+        /// https://www.tensorflow.org/api_docs/python/tf/keras/layers/Embedding
         /// </summary>
-        /// <param name="input_dim"></param>
-        /// <param name="output_dim"></param>
-        /// <param name="embeddings_initializer"></param>
+        /// <param name="input_dim">Size of the vocabulary, i.e. maximum integer index + 1.</param>
+        /// <param name="output_dim">Dimension of the dense embedding.</param>
+        /// <param name="embeddings_initializer">Initializer for the embeddings matrix (see keras.initializers).</param>
         /// <param name="mask_zero"></param>
         /// <returns></returns>
         public Embedding Embedding(int input_dim,
 
@@ -36,9 +36,9 @@ public TruncatedNormal(float mean = 0.0f,
 
         public Tensor Apply(InitializerArgs args)
         {
-            if (args.DType == TF_DataType.DtInvalid)
-                args.DType = this.dtype;
-            return random_ops.truncated_normal(args.Shape, mean, stddev, dtype : dtype, seed: seed);
+            // Samples a truncated-normal tensor of shape args.Shape using this
+            // initializer's mean, stddev and seed.
+            // An explicit args.DType applies to this call only. It is resolved into a
+            // local so one call's override cannot overwrite the initializer's own
+            // dtype member and leak into later calls that pass DtInvalid.
+            var call_dtype = args.DType != TF_DataType.DtInvalid ? args.DType : dtype;
+            return random_ops.truncated_normal(args.Shape, mean, stddev, dtype: call_dtype, seed: seed);
         }
     }
 }
@@ -230,6 +230,35 @@ private object[] _reconstruct_sequence_inputs(OpDef op_def, Tensor[] inputs, Map
         public virtual T get_attr<T>(string name)
             => (T)get_attr(name);
 
+        /// <summary>
+        /// Reads a list-valued attribute of this operation as a typed array.
+        /// </summary>
+        /// <typeparam name="T">
+        /// Element type. In graph mode only <see cref="Int32"/> is decoded.
+        /// </typeparam>
+        /// <param name="name">Name of the attribute to read.</param>
+        /// <returns>
+        /// The attribute values. In graph mode the result is <c>null</c> when the
+        /// attribute does not hold a list or when <typeparamref name="T"/> is not supported.
+        /// </returns>
+        public virtual T[] get_attr_list<T>(string name)
+        {
+            // Eager mode: get_attr's result is cast to the array type as-is.
+            if (tf.executing_eagerly())
+                return (T[])get_attr(name);
+
+            AttrValue attr;
+
+            // The native call and the shared tf.Status are used under the process-wide lock.
+            lock (Locks.ProcessWide)
+            {
+                using var buf = new Buffer();
+                c_api.TF_OperationGetAttrValueProto(_handle, name, buf.Handle, tf.Status.Handle);
+                // NOTE(review): presumably throws when the native call reported an error - confirm.
+                tf.Status.Check(true);
+
+                attr = AttrValue.Parser.ParseFrom(buf.DangerousMemoryBlock.Stream());
+            }
+
+            // ValueCase is an enum, so its ToString() is never null or empty and a
+            // string emptiness test can never fire. Compare the enum instead; this also
+            // avoids dereferencing a null List when the attribute holds a scalar or nothing.
+            if (attr.ValueCase != AttrValue.ValueOneofCase.List)
+                return null;
+
+            switch (typeof(T).Name)
+            {
+                case nameof(Int32):
+                    // List.I holds the integer entries; convert each one to T.
+                    return attr.List.I.Select(v => (T)Convert.ChangeType(v, typeof(T))).ToArray();
+                default:
+                    return null;
+            }
+        }
+
         public virtual object get_attr(string name)
         {
             AttrValue x = null;
@@ -250,7 +279,7 @@ public virtual object get_attr(string name)
             if (oneof_value == "list")
                 throw new NotImplementedException($"Unsupported field type in {x.ToString()}");
 
-            if (oneof_value == "type")
+            if (string.Equals("type", oneof_value, StringComparison.OrdinalIgnoreCase))
                 return x.Type;
 
             object result = x.GetType().GetProperty(oneof_value).GetValue(x);
Original file line number	Diff line number	Diff line change
`@@ -193,8 +193,7 @@ public Tensor dense(Tensor inputs,`
`193`	`193`	`Name = name`
`194`	`194`	`});`
`195`	`195`
`196`		`- throw new NotImplementedException("");`
`197`		`- //return layer.apply(inputs).Item1;`
	`196`	`+ return layer.Apply(inputs);`
`198`	`197`	`}`
`199`	`198`
`200`	`199`	`/// <summary>`
Original file line number	Diff line number	Diff line change
`@@ -150,7 +150,7 @@ public static (Dictionary<string, IVariableV1>, ITensorOrOperation[]) import_sco`
`150`	`150`	`var variables = graph.get_collection<IVariableV1>(tf.GraphKeys.GLOBAL_VARIABLES,`
`151`	`151`	`scope: scope_to_prepend_to_names);`
`152`	`152`	`var var_list = new Dictionary<string, IVariableV1>();`
`153`		`- // variables.ForEach(v => var_list[ops.strip_name_scope(v.Name, scope_to_prepend_to_names)] = v);`
	`153`	`+ variables.ForEach(v => var_list[ops.strip_name_scope(v.Name, scope_to_prepend_to_names)] = v);`
`154`	`154`
`155`	`155`	`return (var_list, imported_return_elements);`
`156`	`156`	`}`
`@@ -277,6 +277,11 @@ private static void add_collection_def(MetaGraphDef meta_graph_def,`
`277`	`277`	`var proto = x_ref_var.to_proto(export_scope);`
`278`	`278`	`col_def.BytesList.Value.Add(proto.ToByteString());`
`279`	`279`	`}`
	`280`	`+ else if(x is ResourceVariable x_res_var)`
	`281`	`+ {`
	`282`	`+ var proto = x_res_var.to_proto(export_scope);`
	`283`	`+ col_def.BytesList.Value.Add(proto.ToByteString());`
	`284`	`+ }`
`280`	`285`	`}`
`281`	`286`	`break;`
`282`	`287`	`case List<RefVariable> collection_list:`
Original file line number	Diff line number	Diff line change
`@@ -27,7 +27,9 @@ public class DataHandler`
`27`	`27`
`28`	`28`	`public DataHandler(DataHandlerArgs args)`
`29`	`29`	`{`
	`30`	`+ this.args = args;`
`30`	`31`
	`32`	`+ var adapter_cls = new TensorLikeDataAdapter(new TensorLikeDataAdapterArgs { });`
`31`	`33`	`}`
`32`	`34`	`}`
`33`	`35`	`}`
Original file line number	Diff line number	Diff line change
`@@ -1,6 +1,7 @@`
`1`	`1`	`using System;`
`2`	`2`	`using System.Collections.Generic;`
`3`	`3`	`using System.Text;`
	`4`	`+using Tensorflow.Keras.ArgsDefinition;`
`4`	`5`	`using static Tensorflow.Binding;`
`5`	`6`
`6`	`7`	`namespace Tensorflow.Keras.Engine.DataAdapters`
`@@ -10,7 +11,7 @@ namespace Tensorflow.Keras.Engine.DataAdapters`
`10`	`11`	`/// </summary>`
`11`	`12`	`public class TensorLikeDataAdapter : IDataAdapter`
`12`	`13`	`{`
`13`		`- public TensorLikeDataAdapter()`
	`14`	`+ public TensorLikeDataAdapter(TensorLikeDataAdapterArgs args)`
`14`	`15`	`{`
`15`	`16`	`tf.data.Dataset.range(5);`
`16`	`17`	`}`
Original file line number	Diff line number	Diff line change
`@@ -36,9 +36,9 @@ public TruncatedNormal(float mean = 0.0f,`
`36`	`36`
`37`	`37`	`public Tensor Apply(InitializerArgs args)`
`38`	`38`	`{`
`39`		`- if (args.DType == TF_DataType.DtInvalid)`
`40`		`- args.DType = this.dtype;`
`41`		`- return random_ops.truncated_normal(args.Shape, mean, stddev, dtype : dtype, seed: seed);`
	`39`	`+ if (args.DType != TF_DataType.DtInvalid)`
	`40`	`+ dtype = args.DType;`
	`41`	`+ return random_ops.truncated_normal(args.Shape, mean, stddev, dtype: dtype, seed: seed);`
`42`	`42`	`}`
`43`	`43`	`}`
`44`	`44`	`}`