@@ -16,6 +16,7 @@ limitations under the License.
 
 using System.Collections.Generic;
 using System.Linq;
+using Tensorflow.Eager;
 using Tensorflow.Framework;
 using static Tensorflow.Binding;
 
@@ -82,7 +83,14 @@ private static Tensor[] _ConcatGradHelper(Operation op, Tensor grad, int start_v
                 .ToArray();
 
             var out_grads = new List<Tensor>();
-            if (constant_op.is_constant(concat_dim))
+            if (concat_dim is EagerTensor)
+            {
+                var non_neg_concat_dim = (int)concat_dim % input_values[0].rank;
+                var sizes = input_values.Select(x => x.shape[non_neg_concat_dim]).ToArray();
+                var sizes_tensor = constant_op.constant(sizes);
+                out_grads = gen_array_ops.split_v(grad, sizes_tensor, sizes[0], non_neg_concat_dim).ToList();
+            }
+            else if (constant_op.is_constant(concat_dim))
             {
                 /*If concat_dim is a constant defined in a different context,
                 then we duplicate it in the current context to avoid passing it
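
The new eager branch above normalizes `concat_dim` with `%` so an axis in the allowed `[-rank, rank)` range maps onto a valid dimension index. A minimal standalone sketch of that normalization, assuming a plain `int` axis (hypothetical `NormalizeAxis` helper, not part of this diff); note that C#'s `%` keeps the sign of the dividend, so the fully defensive form adds `rank` before reducing again:

    // Map an axis in [-rank, rank) to a non-negative index in [0, rank).
    // C#'s % returns a negative remainder for a negative axis, so add
    // rank and take the remainder once more to stay non-negative.
    static int NormalizeAxis(int axis, int rank)
        => ((axis % rank) + rank) % rank;

    // NormalizeAxis(-1, 3) == 2 (the last dimension); NormalizeAxis(1, 3) == 1.
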
@@ -97,33 +105,33 @@ through an Enter node.
                     var value = tensor_util.constant_value(concat_dim);
                     concat_dim = constant_op.constant(value: value, dtype: concat_dim.dtype);
                 }
-            }
 
-            // Using mod here for convenience since concat_dim is already verified
-            // in concat implementation to be within the allowed [-rank, rank) range.
-            var non_neg_concat_dim = concat_dim % array_ops.rank(input_values[0]);
+                // Using mod here for convenience since concat_dim is already verified
+                // in concat implementation to be within the allowed [-rank, rank) range.
+                var non_neg_concat_dim = concat_dim % array_ops.rank(input_values[0]);
 
-            // Get the inputs' tensor shapes
-            var sizes = _ExtractInputShapes(input_values);
+                // Get the inputs' tensor shapes
+                var sizes = _ExtractInputShapes(input_values);
 
-            /* The magic number of 16 was found through benchmarking a range of sizes
-            on CPUs and a Maxwell TitanX. A speedup was seen in a large majority of
-            cases when switching implementations at N=16, but it is possible that
-            there will be a small number of performance regressions.*/
-            if (len(sizes) > 16)
-            {
-                // extract the size of each input along the concat dimension
-                var slice = array_ops.slice(array_ops.stack(sizes, axis: 1),
-                    new Tensor[] { non_neg_concat_dim, tf.constant(0) },
-                    new Tensor[] { tf.constant(1), tf.constant(-1) });
-                var squeeze_sizes = array_ops.squeeze(slice);
-                out_grads = array_ops.split(axis: grad, value: squeeze_sizes, num_split: (int)non_neg_concat_dim).ToList();
-            }
-            else
-            {
-                var offset = gen_array_ops.concat_offset(non_neg_concat_dim, sizes);
-                foreach (var (begin, size) in zip(offset, sizes))
-                    out_grads.Add(gen_array_ops.slice(grad, begin, size));
+                /* The magic number of 16 was found through benchmarking a range of sizes
+                on CPUs and a Maxwell TitanX. A speedup was seen in a large majority of
+                cases when switching implementations at N=16, but it is possible that
+                there will be a small number of performance regressions.*/
+                if (len(sizes) > 16)
+                {
+                    // extract the size of each input along the concat dimension
+                    var slice = array_ops.slice(array_ops.stack(sizes, axis: 1),
+                        new Tensor[] { non_neg_concat_dim, tf.constant(0) },
+                        new Tensor[] { tf.constant(1), tf.constant(-1) });
+                    var squeeze_sizes = array_ops.squeeze(slice);
+                    out_grads = array_ops.split(axis: grad, value: squeeze_sizes, num_split: (int)non_neg_concat_dim).ToList();
+                }
+                else
+                {
+                    var offset = gen_array_ops.concat_offset(non_neg_concat_dim, sizes);
+                    foreach (var (begin, size) in zip(offset, sizes))
+                        out_grads.Add(gen_array_ops.slice(grad, begin, size));
+                }
             }
 
             return (end_value_index <= dim_index ?
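
The gradient of concat is its inverse: `grad` is cut back into one piece per input along the concat axis, either with a single split (more than 16 inputs) or with one slice per input at the begin positions produced by `concat_offset`. A rough sketch of that offset arithmetic in plain C# (hypothetical `ConcatOffsets` helper, not the library op), assuming static extents along the axis:

    // Given each input's extent along the concat axis, compute the begin
    // offset of that input's slice inside the concatenated tensor.
    static int[] ConcatOffsets(int[] sizes)
    {
        var offsets = new int[sizes.Length];
        for (int i = 1; i < sizes.Length; i++)
            offsets[i] = offsets[i - 1] + sizes[i - 1];
        return offsets;
    }

    // Example: inputs of width 2, 3 and 4 give offsets { 0, 2, 5 };
    // slicing grad at those begins with the matching sizes recovers
    // the per-input gradients.

Per the comment in the diff, the crossover at N=16 came from benchmarking on CPUs and a Maxwell TitanX: past that point, one stacked-shape slice plus a single split beats issuing a slice op per input.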