From 9412729ca9968d05d12051b8e8542e2504ba2f6c Mon Sep 17 00:00:00 2001
From: Steven <steven@darebait.com>
Date: Sun, 19 Jun 2022 01:16:50 -0700
Subject: [PATCH 01/33] Fix Conv2dTranspose bias

Conv2dTranspose defaults to have use_bias = true but currently throws a not implemented exception when the parameter is true.
---
 src/TensorFlowNET.Keras/Layers/LayersApi.cs | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/src/TensorFlowNET.Keras/Layers/LayersApi.cs b/src/TensorFlowNET.Keras/Layers/LayersApi.cs
index aa4f416f6..548e3ff95 100644
--- a/src/TensorFlowNET.Keras/Layers/LayersApi.cs
+++ b/src/TensorFlowNET.Keras/Layers/LayersApi.cs
@@ -235,7 +235,7 @@ public Conv2DTranspose Conv2DTranspose(int filters,
             string data_format = null,
             Shape dilation_rate = null,
             string activation = null,
-            bool use_bias = true,
+            bool use_bias = false,
             string kernel_initializer = null,
             string bias_initializer = null,
             string kernel_regularizer = null,

From 21210795d0fb7963c13fb99604b7e7e46df2443d Mon Sep 17 00:00:00 2001
From: Alexander Novikov <novikov_alexander@live.ru>
Date: Wed, 27 Sep 2023 13:16:28 +0000
Subject: [PATCH 02/33] gradient descent tests

---
 .../Variables/variables.py.cs                 |   7 +-
 .../GradientTest/GradientTest.cs              |   2 -
 test/TensorFlowNET.UnitTest/PythonTest.cs     | 178 +++++++++++++++++-
 .../Training/GradientDescentOptimizerTests.cs |  68 +++++++
 4 files changed, 250 insertions(+), 5 deletions(-)
 create mode 100644 test/TensorFlowNET.UnitTest/Training/GradientDescentOptimizerTests.cs

diff --git a/src/TensorFlowNET.Core/Variables/variables.py.cs b/src/TensorFlowNET.Core/Variables/variables.py.cs
index 0c07e0243..f3ae248e6 100644
--- a/src/TensorFlowNET.Core/Variables/variables.py.cs
+++ b/src/TensorFlowNET.Core/Variables/variables.py.cs
@@ -72,7 +72,9 @@ public static List<IVariableV1> global_variables(string scope = null)
         public static Operation variables_initializer(IVariableV1[] var_list, string name = "init")
         {
             if (var_list.Length > 0)
+            {
                 return control_flow_ops.group(var_list.Select(x => x.Initializer).ToArray(), name);
+            }
             else
                 return gen_control_flow_ops.no_op(name: name);
         }
@@ -155,7 +157,10 @@ public static Operation _safe_initial_value_from_op(string name, Operation op, D
 
         public static Tensor global_variables_initializer()
         {
-            throw new NotImplementedException();
+            // if context.executing_eagerly():
+            //      return control_flow_ops.no_op(name = "global_variables_initializer")
+            var group =  variables_initializer(global_variables().ToArray());
+            return group;
         }
     }
 }
diff --git a/test/TensorFlowNET.Graph.UnitTest/GradientTest/GradientTest.cs b/test/TensorFlowNET.Graph.UnitTest/GradientTest/GradientTest.cs
index fc2280051..e2d6db912 100644
--- a/test/TensorFlowNET.Graph.UnitTest/GradientTest/GradientTest.cs
+++ b/test/TensorFlowNET.Graph.UnitTest/GradientTest/GradientTest.cs
@@ -776,8 +776,6 @@ public void testUnconnectedGradientsNoneUnconnectedGradients()
         [TestMethod]
         public void testUnconnectedGradientsZerosUnconnectedGradients()
         {
-
-
             //def testUnconnectedGradientsZerosUnconnectedGradients(self):
             //  with ops.Graph().as_default():
             //    x = constant(1.0, shape=[2, 2])
diff --git a/test/TensorFlowNET.UnitTest/PythonTest.cs b/test/TensorFlowNET.UnitTest/PythonTest.cs
index 50cc2b328..12fd72360 100644
--- a/test/TensorFlowNET.UnitTest/PythonTest.cs
+++ b/test/TensorFlowNET.UnitTest/PythonTest.cs
@@ -144,6 +144,37 @@ public void assertAllClose(double value, NDArray array2, double eps = 1e-5)
             Assert.IsTrue(np.allclose(array1, array2, rtol: eps));
         }
 
+        private class CollectionComparer : System.Collections.IComparer
+        {
+            private readonly double _epsilon;
+
+            public CollectionComparer(double eps = 1e-06) {
+                _epsilon = eps;
+            }
+            public int Compare(object x, object y)
+            {
+                var a = (double)x;
+                var b = (double)y;
+
+                double delta = Math.Abs(a - b);
+                if (delta < _epsilon)
+                {
+                    return 0;
+                }
+                return a.CompareTo(b);
+            }
+        }
+
+        public void assertAllCloseAccordingToType<T>(
+            T[] expected,
+            T[] given,
+            double eps = 1e-6,
+            float float_eps = 1e-6f)
+        {
+            // TODO: check if any of arguments is not double and change toletance
+            CollectionAssert.AreEqual(expected, given, new CollectionComparer(eps));
+        }
+
         public void assertProtoEquals(object toProto, object o)
         {
             throw new NotImplementedException();
@@ -153,6 +184,20 @@ public void assertProtoEquals(object toProto, object o)
 
         #region tensor evaluation and test session
 
+        private Session _cached_session = null;
+        private Graph _cached_graph = null;
+        private object _cached_config = null;
+        private bool _cached_force_gpu = false;
+
+        private void _ClearCachedSession()
+        {
+            if (self._cached_session != null)
+            {
+                self._cached_session.Dispose();
+                self._cached_session = null;
+            }
+        }
+
         //protected object _eval_helper(Tensor[] tensors)
         //{
         //    if (tensors == null)
@@ -218,9 +263,56 @@ public T evaluate<T>(Tensor tensor)
         }
 
 
-        public Session cached_session()
+        ///Returns a TensorFlow Session for use in executing tests.
+        public Session cached_session(
+            Graph graph = null, object config = null, bool use_gpu = false, bool force_gpu = false)
         {
-            throw new NotImplementedException();
+            // This method behaves differently than self.session(): for performance reasons
+            // `cached_session` will by default reuse the same session within the same
+            // test.The session returned by this function will only be closed at the end
+            // of the test(in the TearDown function).
+
+            // Use the `use_gpu` and `force_gpu` options to control where ops are run.If
+            // `force_gpu` is True, all ops are pinned to `/ device:GPU:0`. Otherwise, if
+            // `use_gpu` is True, TensorFlow tries to run as many ops on the GPU as
+            // possible.If both `force_gpu and `use_gpu` are False, all ops are pinned to
+            // the CPU.
+
+            // Example:
+            // python
+            // class MyOperatorTest(test_util.TensorFlowTestCase) :
+            //   def testMyOperator(self):
+            //     with self.cached_session() as sess:
+            //       valid_input = [1.0, 2.0, 3.0, 4.0, 5.0]
+            //     result = MyOperator(valid_input).eval()
+            //       self.assertEqual(result, [1.0, 2.0, 3.0, 5.0, 8.0]
+            //       invalid_input = [-1.0, 2.0, 7.0]
+            //     with self.assertRaisesOpError("negative input not supported"):
+            //         MyOperator(invalid_input).eval()
+
+
+            // Args:
+            //   graph: Optional graph to use during the returned session.
+            //   config: An optional config_pb2.ConfigProto to use to configure the
+            //     session.
+            //   use_gpu: If True, attempt to run as many ops as possible on GPU.
+            //   force_gpu: If True, pin all ops to `/device:GPU:0`.
+
+            // Yields:
+            //   A Session object that should be used as a context manager to surround
+            //   the graph building and execution code in a test case.
+
+
+            // TODO:
+            //  if context.executing_eagerly():
+            //    return self._eval_helper(tensors)
+            //  else:
+            {
+                var sess = self._get_cached_session(
+                    graph, config, force_gpu, crash_if_inconsistent_args: true);
+                using var cached = self._constrain_devices_and_set_default(sess, use_gpu, force_gpu);
+                return cached;
+            }
         }
 
         //Returns a TensorFlow Session for use in executing tests.
@@ -268,6 +360,40 @@ public Session session(Graph graph = null, object config = null, bool use_gpu =
             return s.as_default();
         }
 
+        private Session _constrain_devices_and_set_default(Session sess, bool use_gpu, bool force_gpu)
+        {
+            // Set the session and its graph to global default and constrain devices."""
+            if (tf.executing_eagerly())
+                return null;
+            else
+            {
+                sess.graph.as_default();
+                sess.as_default();
+                {
+                    if (force_gpu)
+                    {
+                        // TODO:
+
+                        // Use the name of an actual device if one is detected, or
+                        // '/device:GPU:0' otherwise
+                        /* var gpu_name = gpu_device_name();
+                        if (!gpu_name)
+                            gpu_name = "/device:GPU:0"
+                        using (sess.graph.device(gpu_name)) {
+                            yield return sess;
+                        }*/
+                        return sess;
+                    }
+                    else if (use_gpu)
+                        return sess;
+                    else
+                        using (sess.graph.device("/device:CPU:0"))
+                            return sess;
+                }
+
+            }
+        }
+
         // See session() for details.
         private Session _create_session(Graph graph, object cfg, bool forceGpu)
         {
@@ -312,6 +438,54 @@ private Session _create_session(Graph graph, object cfg, bool forceGpu)
             return new Session(graph);//, config = prepare_config(config))
         }
 
+        private Session _get_cached_session(
+                          Graph graph = null,
+                          object config = null,
+                          bool force_gpu = false,
+                          bool crash_if_inconsistent_args = true)
+        {
+            // See cached_session() for documentation.
+            if (self._cached_session == null)
+            {
+                var sess = self._create_session(graph, config, force_gpu);
+                self._cached_session = sess;
+                self._cached_graph = graph;
+                self._cached_config = config;
+                self._cached_force_gpu = force_gpu;
+                return sess;
+            }
+            else
+            {
+
+                if (crash_if_inconsistent_args && !self._cached_graph.Equals(graph))
+                    throw new ValueError(@"The graph used to get the cached session is 
+                                           different than the one that was used to create the
+                                           session. Maybe create a new session with 
+                                           self.session()");
+                if (crash_if_inconsistent_args && !self._cached_config.Equals(config))
+                {
+                    throw new ValueError(@"The config used to get the cached session is 
+                                           different than the one that was used to create the 
+                                           session. Maybe create a new session with 
+                                           self.session()");
+                }
+                if (crash_if_inconsistent_args && !self._cached_force_gpu.Equals(force_gpu))
+                {
+                    throw new ValueError(@"The force_gpu value used to get the cached session is 
+                                           different than the one that was used to create the 
+                                           session. Maybe create a new session with 
+                                           self.session()");
+                }
+                return _cached_session;
+            }
+        }
+
+        [TestCleanup]
+        public void Cleanup()
+        {
+            _ClearCachedSession();
+        }
+
         #endregion
 
         public void AssetSequenceEqual<T>(T[] a, T[] b)
diff --git a/test/TensorFlowNET.UnitTest/Training/GradientDescentOptimizerTests.cs b/test/TensorFlowNET.UnitTest/Training/GradientDescentOptimizerTests.cs
new file mode 100644
index 000000000..977544ae9
--- /dev/null
+++ b/test/TensorFlowNET.UnitTest/Training/GradientDescentOptimizerTests.cs
@@ -0,0 +1,68 @@
+﻿using Microsoft.VisualStudio.TestTools.UnitTesting;
+using System;
+using System.Linq;
+using System.Runtime.Intrinsics.X86;
+using System.Security.AccessControl;
+using Tensorflow.NumPy;
+using TensorFlowNET.UnitTest;
+using static Tensorflow.Binding;
+
+namespace Tensorflow.Keras.UnitTest.Optimizers
+{
+    [TestClass]
+    public class GradientDescentOptimizerTest : PythonTest
+    {
+        private void TestBasicGeneric<T>() where T : struct
+        {
+            var dtype = Type.GetTypeCode(typeof(T)) switch
+            {
+                TypeCode.Single => np.float32,
+                TypeCode.Double => np.float64,
+                _ => throw new NotImplementedException(),
+            };
+
+            // train.GradientDescentOptimizer is V1 only API.
+            tf.Graph().as_default();
+            using (self.cached_session())
+            {
+                var var0 = tf.Variable(new[] { 1.0, 2.0 }, dtype: dtype);
+                var var1 = tf.Variable(new[] { 3.0, 4.0 }, dtype: dtype);
+                var grads0 = tf.constant(new[] { 0.1, 0.1 }, dtype: dtype);
+                var grads1 = tf.constant(new[] { 0.01, 0.01 }, dtype: dtype);
+                var optimizer = tf.train.GradientDescentOptimizer(3.0f);
+                var grads_and_vars = new[] {
+                    Tuple.Create(grads0, var0 as IVariableV1),
+                    Tuple.Create(grads1, var1 as IVariableV1)
+                };
+                var sgd_op = optimizer.apply_gradients(grads_and_vars);
+
+                var global_variables = variables.global_variables_initializer();
+                self.evaluate<T>(global_variables);
+                // Fetch params to validate initial values
+                // TODO: use self.evaluate<T[]> instead of self.evaluate<double[]>
+                self.assertAllCloseAccordingToType(new double[] { 1.0, 2.0 }, self.evaluate<double[]>(var0));
+                self.assertAllCloseAccordingToType(new double[] { 3.0, 4.0 }, self.evaluate<double[]>(var1));
+                // Run 1 step of sgd
+                sgd_op.run();
+                // Validate updated params
+                self.assertAllCloseAccordingToType(
+                    new double[] { 1.0 - 3.0 * 0.1, 2.0 - 3.0 * 0.1 },
+                    self.evaluate<double[]>(var0));
+                self.assertAllCloseAccordingToType(
+                    new double[] { 3.0 - 3.0 * 0.01, 4.0 - 3.0 * 0.01 },
+                    self.evaluate<double[]>(var1));
+                // TODO: self.assertEqual(0, len(optimizer.variables()));
+            }
+        }
+
+        [TestMethod]
+        public void TestBasic()
+        {
+            //TODO: add np.half
+            TestBasicGeneric<float>();
+            TestBasicGeneric<double>();
+        }
+
+
+    }
+}

From 53bd70bed3828a81e83bc1a2edbe1b3cbfab197a Mon Sep 17 00:00:00 2001
From: Wanglongzhi2001 <583087864@qq.com>
Date: Tue, 7 Nov 2023 22:54:08 +0800
Subject: [PATCH 03/33] fix: fix the validation_pack when multiple input

---
 src/TensorFlowNET.Core/Util/Data.cs           | 26 ++++++++++++++-----
 .../Engine/DataAdapters/DataAdapter.cs        | 14 +++++++---
 .../Engine/Model.Evaluate.cs                  |  8 +++++-
 src/TensorFlowNET.Keras/Engine/Model.Fit.cs   | 23 +++++++++++++---
 4 files changed, 56 insertions(+), 15 deletions(-)

diff --git a/src/TensorFlowNET.Core/Util/Data.cs b/src/TensorFlowNET.Core/Util/Data.cs
index a14c69b18..4e5a65434 100644
--- a/src/TensorFlowNET.Core/Util/Data.cs
+++ b/src/TensorFlowNET.Core/Util/Data.cs
@@ -1,4 +1,5 @@
-﻿using Tensorflow.NumPy;
+﻿using OneOf;
+using Tensorflow.NumPy;
 
 namespace Tensorflow.Util
 {
@@ -8,10 +9,10 @@ namespace Tensorflow.Util
     /// </summary>
     public class ValidationDataPack
     {
-        public NDArray val_x;
+        public OneOf<NDArray, NDArray[]> val_x;
         public NDArray val_y;
         public NDArray val_sample_weight = null;
-
+        public bool val_x_is_array = false;
         public ValidationDataPack((NDArray, NDArray) validation_data)
         {
             this.val_x = validation_data.Item1;
@@ -27,15 +28,17 @@ public ValidationDataPack((NDArray, NDArray, NDArray) validation_data)
 
         public ValidationDataPack((IEnumerable<NDArray>, NDArray) validation_data)
         {
-            this.val_x = validation_data.Item1.ToArray()[0];
+            this.val_x = validation_data.Item1.ToArray();
             this.val_y = validation_data.Item2;
+            val_x_is_array = true;
         }
 
         public ValidationDataPack((IEnumerable<NDArray>, NDArray, NDArray) validation_data)
         {
-            this.val_x = validation_data.Item1.ToArray()[0];
+            this.val_x = validation_data.Item1.ToArray();
             this.val_y = validation_data.Item2;
             this.val_sample_weight = validation_data.Item3;
+            val_x_is_array = true;
         }
 
         public static implicit operator ValidationDataPack((NDArray, NDArray) validation_data)
@@ -52,15 +55,24 @@ public static implicit operator ValidationDataPack((IEnumerable<NDArray>, NDArra
 
         public void Deconstruct(out NDArray val_x, out NDArray val_y)
         {
-            val_x = this.val_x;
+            val_x = this.val_x.AsT0;
             val_y = this.val_y;
         }
 
         public void Deconstruct(out NDArray val_x, out NDArray val_y, out NDArray val_sample_weight)
         {
-            val_x = this.val_x;
+            val_x = this.val_x.AsT0;
+            val_y = this.val_y;
+            val_sample_weight = this.val_sample_weight;
+        }
+
+        // add a unuse parameter to make it different from Deconstruct(out NDArray val_x, out NDArray val_y, out NDArray val_sample_weight)
+        public void Deconstruct(out NDArray[] val_x_array, out NDArray val_y, out NDArray val_sample_weight, out NDArray unuse)
+        {
+            val_x_array = this.val_x.AsT1;
             val_y = this.val_y;
             val_sample_weight = this.val_sample_weight;
+            unuse = null;
         }
     }
 }
diff --git a/src/TensorFlowNET.Keras/Engine/DataAdapters/DataAdapter.cs b/src/TensorFlowNET.Keras/Engine/DataAdapters/DataAdapter.cs
index b2750496a..590f30a78 100644
--- a/src/TensorFlowNET.Keras/Engine/DataAdapters/DataAdapter.cs
+++ b/src/TensorFlowNET.Keras/Engine/DataAdapters/DataAdapter.cs
@@ -92,9 +92,17 @@ public static ((IEnumerable<NDArray>, NDArray, NDArray), ValidationDataPack) tra
             var train_y = y[new Slice(0, train_count)];
             var val_x = x.Select(x => x[new Slice(train_count)] as NDArray);
             var val_y = y[new Slice(train_count)];
-            NDArray tmp_sample_weight = sample_weight;
-            sample_weight = sample_weight[new Slice(0, train_count)];
-            ValidationDataPack validation_data = (val_x, val_y, tmp_sample_weight[new Slice(train_count)]);
+
+            ValidationDataPack validation_data;
+            if (sample_weight != null)
+            {
+                validation_data = (val_x, val_y, sample_weight[new Slice(train_count)]);
+                sample_weight = sample_weight[new Slice(0, train_count)];
+            }
+            else
+            {
+                validation_data = (val_x, val_y);
+            }
             return ((train_x, train_y, sample_weight), validation_data);
         }
     }
diff --git a/src/TensorFlowNET.Keras/Engine/Model.Evaluate.cs b/src/TensorFlowNET.Keras/Engine/Model.Evaluate.cs
index 474d5e5a5..b3264429e 100644
--- a/src/TensorFlowNET.Keras/Engine/Model.Evaluate.cs
+++ b/src/TensorFlowNET.Keras/Engine/Model.Evaluate.cs
@@ -70,13 +70,19 @@ public Dictionary<string, float> evaluate(NDArray x, NDArray y,
             return evaluate(data_handler, callbacks, is_val, test_function);
         }
 
-        public Dictionary<string, float> evaluate(IEnumerable<Tensor> x, Tensor y, int verbose = 1, bool is_val = false)
+        public Dictionary<string, float> evaluate(
+            IEnumerable<Tensor> x, 
+            Tensor y, 
+            int verbose = 1,
+            NDArray sample_weight = null,
+            bool is_val = false)
         {
             var data_handler = new DataHandler(new DataHandlerArgs
             {
                 X = new Tensors(x.ToArray()),
                 Y = y,
                 Model = this,
+                SampleWeight = sample_weight,
                 StepsPerExecution = _steps_per_execution
             });
 
diff --git a/src/TensorFlowNET.Keras/Engine/Model.Fit.cs b/src/TensorFlowNET.Keras/Engine/Model.Fit.cs
index d61211c71..13a1b63bc 100644
--- a/src/TensorFlowNET.Keras/Engine/Model.Fit.cs
+++ b/src/TensorFlowNET.Keras/Engine/Model.Fit.cs
@@ -7,6 +7,7 @@
 using System.Diagnostics;
 using Tensorflow.Keras.Callbacks;
 using Tensorflow.Util;
+using OneOf;
 
 namespace Tensorflow.Keras.Engine
 {
@@ -287,10 +288,24 @@ History FitInternal(DataHandler data_handler, int epochs, int verbose, List<ICal
 
                 if (validation_data != null)
                 {
-                    // Because evaluate calls call_test_batch_end, this interferes with our output on the screen
-                    // so we need to pass a is_val parameter to stop on_test_batch_end
-                    var (val_x, val_y, val_sample_weight) = validation_data;
-                    var val_logs = evaluate(val_x, val_y, sample_weight:val_sample_weight, is_val:true);
+                    NDArray val_x;
+                    NDArray[] val_x_array;
+                    NDArray val_y;
+                    NDArray val_sample_weight;
+                    Dictionary<string, float> val_logs;
+                    if (!validation_data.val_x_is_array)
+                    {
+                        (val_x, val_y, val_sample_weight) = validation_data;
+                        // Because evaluate calls call_test_batch_end, this interferes with our output on the screen
+                        // so we need to pass a is_val parameter to stop on_test_batch_end
+                        val_logs = evaluate(val_x, val_y, sample_weight: val_sample_weight, is_val: true);
+
+                    }
+                    else
+                    {
+                        (val_x_array, val_y, val_sample_weight, _) = validation_data;
+                         val_logs = evaluate(val_x_array, val_y, sample_weight: val_sample_weight, is_val: true);
+                    }
                     foreach (var log in val_logs)
                     {
                         logs["val_" + log.Key] = log.Value;

From d453fb6611f4acb3ab405579ae804279d6e07cbe Mon Sep 17 00:00:00 2001
From: Wanglongzhi2001 <583087864@qq.com>
Date: Tue, 7 Nov 2023 23:34:37 +0800
Subject: [PATCH 04/33] refactor: declare some field of ValidationPack as
 internal

---
 src/TensorFlowNET.Core/Util/Data.cs | 8 ++++----
 1 file changed, 4 insertions(+), 4 deletions(-)

diff --git a/src/TensorFlowNET.Core/Util/Data.cs b/src/TensorFlowNET.Core/Util/Data.cs
index 4e5a65434..388efc50f 100644
--- a/src/TensorFlowNET.Core/Util/Data.cs
+++ b/src/TensorFlowNET.Core/Util/Data.cs
@@ -9,9 +9,9 @@ namespace Tensorflow.Util
     /// </summary>
     public class ValidationDataPack
     {
-        public OneOf<NDArray, NDArray[]> val_x;
-        public NDArray val_y;
-        public NDArray val_sample_weight = null;
+        internal OneOf<NDArray, NDArray[]> val_x;
+        internal NDArray val_y;
+        internal NDArray val_sample_weight = null;
         public bool val_x_is_array = false;
         public ValidationDataPack((NDArray, NDArray) validation_data)
         {
@@ -33,7 +33,7 @@ public ValidationDataPack((IEnumerable<NDArray>, NDArray) validation_data)
             val_x_is_array = true;
         }
 
-        public ValidationDataPack((IEnumerable<NDArray>, NDArray, NDArray) validation_data)
+        internal ValidationDataPack((IEnumerable<NDArray>, NDArray, NDArray) validation_data)
         {
             this.val_x = validation_data.Item1.ToArray();
             this.val_y = validation_data.Item2;

From 47e9019a187744bf31e315525ffe352dad36a00c Mon Sep 17 00:00:00 2001
From: Wanglongzhi2001 <583087864@qq.com>
Date: Tue, 7 Nov 2023 23:36:15 +0800
Subject: [PATCH 05/33] refactor: fix a typo

---
 src/TensorFlowNET.Core/Util/Data.cs | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/src/TensorFlowNET.Core/Util/Data.cs b/src/TensorFlowNET.Core/Util/Data.cs
index 388efc50f..fe3466ed0 100644
--- a/src/TensorFlowNET.Core/Util/Data.cs
+++ b/src/TensorFlowNET.Core/Util/Data.cs
@@ -33,7 +33,7 @@ public ValidationDataPack((IEnumerable<NDArray>, NDArray) validation_data)
             val_x_is_array = true;
         }
 
-        internal ValidationDataPack((IEnumerable<NDArray>, NDArray, NDArray) validation_data)
+        public ValidationDataPack((IEnumerable<NDArray>, NDArray, NDArray) validation_data)
         {
             this.val_x = validation_data.Item1.ToArray();
             this.val_y = validation_data.Item2;

From 2a377e2f91b40083f5de86f01b57b32bad5a5932 Mon Sep 17 00:00:00 2001
From: Alexander Novikov <novikov_alexander@live.ru>
Date: Tue, 7 Nov 2023 19:23:34 +0000
Subject: [PATCH 06/33] tests are passing

---
 .../Variables/variables.py.cs                 |  8 ----
 test/TensorFlowNET.UnitTest/PythonTest.cs     | 40 ++++++++++++-------
 .../Training/GradientDescentOptimizerTests.cs | 33 +++++++++------
 3 files changed, 46 insertions(+), 35 deletions(-)

diff --git a/src/TensorFlowNET.Core/Variables/variables.py.cs b/src/TensorFlowNET.Core/Variables/variables.py.cs
index f3ae248e6..91f57e292 100644
--- a/src/TensorFlowNET.Core/Variables/variables.py.cs
+++ b/src/TensorFlowNET.Core/Variables/variables.py.cs
@@ -154,13 +154,5 @@ public static Operation _safe_initial_value_from_op(string name, Operation op, D
 
             return op;
         }
-
-        public static Tensor global_variables_initializer()
-        {
-            // if context.executing_eagerly():
-            //      return control_flow_ops.no_op(name = "global_variables_initializer")
-            var group =  variables_initializer(global_variables().ToArray());
-            return group;
-        }
     }
 }
diff --git a/test/TensorFlowNET.UnitTest/PythonTest.cs b/test/TensorFlowNET.UnitTest/PythonTest.cs
index 12fd72360..090ef097c 100644
--- a/test/TensorFlowNET.UnitTest/PythonTest.cs
+++ b/test/TensorFlowNET.UnitTest/PythonTest.cs
@@ -6,6 +6,7 @@
 using System.Linq;
 using Tensorflow;
 using static Tensorflow.Binding;
+using System.Collections.Generic;
 
 namespace TensorFlowNET.UnitTest
 {
@@ -144,11 +145,12 @@ public void assertAllClose(double value, NDArray array2, double eps = 1e-5)
             Assert.IsTrue(np.allclose(array1, array2, rtol: eps));
         }
 
-        private class CollectionComparer : System.Collections.IComparer
+        private class CollectionComparer : IComparer
         {
             private readonly double _epsilon;
 
-            public CollectionComparer(double eps = 1e-06) {
+            public CollectionComparer(double eps = 1e-06)
+            {
                 _epsilon = eps;
             }
             public int Compare(object x, object y)
@@ -166,13 +168,15 @@ public int Compare(object x, object y)
         }
 
         public void assertAllCloseAccordingToType<T>(
-            T[] expected,
-            T[] given,
+            ICollection expected,
+            ICollection<T> given,
             double eps = 1e-6,
             float float_eps = 1e-6f)
         {
             // TODO: check if any of arguments is not double and change toletance
-            CollectionAssert.AreEqual(expected, given, new CollectionComparer(eps));
+            // remove givenAsDouble and cast expected instead
+            var givenAsDouble = given.Select(x => Convert.ToDouble(x)).ToArray();
+            CollectionAssert.AreEqual(expected, givenAsDouble, new CollectionComparer(eps));
         }
 
         public void assertProtoEquals(object toProto, object o)
@@ -241,17 +245,25 @@ public T evaluate<T>(Tensor tensor)
             //    return self._eval_helper(tensors)
             //  else:
             {
-                var sess = tf.Session();
+                var sess = tf.get_default_session();
                 var ndarray = tensor.eval(sess);
-                if (typeof(T) == typeof(double))
+                if (typeof(T) == typeof(double)
+                    || typeof(T) == typeof(float)
+                    || typeof(T) == typeof(int))
+                {
+                    result = Convert.ChangeType(ndarray, typeof(T));
+                }
+                else if (typeof(T) == typeof(double[]))
+                {
+                    result = ndarray.ToMultiDimArray<double>();
+                }
+                else if (typeof(T) == typeof(float[]))
                 {
-                    double x = ndarray;
-                    result = x;
+                    result = ndarray.ToMultiDimArray<float>();
                 }
-                else if (typeof(T) == typeof(int))
+                else if (typeof(T) == typeof(int[]))
                 {
-                    int x = ndarray;
-                    result = x;
+                    result = ndarray.ToMultiDimArray<int>();
                 }
                 else
                 {
@@ -457,12 +469,12 @@ private Session _get_cached_session(
             else
             {
 
-                if (crash_if_inconsistent_args && !self._cached_graph.Equals(graph))
+                if (crash_if_inconsistent_args && self._cached_graph != null && !self._cached_graph.Equals(graph))
                     throw new ValueError(@"The graph used to get the cached session is 
                                            different than the one that was used to create the
                                            session. Maybe create a new session with 
                                            self.session()");
-                if (crash_if_inconsistent_args && !self._cached_config.Equals(config))
+                if (crash_if_inconsistent_args && self._cached_config != null && !self._cached_config.Equals(config))
                 {
                     throw new ValueError(@"The config used to get the cached session is 
                                            different than the one that was used to create the 
diff --git a/test/TensorFlowNET.UnitTest/Training/GradientDescentOptimizerTests.cs b/test/TensorFlowNET.UnitTest/Training/GradientDescentOptimizerTests.cs
index 977544ae9..3059068f4 100644
--- a/test/TensorFlowNET.UnitTest/Training/GradientDescentOptimizerTests.cs
+++ b/test/TensorFlowNET.UnitTest/Training/GradientDescentOptimizerTests.cs
@@ -1,8 +1,6 @@
 ﻿using Microsoft.VisualStudio.TestTools.UnitTesting;
 using System;
 using System.Linq;
-using System.Runtime.Intrinsics.X86;
-using System.Security.AccessControl;
 using Tensorflow.NumPy;
 using TensorFlowNET.UnitTest;
 using static Tensorflow.Binding;
@@ -12,18 +10,23 @@ namespace Tensorflow.Keras.UnitTest.Optimizers
     [TestClass]
     public class GradientDescentOptimizerTest : PythonTest
     {
-        private void TestBasicGeneric<T>() where T : struct
+        private static TF_DataType GetTypeForNumericType<T>() where T : struct
         {
-            var dtype = Type.GetTypeCode(typeof(T)) switch
+            return Type.GetTypeCode(typeof(T)) switch
             {
                 TypeCode.Single => np.float32,
                 TypeCode.Double => np.float64,
                 _ => throw new NotImplementedException(),
             };
+        }
+
+        private void TestBasicGeneric<T>() where T : struct
+        {
+            var dtype = GetTypeForNumericType<T>();
 
             // train.GradientDescentOptimizer is V1 only API.
             tf.Graph().as_default();
-            using (self.cached_session())
+            using (var sess = self.cached_session())
             {
                 var var0 = tf.Variable(new[] { 1.0, 2.0 }, dtype: dtype);
                 var var1 = tf.Variable(new[] { 3.0, 4.0 }, dtype: dtype);
@@ -36,21 +39,25 @@ private void TestBasicGeneric<T>() where T : struct
                 };
                 var sgd_op = optimizer.apply_gradients(grads_and_vars);
 
-                var global_variables = variables.global_variables_initializer();
-                self.evaluate<T>(global_variables);
+                var global_variables = tf.global_variables_initializer();
+                sess.run(global_variables);
+
                 // Fetch params to validate initial values
+                var initialVar0 = sess.run(var0);
+                var valu = var0.eval(sess);
+                var initialVar1 = sess.run(var1);
                 // TODO: use self.evaluate<T[]> instead of self.evaluate<double[]>
-                self.assertAllCloseAccordingToType(new double[] { 1.0, 2.0 }, self.evaluate<double[]>(var0));
-                self.assertAllCloseAccordingToType(new double[] { 3.0, 4.0 }, self.evaluate<double[]>(var1));
+                self.assertAllCloseAccordingToType(new[] { 1.0, 2.0 }, self.evaluate<T[]>(var0));
+                self.assertAllCloseAccordingToType(new[] { 3.0, 4.0 }, self.evaluate<T[]>(var1));
                 // Run 1 step of sgd
                 sgd_op.run();
                 // Validate updated params
                 self.assertAllCloseAccordingToType(
-                    new double[] { 1.0 - 3.0 * 0.1, 2.0 - 3.0 * 0.1 },
-                    self.evaluate<double[]>(var0));
+                    new[] { 1.0 - 3.0 * 0.1, 2.0 - 3.0 * 0.1 },
+                    self.evaluate<T[]>(var0));
                 self.assertAllCloseAccordingToType(
-                    new double[] { 3.0 - 3.0 * 0.01, 4.0 - 3.0 * 0.01 },
-                    self.evaluate<double[]>(var1));
+                    new[] { 3.0 - 3.0 * 0.01, 4.0 - 3.0 * 0.01 },
+                    self.evaluate<T[]>(var1));
                 // TODO: self.assertEqual(0, len(optimizer.variables()));
             }
         }

From f7b8dba00b2465114926072d4a82924dc35596d7 Mon Sep 17 00:00:00 2001
From: Alexander <novikov_alexander@live.ru>
Date: Wed, 8 Nov 2023 15:16:02 +0000
Subject: [PATCH 07/33] small fixes

---
 .../Training/GradientDescentOptimizerTests.cs      | 14 ++++++--------
 1 file changed, 6 insertions(+), 8 deletions(-)

diff --git a/test/TensorFlowNET.UnitTest/Training/GradientDescentOptimizerTests.cs b/test/TensorFlowNET.UnitTest/Training/GradientDescentOptimizerTests.cs
index 3059068f4..1a650a864 100644
--- a/test/TensorFlowNET.UnitTest/Training/GradientDescentOptimizerTests.cs
+++ b/test/TensorFlowNET.UnitTest/Training/GradientDescentOptimizerTests.cs
@@ -1,4 +1,5 @@
-﻿using Microsoft.VisualStudio.TestTools.UnitTesting;
+﻿using Microsoft.VisualStudio.TestPlatform.Utilities;
+using Microsoft.VisualStudio.TestTools.UnitTesting;
 using System;
 using System.Linq;
 using Tensorflow.NumPy;
@@ -20,7 +21,7 @@ private static TF_DataType GetTypeForNumericType<T>() where T : struct
             };
         }
 
-        private void TestBasicGeneric<T>() where T : struct
+        private void TestBasic<T>() where T : struct
         {
             var dtype = GetTypeForNumericType<T>();
 
@@ -42,11 +43,9 @@ private void TestBasicGeneric<T>() where T : struct
                 var global_variables = tf.global_variables_initializer();
                 sess.run(global_variables);
 
-                // Fetch params to validate initial values
                 var initialVar0 = sess.run(var0);
-                var valu = var0.eval(sess);
                 var initialVar1 = sess.run(var1);
-                // TODO: use self.evaluate<T[]> instead of self.evaluate<double[]>
+                // Fetch params to validate initial values
                 self.assertAllCloseAccordingToType(new[] { 1.0, 2.0 }, self.evaluate<T[]>(var0));
                 self.assertAllCloseAccordingToType(new[] { 3.0, 4.0 }, self.evaluate<T[]>(var1));
                 // Run 1 step of sgd
@@ -66,10 +65,9 @@ private void TestBasicGeneric<T>() where T : struct
         public void TestBasic()
         {
             //TODO: add np.half
-            TestBasicGeneric<float>();
-            TestBasicGeneric<double>();
+            TestBasic<float>();
+            TestBasic<double>();
         }
 
-
     }
 }

From c906f46aadaf2e2f0d1769f026270ba912ef95be Mon Sep 17 00:00:00 2001
From: Alexander <novikov_alexander@live.ru>
Date: Wed, 8 Nov 2023 15:24:13 +0000
Subject: [PATCH 08/33] learning rate test

---
 .../Training/GradientDescentOptimizerTests.cs | 49 +++++++++++++++++++
 1 file changed, 49 insertions(+)

diff --git a/test/TensorFlowNET.UnitTest/Training/GradientDescentOptimizerTests.cs b/test/TensorFlowNET.UnitTest/Training/GradientDescentOptimizerTests.cs
index 1a650a864..92fe97706 100644
--- a/test/TensorFlowNET.UnitTest/Training/GradientDescentOptimizerTests.cs
+++ b/test/TensorFlowNET.UnitTest/Training/GradientDescentOptimizerTests.cs
@@ -1,6 +1,7 @@
 ﻿using Microsoft.VisualStudio.TestPlatform.Utilities;
 using Microsoft.VisualStudio.TestTools.UnitTesting;
 using System;
+using System.Diagnostics;
 using System.Linq;
 using Tensorflow.NumPy;
 using TensorFlowNET.UnitTest;
@@ -69,5 +70,53 @@ public void TestBasic()
             TestBasic<double>();
         }
 
+        private void TestTensorLearningRate<T>() where T : struct
+        {
+            var dtype = GetTypeForNumericType<T>();
+
+            // train.GradientDescentOptimizer is V1 only API.
+            tf.Graph().as_default();
+            using (var sess = self.cached_session())
+            {
+                var var0 = tf.Variable(new[] { 1.0, 2.0 }, dtype: dtype);
+                var var1 = tf.Variable(new[] { 3.0, 4.0 }, dtype: dtype);
+                var grads0 = tf.constant(new[] { 0.1, 0.1 }, dtype: dtype);
+                var grads1 = tf.constant(new[] { 0.01, 0.01 }, dtype: dtype);
+                var lrate = constant_op.constant(3.0);
+                var grads_and_vars = new[] {
+                    Tuple.Create(grads0, var0 as IVariableV1),
+                    Tuple.Create(grads1, var1 as IVariableV1)
+                };
+                var sgd_op = tf.train.GradientDescentOptimizer(lrate)
+                    .apply_gradients(grads_and_vars);
+
+                var global_variables = tf.global_variables_initializer();
+                sess.run(global_variables);
+
+                var initialVar0 = sess.run(var0);
+                var initialVar1 = sess.run(var1);
+                // Fetch params to validate initial values
+                self.assertAllCloseAccordingToType(new[] { 1.0, 2.0 }, self.evaluate<T[]>(var0));
+                self.assertAllCloseAccordingToType(new[] { 3.0, 4.0 }, self.evaluate<T[]>(var1));
+                // Run 1 step of sgd
+                sgd_op.run();
+                // Validate updated params
+                self.assertAllCloseAccordingToType(
+                    new[] { 1.0 - 3.0 * 0.1, 2.0 - 3.0 * 0.1 },
+                    self.evaluate<T[]>(var0));
+                self.assertAllCloseAccordingToType(
+                    new[] { 3.0 - 3.0 * 0.01, 4.0 - 3.0 * 0.01 },
+                    self.evaluate<T[]>(var1));
+                // TODO: self.assertEqual(0, len(optimizer.variables()));
+            }
+        }
+
+        [TestMethod]
+        public void TestTensorLearningRate()
+        {
+            //TODO: add np.half
+            TestTensorLearningRate<float>();
+            TestTensorLearningRate<double>();
+        }
     }
 }

From 149caaec11b649e6f9e85320a1f18689c32cae6c Mon Sep 17 00:00:00 2001
From: Alexander <novikov_alexander@live.ru>
Date: Fri, 10 Nov 2023 02:44:01 +0000
Subject: [PATCH 09/33] test ci

---
 .../Training/GradientDescentOptimizerTests.cs        | 12 ++++++------
 1 file changed, 6 insertions(+), 6 deletions(-)

diff --git a/test/TensorFlowNET.UnitTest/Training/GradientDescentOptimizerTests.cs b/test/TensorFlowNET.UnitTest/Training/GradientDescentOptimizerTests.cs
index 92fe97706..98738528d 100644
--- a/test/TensorFlowNET.UnitTest/Training/GradientDescentOptimizerTests.cs
+++ b/test/TensorFlowNET.UnitTest/Training/GradientDescentOptimizerTests.cs
@@ -27,8 +27,8 @@ private void TestBasic<T>() where T : struct
             var dtype = GetTypeForNumericType<T>();
 
             // train.GradientDescentOptimizer is V1 only API.
-            tf.Graph().as_default();
-            using (var sess = self.cached_session())
+            //tf.Graph().as_default();
+            /*using (var sess = self.cached_session())
             {
                 var var0 = tf.Variable(new[] { 1.0, 2.0 }, dtype: dtype);
                 var var1 = tf.Variable(new[] { 3.0, 4.0 }, dtype: dtype);
@@ -59,7 +59,7 @@ private void TestBasic<T>() where T : struct
                     new[] { 3.0 - 3.0 * 0.01, 4.0 - 3.0 * 0.01 },
                     self.evaluate<T[]>(var1));
                 // TODO: self.assertEqual(0, len(optimizer.variables()));
-            }
+            }*/
         }
 
         [TestMethod]
@@ -67,7 +67,7 @@ public void TestBasic()
         {
             //TODO: add np.half
             TestBasic<float>();
-            TestBasic<double>();
+            // TestBasic<double>();
         }
 
         private void TestTensorLearningRate<T>() where T : struct
@@ -115,8 +115,8 @@ private void TestTensorLearningRate<T>() where T : struct
         public void TestTensorLearningRate()
         {
             //TODO: add np.half
-            TestTensorLearningRate<float>();
-            TestTensorLearningRate<double>();
+            // TestTensorLearningRate<float>();
+            // TestTensorLearningRate<double>();
         }
     }
 }

From 2cb5fd66f842832a2254155f296a54764473f5cd Mon Sep 17 00:00:00 2001
From: Alexander <novikov_alexander@live.ru>
Date: Fri, 10 Nov 2023 13:53:40 +0000
Subject: [PATCH 10/33] new graph

---
 .../Training/BasicLinearModel.cs                |  2 ++
 .../Training/GradientDescentOptimizerTests.cs   | 17 +++++++----------
 2 files changed, 9 insertions(+), 10 deletions(-)

diff --git a/test/TensorFlowNET.UnitTest/Training/BasicLinearModel.cs b/test/TensorFlowNET.UnitTest/Training/BasicLinearModel.cs
index 1283ecaf2..a37f28920 100644
--- a/test/TensorFlowNET.UnitTest/Training/BasicLinearModel.cs
+++ b/test/TensorFlowNET.UnitTest/Training/BasicLinearModel.cs
@@ -15,6 +15,8 @@ public class BasicLinearModel
         [TestMethod]
         public void LinearRegression()
         {
+            tf.Graph().as_default();
+
             // Initialize the weights to `5.0` and the bias to `0.0`
             // In practice, these should be initialized to random values (for example, with `tf.random.normal`)
             var W = tf.Variable(5.0f);
diff --git a/test/TensorFlowNET.UnitTest/Training/GradientDescentOptimizerTests.cs b/test/TensorFlowNET.UnitTest/Training/GradientDescentOptimizerTests.cs
index 98738528d..1632f1e73 100644
--- a/test/TensorFlowNET.UnitTest/Training/GradientDescentOptimizerTests.cs
+++ b/test/TensorFlowNET.UnitTest/Training/GradientDescentOptimizerTests.cs
@@ -1,8 +1,5 @@
-﻿using Microsoft.VisualStudio.TestPlatform.Utilities;
-using Microsoft.VisualStudio.TestTools.UnitTesting;
+﻿using Microsoft.VisualStudio.TestTools.UnitTesting;
 using System;
-using System.Diagnostics;
-using System.Linq;
 using Tensorflow.NumPy;
 using TensorFlowNET.UnitTest;
 using static Tensorflow.Binding;
@@ -27,8 +24,8 @@ private void TestBasic<T>() where T : struct
             var dtype = GetTypeForNumericType<T>();
 
             // train.GradientDescentOptimizer is V1 only API.
-            //tf.Graph().as_default();
-            /*using (var sess = self.cached_session())
+            tf.Graph().as_default();
+            using (var sess = self.cached_session())
             {
                 var var0 = tf.Variable(new[] { 1.0, 2.0 }, dtype: dtype);
                 var var1 = tf.Variable(new[] { 3.0, 4.0 }, dtype: dtype);
@@ -59,7 +56,7 @@ private void TestBasic<T>() where T : struct
                     new[] { 3.0 - 3.0 * 0.01, 4.0 - 3.0 * 0.01 },
                     self.evaluate<T[]>(var1));
                 // TODO: self.assertEqual(0, len(optimizer.variables()));
-            }*/
+            }
         }
 
         [TestMethod]
@@ -67,7 +64,7 @@ public void TestBasic()
         {
             //TODO: add np.half
             TestBasic<float>();
-            // TestBasic<double>();
+            TestBasic<double>();
         }
 
         private void TestTensorLearningRate<T>() where T : struct
@@ -115,8 +112,8 @@ private void TestTensorLearningRate<T>() where T : struct
         public void TestTensorLearningRate()
         {
             //TODO: add np.half
-            // TestTensorLearningRate<float>();
-            // TestTensorLearningRate<double>();
+            TestTensorLearningRate<float>();
+            TestTensorLearningRate<double>();
         }
     }
 }

From 09d466d697e58d97598bbee248ffd7ceb8a7be92 Mon Sep 17 00:00:00 2001
From: Alexander <novikov_alexander@live.ru>
Date: Fri, 10 Nov 2023 14:00:51 +0000
Subject: [PATCH 11/33] ci test

---
 test/TensorFlowNET.UnitTest/Training/BasicLinearModel.cs | 4 +++-
 1 file changed, 3 insertions(+), 1 deletion(-)

diff --git a/test/TensorFlowNET.UnitTest/Training/BasicLinearModel.cs b/test/TensorFlowNET.UnitTest/Training/BasicLinearModel.cs
index a37f28920..d0da1d5b9 100644
--- a/test/TensorFlowNET.UnitTest/Training/BasicLinearModel.cs
+++ b/test/TensorFlowNET.UnitTest/Training/BasicLinearModel.cs
@@ -15,7 +15,9 @@ public class BasicLinearModel
         [TestMethod]
         public void LinearRegression()
         {
-            tf.Graph().as_default();
+            var graph = tf.Graph().as_default();
+            var sess = new Session(graph);
+            sess.as_default();
 
             // Initialize the weights to `5.0` and the bias to `0.0`
             // In practice, these should be initialized to random values (for example, with `tf.random.normal`)

From c5b4928bd6eaa9fcff9d0e71932cd7c1587d1eb6 Mon Sep 17 00:00:00 2001
From: Alexander <novikov_alexander@live.ru>
Date: Fri, 10 Nov 2023 14:28:41 +0000
Subject: [PATCH 12/33] correct namespace

passing
---
 test/TensorFlowNET.UnitTest/Training/BasicLinearModel.cs      | 4 ----
 .../Training/GradientDescentOptimizerTests.cs                 | 4 ++--
 2 files changed, 2 insertions(+), 6 deletions(-)

diff --git a/test/TensorFlowNET.UnitTest/Training/BasicLinearModel.cs b/test/TensorFlowNET.UnitTest/Training/BasicLinearModel.cs
index d0da1d5b9..1283ecaf2 100644
--- a/test/TensorFlowNET.UnitTest/Training/BasicLinearModel.cs
+++ b/test/TensorFlowNET.UnitTest/Training/BasicLinearModel.cs
@@ -15,10 +15,6 @@ public class BasicLinearModel
         [TestMethod]
         public void LinearRegression()
         {
-            var graph = tf.Graph().as_default();
-            var sess = new Session(graph);
-            sess.as_default();
-
             // Initialize the weights to `5.0` and the bias to `0.0`
             // In practice, these should be initialized to random values (for example, with `tf.random.normal`)
             var W = tf.Variable(5.0f);
diff --git a/test/TensorFlowNET.UnitTest/Training/GradientDescentOptimizerTests.cs b/test/TensorFlowNET.UnitTest/Training/GradientDescentOptimizerTests.cs
index 1632f1e73..d766890b2 100644
--- a/test/TensorFlowNET.UnitTest/Training/GradientDescentOptimizerTests.cs
+++ b/test/TensorFlowNET.UnitTest/Training/GradientDescentOptimizerTests.cs
@@ -1,10 +1,10 @@
 ﻿using Microsoft.VisualStudio.TestTools.UnitTesting;
 using System;
+using Tensorflow;
 using Tensorflow.NumPy;
-using TensorFlowNET.UnitTest;
 using static Tensorflow.Binding;
 
-namespace Tensorflow.Keras.UnitTest.Optimizers
+namespace TensorFlowNET.UnitTest.Training
 {
     [TestClass]
     public class GradientDescentOptimizerTest : PythonTest

From fc8f493187bd382bc994c4f79c17b369611cca36 Mon Sep 17 00:00:00 2001
From: Alexander <novikov_alexander@live.ru>
Date: Fri, 10 Nov 2023 20:47:49 +0000
Subject: [PATCH 13/33] common assembly for python test

---
 TensorFlow.NET.sln                            |  23 +-
 .../PythonTest.cs                             | 448 ------------------
 .../TensorFlowNET.Graph.UnitTest.csproj       |   1 +
 .../Tensorflow.Binding.UnitTest.csproj        |   1 +
 .../PythonTest.cs                             |   3 -
 .../Tensorflow.UnitTest.csproj                |  24 +
 6 files changed, 48 insertions(+), 452 deletions(-)
 delete mode 100644 test/TensorFlowNET.Graph.UnitTest/PythonTest.cs
 rename test/{TensorFlowNET.UnitTest => Tensorflow.UnitTest}/PythonTest.cs (99%)
 create mode 100644 test/Tensorflow.UnitTest/Tensorflow.UnitTest.csproj

diff --git a/TensorFlow.NET.sln b/TensorFlow.NET.sln
index 214b039d4..e0c273568 100644
--- a/TensorFlow.NET.sln
+++ b/TensorFlow.NET.sln
@@ -39,7 +39,9 @@ Project("{9A19103F-16F7-4668-BE54-9A1E7A4F7556}") = "Tensorflow.Benchmark", "too
 EndProject
 Project("{9A19103F-16F7-4668-BE54-9A1E7A4F7556}") = "Tensorflow.Console", "tools\TensorFlowNET.Console\Tensorflow.Console.csproj", "{1DC32255-BA1F-4D6D-A9C9-5BD5ED71CAA0}"
 EndProject
-Project("{FAE04EC0-301F-11D3-BF4B-00C04F79EFBC}") = "TensorFlow.Kernel.UnitTest", "test\TensorFlow.Kernel.UnitTest\TensorFlow.Kernel.UnitTest.csproj", "{654A027D-1364-4729-880B-144DFE1FF5BB}"
+Project("{9A19103F-16F7-4668-BE54-9A1E7A4F7556}") = "TensorFlow.Kernel.UnitTest", "test\TensorFlow.Kernel.UnitTest\TensorFlow.Kernel.UnitTest.csproj", "{654A027D-1364-4729-880B-144DFE1FF5BB}"
+EndProject
+Project("{FAE04EC0-301F-11D3-BF4B-00C04F79EFBC}") = "Tensorflow.UnitTest", "test\Tensorflow.UnitTest\Tensorflow.UnitTest.csproj", "{A73DF5A6-866E-4AED-9017-AA2EE86368C4}"
 EndProject
 Global
 	GlobalSection(SolutionConfigurationPlatforms) = preSolution
@@ -342,6 +344,24 @@ Global
 		{654A027D-1364-4729-880B-144DFE1FF5BB}.Release|x64.Build.0 = Release|Any CPU
 		{654A027D-1364-4729-880B-144DFE1FF5BB}.Release|x86.ActiveCfg = Release|Any CPU
 		{654A027D-1364-4729-880B-144DFE1FF5BB}.Release|x86.Build.0 = Release|Any CPU
+		{A73DF5A6-866E-4AED-9017-AA2EE86368C4}.Debug|Any CPU.ActiveCfg = Debug|Any CPU
+		{A73DF5A6-866E-4AED-9017-AA2EE86368C4}.Debug|Any CPU.Build.0 = Debug|Any CPU
+		{A73DF5A6-866E-4AED-9017-AA2EE86368C4}.Debug|x64.ActiveCfg = Debug|Any CPU
+		{A73DF5A6-866E-4AED-9017-AA2EE86368C4}.Debug|x64.Build.0 = Debug|Any CPU
+		{A73DF5A6-866E-4AED-9017-AA2EE86368C4}.Debug|x86.ActiveCfg = Debug|Any CPU
+		{A73DF5A6-866E-4AED-9017-AA2EE86368C4}.Debug|x86.Build.0 = Debug|Any CPU
+		{A73DF5A6-866E-4AED-9017-AA2EE86368C4}.GPU|Any CPU.ActiveCfg = Debug|Any CPU
+		{A73DF5A6-866E-4AED-9017-AA2EE86368C4}.GPU|Any CPU.Build.0 = Debug|Any CPU
+		{A73DF5A6-866E-4AED-9017-AA2EE86368C4}.GPU|x64.ActiveCfg = Debug|Any CPU
+		{A73DF5A6-866E-4AED-9017-AA2EE86368C4}.GPU|x64.Build.0 = Debug|Any CPU
+		{A73DF5A6-866E-4AED-9017-AA2EE86368C4}.GPU|x86.ActiveCfg = Debug|Any CPU
+		{A73DF5A6-866E-4AED-9017-AA2EE86368C4}.GPU|x86.Build.0 = Debug|Any CPU
+		{A73DF5A6-866E-4AED-9017-AA2EE86368C4}.Release|Any CPU.ActiveCfg = Release|Any CPU
+		{A73DF5A6-866E-4AED-9017-AA2EE86368C4}.Release|Any CPU.Build.0 = Release|Any CPU
+		{A73DF5A6-866E-4AED-9017-AA2EE86368C4}.Release|x64.ActiveCfg = Release|Any CPU
+		{A73DF5A6-866E-4AED-9017-AA2EE86368C4}.Release|x64.Build.0 = Release|Any CPU
+		{A73DF5A6-866E-4AED-9017-AA2EE86368C4}.Release|x86.ActiveCfg = Release|Any CPU
+		{A73DF5A6-866E-4AED-9017-AA2EE86368C4}.Release|x86.Build.0 = Release|Any CPU
 	EndGlobalSection
 	GlobalSection(SolutionProperties) = preSolution
 		HideSolutionNode = FALSE
@@ -363,6 +383,7 @@ Global
 		{C23563DB-FE21-48E7-A411-87A109E4A899} = {E1A5D2B7-10AF-4876-85C0-7714EF274214}
 		{1DC32255-BA1F-4D6D-A9C9-5BD5ED71CAA0} = {E1A5D2B7-10AF-4876-85C0-7714EF274214}
 		{654A027D-1364-4729-880B-144DFE1FF5BB} = {1B0918B9-65AD-4F34-A287-AF4597B27DBD}
+		{A73DF5A6-866E-4AED-9017-AA2EE86368C4} = {1B0918B9-65AD-4F34-A287-AF4597B27DBD}
 	EndGlobalSection
 	GlobalSection(ExtensibilityGlobals) = postSolution
 		SolutionGuid = {2DEAD3CC-486B-4918-A607-50B0DE7B114A}
diff --git a/test/TensorFlowNET.Graph.UnitTest/PythonTest.cs b/test/TensorFlowNET.Graph.UnitTest/PythonTest.cs
deleted file mode 100644
index ccf59f5ae..000000000
--- a/test/TensorFlowNET.Graph.UnitTest/PythonTest.cs
+++ /dev/null
@@ -1,448 +0,0 @@
-﻿using Microsoft.VisualStudio.TestTools.UnitTesting;
-using Newtonsoft.Json.Linq;
-using Tensorflow.NumPy;
-using System;
-using System.Collections;
-using System.Linq;
-using Tensorflow;
-using static Tensorflow.Binding;
-using OneOf.Types;
-using System.Collections.Generic;
-
-namespace TensorFlowNET.UnitTest
-{
-    /// <summary>
-    /// Use as base class for test classes to get additional assertions
-    /// </summary>
-    public class PythonTest
-    {
-        #region python compatibility layer
-        protected PythonTest self { get => this; }
-        protected int None => -1;
-        #endregion
-
-        #region pytest assertions
-
-        public void assertItemsEqual(ICollection given, ICollection expected)
-        {
-            if (given is Hashtable && expected is Hashtable)
-            {
-                Assert.AreEqual(JObject.FromObject(expected).ToString(), JObject.FromObject(given).ToString());
-                return;
-            }
-            Assert.IsNotNull(expected);
-            Assert.IsNotNull(given);
-            var e = expected.OfType<object>().ToArray();
-            var g = given.OfType<object>().ToArray();
-            Assert.AreEqual(e.Length, g.Length, $"The collections differ in length expected {e.Length} but got {g.Length}");
-            for (int i = 0; i < e.Length; i++)
-            {
-                /*if (g[i] is NDArray && e[i] is NDArray)
-                    assertItemsEqual((g[i] as NDArray).GetData<object>(), (e[i] as NDArray).GetData<object>());
-                else*/
-                if (e[i] is ICollection && g[i] is ICollection)
-                    assertEqual(g[i], e[i]);
-                else
-                    Assert.AreEqual(e[i], g[i], $"Items differ at index {i}, expected {e[i]} but got {g[i]}");
-            }
-        }
-
-        public void assertAllEqual(ICollection given, ICollection expected)
-        {
-            assertItemsEqual(given, expected);
-        }
-
-        public void assertFloat32Equal(float expected, float actual, string msg)
-        {
-            float eps = 1e-6f;
-            Assert.IsTrue(Math.Abs(expected - actual) < eps * Math.Max(1.0f, Math.Abs(expected)), $"{msg}: expected {expected} vs actual {actual}");
-        }
-
-        public void assertFloat64Equal(double expected, double actual, string msg)
-        {
-            double eps = 1e-16f;
-            Assert.IsTrue(Math.Abs(expected - actual) < eps * Math.Max(1.0f, Math.Abs(expected)), $"{msg}: expected {expected} vs actual {actual}");
-        }
-
-        public void assertEqual(object given, object expected)
-        {
-            /*if (given is NDArray && expected is NDArray)
-            {
-                assertItemsEqual((given as NDArray).GetData<object>(), (expected as NDArray).GetData<object>());
-                return;
-            }*/
-            if (given is Hashtable && expected is Hashtable)
-            {
-                Assert.AreEqual(JObject.FromObject(expected).ToString(), JObject.FromObject(given).ToString());
-                return;
-            }
-            if (given is ICollection && expected is ICollection)
-            {
-                assertItemsEqual(given as ICollection, expected as ICollection);
-                return;
-            }
-            if (given is float && expected is float)
-            {
-                assertFloat32Equal((float)expected, (float)given, "");
-                return;
-            }
-            if (given is double && expected is double)
-            {
-                assertFloat64Equal((double)expected, (double)given, "");
-                return;
-            }
-            Assert.AreEqual(expected, given);
-        }
-
-        public void assertEquals(object given, object expected)
-        {
-            assertEqual(given, expected);
-        }
-
-        public void assert(object given)
-        {
-            if (given is bool)
-                Assert.IsTrue((bool)given);
-            Assert.IsNotNull(given);
-        }
-
-        public void assertIsNotNone(object given)
-        {
-            Assert.IsNotNull(given);
-        }
-
-        public void assertFalse(bool cond)
-        {
-            Assert.IsFalse(cond);
-        }
-
-        public void assertTrue(bool cond)
-        {
-            Assert.IsTrue(cond);
-        }
-
-        public void assertAllClose(NDArray array1, NDArray array2, double eps = 1e-5)
-        {
-            Assert.IsTrue(np.allclose(array1, array2, rtol: eps));
-        }
-
-        public void assertAllClose(double value, NDArray array2, double eps = 1e-5)
-        {
-            var array1 = np.ones_like(array2) * value;
-            // Assert.IsTrue(np.allclose(array1, array2, rtol: eps));
-        }
-
-        public void assertProtoEquals(object toProto, object o)
-        {
-            throw new NotImplementedException();
-        }
-
-        #endregion
-
-        #region tensor evaluation and test session
-
-        private Session _cached_session = null;
-        private Graph _cached_graph = null;
-        private object _cached_config = null;
-        private bool _cached_force_gpu = false;
-
-        private void _ClearCachedSession()
-        {
-            if (self._cached_session != null)
-            {
-                self._cached_session.Dispose();
-                self._cached_session = null;
-            }
-        }
-
-
-        //protected object _eval_helper(Tensor[] tensors)
-        //{
-        //    if (tensors == null)
-        //        return null;
-        //    return nest.map_structure(self._eval_tensor, tensors);
-        //}
-
-        protected object _eval_tensor(object tensor)
-        {
-            if (tensor == null)
-                return None;
-            //else if (callable(tensor))
-            //     return self._eval_helper(tensor())
-            else
-            {
-                try
-                {
-                    //TODO:
-                    //       if sparse_tensor.is_sparse(tensor):
-                    //         return sparse_tensor.SparseTensorValue(tensor.indices, tensor.values,
-                    //                                                tensor.dense_shape)
-                    //return (tensor as Tensor).numpy();
-                }
-                catch (Exception)
-                {
-                    throw new ValueError("Unsupported type: " + tensor.GetType());
-                }
-                return null;
-            }
-        }
-
-        /// <summary>
-        /// This function is used in many original tensorflow unit tests to evaluate tensors 
-        /// in a test session with special settings (for instance constant folding off)
-        /// 
-        /// </summary>
-        public T evaluate<T>(Tensor tensor)
-        {
-            object result = null;
-            //  if context.executing_eagerly():
-            //    return self._eval_helper(tensors)
-            //  else:
-            {
-                var sess = tf.Session();
-                var ndarray = tensor.eval(sess);
-                if (typeof(T) == typeof(double))
-                {
-                    double x = ndarray;
-                    result = x;
-                }
-                else if (typeof(T) == typeof(int))
-                {
-                    int x = ndarray;
-                    result = x;
-                }
-                else
-                {
-                    result = ndarray;
-                }
-
-                return (T)result;
-            }
-        }
-
-        ///Returns a TensorFlow Session for use in executing tests.
-        public Session cached_session(
-            Graph graph = null, object config = null, bool use_gpu = false, bool force_gpu = false)
-        {
-            // This method behaves differently than self.session(): for performance reasons
-            // `cached_session` will by default reuse the same session within the same
-            // test.The session returned by this function will only be closed at the end
-            // of the test(in the TearDown function).
-
-            // Use the `use_gpu` and `force_gpu` options to control where ops are run.If
-            // `force_gpu` is True, all ops are pinned to `/ device:GPU:0`. Otherwise, if
-            // `use_gpu` is True, TensorFlow tries to run as many ops on the GPU as
-            // possible.If both `force_gpu and `use_gpu` are False, all ops are pinned to
-            // the CPU.
-
-            // Example:
-            // python
-            // class MyOperatorTest(test_util.TensorFlowTestCase) :
-            //   def testMyOperator(self):
-            //     with self.cached_session() as sess:
-            //       valid_input = [1.0, 2.0, 3.0, 4.0, 5.0]
-            //     result = MyOperator(valid_input).eval()
-            //       self.assertEqual(result, [1.0, 2.0, 3.0, 5.0, 8.0]
-            //       invalid_input = [-1.0, 2.0, 7.0]
-            //     with self.assertRaisesOpError("negative input not supported"):
-            //         MyOperator(invalid_input).eval()
-
-
-            // Args:
-            //   graph: Optional graph to use during the returned session.
-            //   config: An optional config_pb2.ConfigProto to use to configure the
-            //     session.
-            //   use_gpu: If True, attempt to run as many ops as possible on GPU.
-            //   force_gpu: If True, pin all ops to `/device:GPU:0`.
-
-            // Yields:
-            //   A Session object that should be used as a context manager to surround
-            //   the graph building and execution code in a test case.
-
-
-            // TODO:
-            //  if context.executing_eagerly():
-            //    return self._eval_helper(tensors)
-            //  else:
-            {
-                var sess = self._get_cached_session(
-                    graph, config, force_gpu, crash_if_inconsistent_args: true);
-                using var cached = self._constrain_devices_and_set_default(sess, use_gpu, force_gpu);
-                return cached; 
-            }
-        }
-
-        //Returns a TensorFlow Session for use in executing tests.
-        public Session session(Graph graph = null, object config = null, bool use_gpu = false, bool force_gpu = false)
-        {
-            //Note that this will set this session and the graph as global defaults.
-
-            //Use the `use_gpu` and `force_gpu` options to control where ops are run.If
-            //`force_gpu` is True, all ops are pinned to `/device:GPU:0`. Otherwise, if
-            //`use_gpu` is True, TensorFlow tries to run as many ops on the GPU as
-            //possible.If both `force_gpu and `use_gpu` are False, all ops are pinned to
-            //the CPU.
-
-            //Example:
-            //```python
-            //class MyOperatorTest(test_util.TensorFlowTestCase):
-            //  def testMyOperator(self):
-            //    with self.session(use_gpu= True):
-            //      valid_input = [1.0, 2.0, 3.0, 4.0, 5.0]
-            //    result = MyOperator(valid_input).eval()
-            //      self.assertEqual(result, [1.0, 2.0, 3.0, 5.0, 8.0]
-            //      invalid_input = [-1.0, 2.0, 7.0]
-            //    with self.assertRaisesOpError("negative input not supported"):
-            //        MyOperator(invalid_input).eval()
-            //```
-
-            //Args:
-            //  graph: Optional graph to use during the returned session.
-            //  config: An optional config_pb2.ConfigProto to use to configure the
-            //    session.
-            //  use_gpu: If True, attempt to run as many ops as possible on GPU.
-            //  force_gpu: If True, pin all ops to `/device:GPU:0`.
-
-            //Yields:
-            //  A Session object that should be used as a context manager to surround
-            //  the graph building and execution code in a test case.
-
-            Session s = null;
-            //if (context.executing_eagerly())
-            //  yield None
-            //else 
-            //{
-            s = self._create_session(graph, config, force_gpu);
-            //}
-            return s.as_default();
-        }
-
-        private Session _constrain_devices_and_set_default(Session sess, bool use_gpu, bool force_gpu)
-        {
-            // Set the session and its graph to global default and constrain devices."""
-            if (tf.executing_eagerly())
-                return null;
-            else {
-                sess.graph.as_default();
-                sess.as_default();
-                {
-                    if (force_gpu)
-                    {
-                        // TODO:
-
-                        // Use the name of an actual device if one is detected, or
-                        // '/device:GPU:0' otherwise
-                        /* var gpu_name = gpu_device_name();
-                        if (!gpu_name)
-                            gpu_name = "/device:GPU:0"
-                        using (sess.graph.device(gpu_name)) {
-                            yield return sess;
-                        }*/
-                        return sess;
-                    }
-                    else if (use_gpu)
-                        return sess;
-                    else 
-                        using (sess.graph.device("/device:CPU:0"))
-                            return sess;
-                }
-                
-            }
-        }
-
-        // See session() for details.
-        private Session _create_session(Graph graph, object cfg, bool forceGpu)
-        {
-            var prepare_config = new Func<object, object>((config) =>
-            {
-                //  """Returns a config for sessions.
-                //  Args:
-                //        config: An optional config_pb2.ConfigProto to use to configure the
-                //      session.
-                //  Returns:
-                //    A config_pb2.ConfigProto object.
-
-                //TODO: config
-
-                //  # use_gpu=False. Currently many tests rely on the fact that any device
-                //  # will be used even when a specific device is supposed to be used.
-                //  allow_soft_placement = not force_gpu
-                //  if config is None:
-                //    config = config_pb2.ConfigProto()
-                //    config.allow_soft_placement = allow_soft_placement
-                //    config.gpu_options.per_process_gpu_memory_fraction = 0.3
-                //  elif not allow_soft_placement and config.allow_soft_placement:
-                //    config_copy = config_pb2.ConfigProto()
-                //    config_copy.CopyFrom(config)
-                //    config = config_copy
-                //    config.allow_soft_placement = False
-                //  # Don't perform optimizations for tests so we don't inadvertently run
-                //  # gpu ops on cpu
-                //  config.graph_options.optimizer_options.opt_level = -1
-                //  # Disable Grappler constant folding since some tests & benchmarks
-                //  # use constant input and become meaningless after constant folding.
-                //  # DO NOT DISABLE GRAPPLER OPTIMIZERS WITHOUT CONSULTING WITH THE
-                //  # GRAPPLER TEAM.
-                //  config.graph_options.rewrite_options.constant_folding = (
-                //      rewriter_config_pb2.RewriterConfig.OFF)
-                //  config.graph_options.rewrite_options.pin_to_host_optimization = (
-                //      rewriter_config_pb2.RewriterConfig.OFF)
-                return config;
-            });
-            //TODO: use this instead of normal session
-            //return new ErrorLoggingSession(graph = graph, config = prepare_config(config))
-            return new Session(graph);//, config = prepare_config(config))
-        }
-
-        private Session _get_cached_session(
-                          Graph graph = null,
-                          object config = null,
-                          bool force_gpu = false,
-                          bool crash_if_inconsistent_args = true)
-        {
-            // See cached_session() for documentation.
-            if (self._cached_session == null)
-            {
-                var sess = self._create_session(graph, config, force_gpu);
-                self._cached_session = sess;
-                self._cached_graph = graph;
-                self._cached_config = config;
-                self._cached_force_gpu = force_gpu;
-                return sess;
-            } else {
-
-                if (crash_if_inconsistent_args && !self._cached_graph.Equals(graph))
-                    throw new ValueError(@"The graph used to get the cached session is 
-                                           different than the one that was used to create the
-                                           session. Maybe create a new session with 
-                                           self.session()");
-                if (crash_if_inconsistent_args && !self._cached_config.Equals(config)) {
-                    throw new ValueError(@"The config used to get the cached session is 
-                                           different than the one that was used to create the 
-                                           session. Maybe create a new session with 
-                                           self.session()");
-                }
-                if (crash_if_inconsistent_args && !self._cached_force_gpu.Equals(force_gpu)) {
-                    throw new ValueError(@"The force_gpu value used to get the cached session is 
-                                           different than the one that was used to create the 
-                                           session. Maybe create a new session with 
-                                           self.session()");
-                }
-                return _cached_session;
-            }
-        }
-
-        [TestCleanup]
-        public void Cleanup()
-        {
-            _ClearCachedSession();
-        }
-
-        #endregion
-
-        public void AssetSequenceEqual<T>(T[] a, T[] b)
-        {
-            Assert.IsTrue(Enumerable.SequenceEqual(a, b));
-        }
-    }
-}
diff --git a/test/TensorFlowNET.Graph.UnitTest/TensorFlowNET.Graph.UnitTest.csproj b/test/TensorFlowNET.Graph.UnitTest/TensorFlowNET.Graph.UnitTest.csproj
index 78a0938c5..74663c1cb 100644
--- a/test/TensorFlowNET.Graph.UnitTest/TensorFlowNET.Graph.UnitTest.csproj
+++ b/test/TensorFlowNET.Graph.UnitTest/TensorFlowNET.Graph.UnitTest.csproj
@@ -36,6 +36,7 @@
   <ItemGroup>
     <ProjectReference Include="..\..\src\TensorFlowNET.Core\Tensorflow.Binding.csproj" />
     <ProjectReference Include="..\..\tools\Tensorflow.UnitTest.RedistHolder\Tensorflow.UnitTest.RedistHolder.csproj" />
+    <ProjectReference Include="..\Tensorflow.UnitTest\Tensorflow.UnitTest.csproj" />
     <ProjectReference Include="..\TensorFlowNET.Keras.UnitTest\Tensorflow.Keras.UnitTest.csproj" />
   </ItemGroup>
 
diff --git a/test/TensorFlowNET.UnitTest/Tensorflow.Binding.UnitTest.csproj b/test/TensorFlowNET.UnitTest/Tensorflow.Binding.UnitTest.csproj
index 7a6a7f92c..5264cb104 100644
--- a/test/TensorFlowNET.UnitTest/Tensorflow.Binding.UnitTest.csproj
+++ b/test/TensorFlowNET.UnitTest/Tensorflow.Binding.UnitTest.csproj
@@ -51,6 +51,7 @@
     <ProjectReference Include="..\..\src\TensorFlowNET.Core\Tensorflow.Binding.csproj" />
     <ProjectReference Include="..\..\src\TensorFlowNET.Text\Tensorflow.Text.csproj" />
     <ProjectReference Include="..\..\tools\Tensorflow.UnitTest.RedistHolder\Tensorflow.UnitTest.RedistHolder.csproj" />
+    <ProjectReference Include="..\Tensorflow.UnitTest\Tensorflow.UnitTest.csproj" />
   </ItemGroup>
 
   <ItemGroup>
diff --git a/test/TensorFlowNET.UnitTest/PythonTest.cs b/test/Tensorflow.UnitTest/PythonTest.cs
similarity index 99%
rename from test/TensorFlowNET.UnitTest/PythonTest.cs
rename to test/Tensorflow.UnitTest/PythonTest.cs
index 090ef097c..b2412ea9f 100644
--- a/test/TensorFlowNET.UnitTest/PythonTest.cs
+++ b/test/Tensorflow.UnitTest/PythonTest.cs
@@ -1,12 +1,9 @@
 ﻿using Microsoft.VisualStudio.TestTools.UnitTesting;
 using Newtonsoft.Json.Linq;
 using Tensorflow.NumPy;
-using System;
 using System.Collections;
-using System.Linq;
 using Tensorflow;
 using static Tensorflow.Binding;
-using System.Collections.Generic;
 
 namespace TensorFlowNET.UnitTest
 {
diff --git a/test/Tensorflow.UnitTest/Tensorflow.UnitTest.csproj b/test/Tensorflow.UnitTest/Tensorflow.UnitTest.csproj
new file mode 100644
index 000000000..66a7d63bd
--- /dev/null
+++ b/test/Tensorflow.UnitTest/Tensorflow.UnitTest.csproj
@@ -0,0 +1,24 @@
+<Project Sdk="Microsoft.NET.Sdk">
+
+  <PropertyGroup>
+    <TargetFramework>net6.0</TargetFramework>
+    <ImplicitUsings>enable</ImplicitUsings>
+    <Nullable>enable</Nullable>
+
+    <IsPackable>false</IsPackable>
+    <IsTestProject>true</IsTestProject>
+  </PropertyGroup>
+
+  <ItemGroup>
+    <PackageReference Include="Microsoft.NET.Test.Sdk" Version="17.5.0" />
+    <PackageReference Include="MSTest.TestAdapter" Version="2.2.10" />
+    <PackageReference Include="MSTest.TestFramework" Version="2.2.10" />
+    <PackageReference Include="coverlet.collector" Version="3.2.0" />
+  </ItemGroup>
+
+  <ItemGroup>
+    <ProjectReference Include="..\..\src\TensorFlowNET.Core\Tensorflow.Binding.csproj" />
+    <ProjectReference Include="..\..\tools\Tensorflow.UnitTest.RedistHolder\Tensorflow.UnitTest.RedistHolder.csproj" />
+  </ItemGroup>
+
+</Project>

From 165e9169e49841bb2d326ff903949244565a1a00 Mon Sep 17 00:00:00 2001
From: Alexander <novikov_alexander@live.ru>
Date: Fri, 10 Nov 2023 21:01:12 +0000
Subject: [PATCH 14/33] assert all close

---
 .../GradientTest/GradientTest.cs              | 22 +------------------
 test/Tensorflow.UnitTest/PythonTest.cs        | 18 +++++++--------
 2 files changed, 10 insertions(+), 30 deletions(-)

diff --git a/test/TensorFlowNET.Graph.UnitTest/GradientTest/GradientTest.cs b/test/TensorFlowNET.Graph.UnitTest/GradientTest/GradientTest.cs
index e2d6db912..cea6de172 100644
--- a/test/TensorFlowNET.Graph.UnitTest/GradientTest/GradientTest.cs
+++ b/test/TensorFlowNET.Graph.UnitTest/GradientTest/GradientTest.cs
@@ -625,25 +625,6 @@ public void testPartialDerivatives()
             }
         }
 
-        // TODO: remove when np.testing.assert_allclose(a, b) is implemented
-        private class CollectionComparer : System.Collections.IComparer
-        {
-            private readonly double _epsilon = 1e-07;
-
-            public int Compare(object x, object y)
-            {
-                var a = (double)x;
-                var b = (double)y;
-
-                double delta = Math.Abs(a - b);
-                if (delta < _epsilon)
-                {
-                    return 0;
-                }
-                return a.CompareTo(b);
-            }
-        }
-
         private struct Case
         {
             public Tensor[] grad1;
@@ -748,8 +729,7 @@ Tensor[] gradients(Tensor[] ys, Tensor[] xs, Tensor[] stop_gradients = null)
                     var npgrad2 = result[1];
                     foreach (var (a, b) in npgrad1.Zip(npgrad2))
                     {
-                        // TODO: np.testing.assert_allclose(a, b);
-                        CollectionAssert.AreEqual(a.ToArray(), b.ToArray(), new CollectionComparer());
+                        self.assertAllClose(a, b);
                     }
                 }
             }
diff --git a/test/Tensorflow.UnitTest/PythonTest.cs b/test/Tensorflow.UnitTest/PythonTest.cs
index b2412ea9f..650f70f2c 100644
--- a/test/Tensorflow.UnitTest/PythonTest.cs
+++ b/test/Tensorflow.UnitTest/PythonTest.cs
@@ -185,9 +185,9 @@ public void assertProtoEquals(object toProto, object o)
 
         #region tensor evaluation and test session
 
-        private Session _cached_session = null;
-        private Graph _cached_graph = null;
-        private object _cached_config = null;
+        private Session? _cached_session = null;
+        private Graph? _cached_graph = null;
+        private object? _cached_config = null;
         private bool _cached_force_gpu = false;
 
         private void _ClearCachedSession()
@@ -237,7 +237,7 @@ protected object _eval_tensor(object tensor)
         /// </summary>
         public T evaluate<T>(Tensor tensor)
         {
-            object result = null;
+            object? result = null;
             //  if context.executing_eagerly():
             //    return self._eval_helper(tensors)
             //  else:
@@ -274,7 +274,7 @@ public T evaluate<T>(Tensor tensor)
 
         ///Returns a TensorFlow Session for use in executing tests.
         public Session cached_session(
-            Graph graph = null, object config = null, bool use_gpu = false, bool force_gpu = false)
+            Graph? graph = null, object? config = null, bool use_gpu = false, bool force_gpu = false)
         {
             // This method behaves differently than self.session(): for performance reasons
             // `cached_session` will by default reuse the same session within the same
@@ -325,7 +325,7 @@ public Session cached_session(
         }
 
         //Returns a TensorFlow Session for use in executing tests.
-        public Session session(Graph graph = null, object config = null, bool use_gpu = false, bool force_gpu = false)
+        public Session session(Graph? graph = null, object? config = null, bool use_gpu = false, bool force_gpu = false)
         {
             //Note that this will set this session and the graph as global defaults.
 
@@ -359,7 +359,7 @@ public Session session(Graph graph = null, object config = null, bool use_gpu =
             //  A Session object that should be used as a context manager to surround
             //  the graph building and execution code in a test case.
 
-            Session s = null;
+            Session? s = null;
             //if (context.executing_eagerly())
             //  yield None
             //else 
@@ -448,8 +448,8 @@ private Session _create_session(Graph graph, object cfg, bool forceGpu)
         }
 
         private Session _get_cached_session(
-                          Graph graph = null,
-                          object config = null,
+                          Graph? graph = null,
+                          object? config = null,
                           bool force_gpu = false,
                           bool crash_if_inconsistent_args = true)
         {

From b906c9a69a15ad413f519db741335bdb1aedf07a Mon Sep 17 00:00:00 2001
From: Alexander <novikov_alexander@live.ru>
Date: Fri, 10 Nov 2023 21:16:42 +0000
Subject: [PATCH 15/33] fix nullability

---
 .../Tensorflow.Keras.UnitTest.csproj          |  1 +
 test/Tensorflow.UnitTest/PythonTest.cs        | 29 ++++++++++++++-----
 2 files changed, 22 insertions(+), 8 deletions(-)

diff --git a/test/TensorFlowNET.Keras.UnitTest/Tensorflow.Keras.UnitTest.csproj b/test/TensorFlowNET.Keras.UnitTest/Tensorflow.Keras.UnitTest.csproj
index 3910eba1c..e8b8d42b3 100644
--- a/test/TensorFlowNET.Keras.UnitTest/Tensorflow.Keras.UnitTest.csproj
+++ b/test/TensorFlowNET.Keras.UnitTest/Tensorflow.Keras.UnitTest.csproj
@@ -25,6 +25,7 @@
   <ItemGroup>
     <ProjectReference Include="..\..\src\TensorFlowNET.Keras\Tensorflow.Keras.csproj" />
     <ProjectReference Include="..\..\tools\Tensorflow.UnitTest.RedistHolder\Tensorflow.UnitTest.RedistHolder.csproj" />
+    <ProjectReference Include="..\TensorFlow.Kernel.UnitTest\TensorFlow.Kernel.UnitTest.csproj" />
   </ItemGroup>
 
   <ItemGroup>
diff --git a/test/Tensorflow.UnitTest/PythonTest.cs b/test/Tensorflow.UnitTest/PythonTest.cs
index 650f70f2c..5d1b1e0e1 100644
--- a/test/Tensorflow.UnitTest/PythonTest.cs
+++ b/test/Tensorflow.UnitTest/PythonTest.cs
@@ -86,9 +86,9 @@ public void assertEqual(object given, object expected)
                 Assert.AreEqual(JObject.FromObject(expected).ToString(), JObject.FromObject(given).ToString());
                 return;
             }
-            if (given is ICollection && expected is ICollection)
+            if (given is ICollection collectionGiven && expected is ICollection collectionExpected)
             {
-                assertItemsEqual(given as ICollection, expected as ICollection);
+                assertItemsEqual(collectionGiven, collectionExpected);
                 return;
             }
             if (given is float && expected is float)
@@ -150,8 +150,21 @@ public CollectionComparer(double eps = 1e-06)
             {
                 _epsilon = eps;
             }
-            public int Compare(object x, object y)
+            public int Compare(object? x, object? y)
             {
+                if (x == null && y == null)
+                {
+                    return 0;
+                }
+                else if (x == null)
+                {
+                    return -1; 
+                }
+                else if (y == null)
+                {
+                    return 1;
+                }
+
                 var a = (double)x;
                 var b = (double)y;
 
@@ -206,7 +219,7 @@ private void _ClearCachedSession()
         //    return nest.map_structure(self._eval_tensor, tensors);
         //}
 
-        protected object _eval_tensor(object tensor)
+        protected object? _eval_tensor(object tensor)
         {
             if (tensor == null)
                 return None;
@@ -273,7 +286,7 @@ public T evaluate<T>(Tensor tensor)
 
 
         ///Returns a TensorFlow Session for use in executing tests.
-        public Session cached_session(
+        public Session? cached_session(
             Graph? graph = null, object? config = null, bool use_gpu = false, bool force_gpu = false)
         {
             // This method behaves differently than self.session(): for performance reasons
@@ -369,7 +382,7 @@ public Session session(Graph? graph = null, object? config = null, bool use_gpu
             return s.as_default();
         }
 
-        private Session _constrain_devices_and_set_default(Session sess, bool use_gpu, bool force_gpu)
+        private Session? _constrain_devices_and_set_default(Session sess, bool use_gpu, bool force_gpu)
         {
             // Set the session and its graph to global default and constrain devices."""
             if (tf.executing_eagerly())
@@ -404,7 +417,7 @@ private Session _constrain_devices_and_set_default(Session sess, bool use_gpu, b
         }
 
         // See session() for details.
-        private Session _create_session(Graph graph, object cfg, bool forceGpu)
+        private Session _create_session(Graph? graph, object? cfg, bool forceGpu)
         {
             var prepare_config = new Func<object, object>((config) =>
             {
@@ -485,7 +498,7 @@ different than the one that was used to create the
                                            session. Maybe create a new session with 
                                            self.session()");
                 }
-                return _cached_session;
+                return self._cached_session;
             }
         }
 

From b6db9410b3c66ad30ac900330708060231e39809 Mon Sep 17 00:00:00 2001
From: Alexander <novikov_alexander@live.ru>
Date: Fri, 10 Nov 2023 21:20:13 +0000
Subject: [PATCH 16/33] update packages

---
 .../TensorFlow.Kernel.UnitTest.csproj                         | 2 +-
 .../TensorFlowNET.Graph.UnitTest.csproj                       | 2 +-
 .../Tensorflow.Keras.UnitTest.csproj                          | 2 +-
 .../Tensorflow.Native.UnitTest.csproj                         | 2 +-
 test/Tensorflow.UnitTest/Tensorflow.UnitTest.csproj           | 4 ++--
 .../TensorflowNET.Hub.Unittest/Tensorflow.Hub.Unittest.csproj | 2 +-
 6 files changed, 7 insertions(+), 7 deletions(-)

diff --git a/test/TensorFlow.Kernel.UnitTest/TensorFlow.Kernel.UnitTest.csproj b/test/TensorFlow.Kernel.UnitTest/TensorFlow.Kernel.UnitTest.csproj
index 21b2731b7..461993408 100644
--- a/test/TensorFlow.Kernel.UnitTest/TensorFlow.Kernel.UnitTest.csproj
+++ b/test/TensorFlow.Kernel.UnitTest/TensorFlow.Kernel.UnitTest.csproj
@@ -10,7 +10,7 @@
   </PropertyGroup>
 
   <ItemGroup>
-    <PackageReference Include="Microsoft.NET.Test.Sdk" Version="17.5.0" />
+    <PackageReference Include="Microsoft.NET.Test.Sdk" Version="17.6.3" />
     <PackageReference Include="MSTest.TestAdapter" Version="2.2.10" />
     <PackageReference Include="MSTest.TestFramework" Version="2.2.10" />
     <PackageReference Include="coverlet.collector" Version="3.2.0" />
diff --git a/test/TensorFlowNET.Graph.UnitTest/TensorFlowNET.Graph.UnitTest.csproj b/test/TensorFlowNET.Graph.UnitTest/TensorFlowNET.Graph.UnitTest.csproj
index 74663c1cb..40dd53f74 100644
--- a/test/TensorFlowNET.Graph.UnitTest/TensorFlowNET.Graph.UnitTest.csproj
+++ b/test/TensorFlowNET.Graph.UnitTest/TensorFlowNET.Graph.UnitTest.csproj
@@ -24,7 +24,7 @@
   </PropertyGroup>
 
   <ItemGroup>
-    <PackageReference Include="Microsoft.NET.Test.Sdk" Version="17.3.2" />
+    <PackageReference Include="Microsoft.NET.Test.Sdk" Version="17.6.3" />
     <PackageReference Include="MSTest.TestAdapter" Version="2.2.10" />
     <PackageReference Include="MSTest.TestFramework" Version="2.2.10" />
     <PackageReference Include="coverlet.collector" Version="3.2.0">
diff --git a/test/TensorFlowNET.Keras.UnitTest/Tensorflow.Keras.UnitTest.csproj b/test/TensorFlowNET.Keras.UnitTest/Tensorflow.Keras.UnitTest.csproj
index e8b8d42b3..edac1c2ff 100644
--- a/test/TensorFlowNET.Keras.UnitTest/Tensorflow.Keras.UnitTest.csproj
+++ b/test/TensorFlowNET.Keras.UnitTest/Tensorflow.Keras.UnitTest.csproj
@@ -13,7 +13,7 @@
   </PropertyGroup>
 
   <ItemGroup>
-    <PackageReference Include="Microsoft.NET.Test.Sdk" Version="17.3.2" />
+    <PackageReference Include="Microsoft.NET.Test.Sdk" Version="17.6.3" />
     <PackageReference Include="MSTest.TestAdapter" Version="2.2.10" />
     <PackageReference Include="MSTest.TestFramework" Version="2.2.10" />
     <PackageReference Include="coverlet.collector" Version="3.2.0">
diff --git a/test/TensorFlowNET.Native.UnitTest/Tensorflow.Native.UnitTest.csproj b/test/TensorFlowNET.Native.UnitTest/Tensorflow.Native.UnitTest.csproj
index a4f1ec567..c054a8707 100644
--- a/test/TensorFlowNET.Native.UnitTest/Tensorflow.Native.UnitTest.csproj
+++ b/test/TensorFlowNET.Native.UnitTest/Tensorflow.Native.UnitTest.csproj
@@ -44,7 +44,7 @@
 
   <ItemGroup>
     <PackageReference Include="FluentAssertions" Version="5.10.3" />
-    <PackageReference Include="Microsoft.NET.Test.Sdk" Version="17.3.2" />
+    <PackageReference Include="Microsoft.NET.Test.Sdk" Version="17.6.3" />
     <PackageReference Include="MSTest.TestAdapter" Version="2.2.10" />
     <PackageReference Include="MSTest.TestFramework" Version="2.2.10" />
     <PackageReference Include="coverlet.collector" Version="3.2.0">
diff --git a/test/Tensorflow.UnitTest/Tensorflow.UnitTest.csproj b/test/Tensorflow.UnitTest/Tensorflow.UnitTest.csproj
index 66a7d63bd..9ad6bc7a5 100644
--- a/test/Tensorflow.UnitTest/Tensorflow.UnitTest.csproj
+++ b/test/Tensorflow.UnitTest/Tensorflow.UnitTest.csproj
@@ -1,4 +1,4 @@
-<Project Sdk="Microsoft.NET.Sdk">
+﻿<Project Sdk="Microsoft.NET.Sdk">
 
   <PropertyGroup>
     <TargetFramework>net6.0</TargetFramework>
@@ -10,7 +10,7 @@
   </PropertyGroup>
 
   <ItemGroup>
-    <PackageReference Include="Microsoft.NET.Test.Sdk" Version="17.5.0" />
+    <PackageReference Include="Microsoft.NET.Test.Sdk" Version="17.6.3" />
     <PackageReference Include="MSTest.TestAdapter" Version="2.2.10" />
     <PackageReference Include="MSTest.TestFramework" Version="2.2.10" />
     <PackageReference Include="coverlet.collector" Version="3.2.0" />
diff --git a/test/TensorflowNET.Hub.Unittest/Tensorflow.Hub.Unittest.csproj b/test/TensorflowNET.Hub.Unittest/Tensorflow.Hub.Unittest.csproj
index 4c3918e4a..c93b89256 100644
--- a/test/TensorflowNET.Hub.Unittest/Tensorflow.Hub.Unittest.csproj
+++ b/test/TensorflowNET.Hub.Unittest/Tensorflow.Hub.Unittest.csproj
@@ -9,7 +9,7 @@
   </PropertyGroup>
 
   <ItemGroup>
-    <PackageReference Include="Microsoft.NET.Test.Sdk" Version="17.3.2" />
+    <PackageReference Include="Microsoft.NET.Test.Sdk" Version="17.6.3" />
     <PackageReference Include="MSTest.TestAdapter" Version="2.2.10" />
     <PackageReference Include="MSTest.TestFramework" Version="2.2.10" />
     <PackageReference Include="coverlet.collector" Version="3.1.2" />

From 7968dc360fbcbb57265e8a49192c8b028e9d0196 Mon Sep 17 00:00:00 2001
From: Alexander <novikov_alexander@live.ru>
Date: Sat, 11 Nov 2023 05:54:38 +0000
Subject: [PATCH 17/33] fix test

---
 test/Tensorflow.UnitTest/PythonTest.cs | 16 +++++++++++++---
 1 file changed, 13 insertions(+), 3 deletions(-)

diff --git a/test/Tensorflow.UnitTest/PythonTest.cs b/test/Tensorflow.UnitTest/PythonTest.cs
index 5d1b1e0e1..dff652933 100644
--- a/test/Tensorflow.UnitTest/PythonTest.cs
+++ b/test/Tensorflow.UnitTest/PythonTest.cs
@@ -133,13 +133,23 @@ public void assertTrue(bool cond)
 
         public void assertAllClose(NDArray array1, NDArray array2, double eps = 1e-5)
         {
-            Assert.IsTrue(np.allclose(array1, array2, rtol: eps));
+            CollectionAssert.AreEqual(array1.ToArray(), array2.ToArray(), new CollectionComparer(eps));
+
+            //TODO: Assert.IsTrue(np.allclose(array1, array2, rtol: eps));
         }
 
         public void assertAllClose(double value, NDArray array2, double eps = 1e-5)
         {
+            if (array2.shape.IsScalar)
+            {
+                double value2 = array2;
+                Assert.AreEqual(value, value2, eps);
+                return;
+            }
             var array1 = np.ones_like(array2) * value;
-            Assert.IsTrue(np.allclose(array1, array2, rtol: eps));
+            CollectionAssert.AreEqual(array1.ToArray(), array2.ToArray(), new CollectionComparer(eps));
+
+            //TODO: Assert.IsTrue(np.allclose(array1, array2, rtol: eps));
         }
 
         private class CollectionComparer : IComparer
@@ -158,7 +168,7 @@ public int Compare(object? x, object? y)
                 }
                 else if (x == null)
                 {
-                    return -1; 
+                    return -1;
                 }
                 else if (y == null)
                 {

From d54f7a62e0e66dee73eff78ce5c93acb195ce813 Mon Sep 17 00:00:00 2001
From: Alexander <novikov_alexander@live.ru>
Date: Mon, 13 Nov 2023 10:33:14 +0000
Subject: [PATCH 18/33] test: more gradients tests

---
 .../Training/GradientDescentOptimizerTests.cs | 113 ++++++++++++++++++
 test/Tensorflow.UnitTest/PythonTest.cs        |  45 +++++--
 2 files changed, 149 insertions(+), 9 deletions(-)

diff --git a/test/TensorFlowNET.UnitTest/Training/GradientDescentOptimizerTests.cs b/test/TensorFlowNET.UnitTest/Training/GradientDescentOptimizerTests.cs
index d766890b2..f7062f00d 100644
--- a/test/TensorFlowNET.UnitTest/Training/GradientDescentOptimizerTests.cs
+++ b/test/TensorFlowNET.UnitTest/Training/GradientDescentOptimizerTests.cs
@@ -1,5 +1,6 @@
 ﻿using Microsoft.VisualStudio.TestTools.UnitTesting;
 using System;
+using System.Linq;
 using Tensorflow;
 using Tensorflow.NumPy;
 using static Tensorflow.Binding;
@@ -67,6 +68,51 @@ public void TestBasic()
             TestBasic<double>();
         }
 
+        private void TestMinimizeResourceVariable<T>() where T : struct
+        {
+            var dtype = GetTypeForNumericType<T>();
+
+            // train.GradientDescentOptimizer is V1 only API.
+            tf.Graph().as_default();
+            using (var sess = self.cached_session())
+            {
+                var var0 = tf.Variable(new[,] { { 1.0f, 2.0f } }, dtype: dtype);
+                var var1 = tf.Variable(new[] { 3.0 }, dtype: dtype);
+                var x = tf.constant(new[,] { { 4.0f }, { 5.0f } }, dtype: dtype);
+
+                var pred = math_ops.matmul(var0, x) + var1;
+                var loss = pred * pred;
+                var sgd_op = tf.train.GradientDescentOptimizer(3.0f).minimize(loss);
+
+                var global_variables = tf.global_variables_initializer();
+                sess.run(global_variables);
+
+                sess.run(new[] { var0, var1 });
+                // Fetch params to validate initial values
+                self.assertAllCloseAccordingToType<T>(new[,] { { 1.0, 2.0 } }, self.evaluate<T[,]>(var0));
+                self.assertAllCloseAccordingToType(new[] { 3.0 }, self.evaluate<T[]>(var1));
+                // Run 1 step of sgd
+                sgd_op.run();
+                // Validate updated params
+                var np_pred = 1.0 * 4.0 + 2.0 * 5.0 + 3.0;
+                var np_grad = 2 * np_pred;
+                self.assertAllCloseAccordingToType(
+                    new[,] { { 1.0 - np_grad * 4.0, 2.0 - np_grad * 5.0 } },
+                    self.evaluate<T[,]>(var0));
+                self.assertAllCloseAccordingToType(
+                    new[] { 3.0 - np_grad },
+                    self.evaluate<T[]>(var1));
+            }
+        }
+
+        [TestMethod]
+        public void TestMinimizeResourceVariable()
+        {
+            //TODO: add np.half
+            TestMinimizeResourceVariable<float>();
+            TestMinimizeResourceVariable<double>();
+        }
+
         private void TestTensorLearningRate<T>() where T : struct
         {
             var dtype = GetTypeForNumericType<T>();
@@ -115,5 +161,72 @@ public void TestTensorLearningRate()
             TestTensorLearningRate<float>();
             TestTensorLearningRate<double>();
         }
+
+        public void TestGradWrtRef<T>() where T : struct
+        {
+            var dtype = GetTypeForNumericType<T>();
+
+            var graph = tf.Graph().as_default();
+            using (var sess = self.cached_session())
+            {
+                var opt = tf.train.GradientDescentOptimizer(3.0f);
+                var values = new[] { 1.0, 3.0 };
+                var vars_ = values.Select(
+                        v => tf.Variable(new[] { v }, dtype: dtype) as IVariableV1
+                    ).ToList();
+                var grads_and_vars = opt.compute_gradients(tf.add(vars_[0], vars_[1]), vars_);
+                sess.run(tf.global_variables_initializer());
+                foreach (var (grad, _) in grads_and_vars)
+                    self.assertAllCloseAccordingToType(new[] { 1.0 }, self.evaluate<T[]>(grad));
+
+            }
+        }
+
+        [TestMethod]
+        public void TestGradWrtRef()
+        {
+            TestGradWrtRef<float>();
+            TestGradWrtRef<double>();
+        }
+
+        public void TestWithGlobalStep<T>() where T : struct
+        {
+            var dtype = GetTypeForNumericType<T>();
+
+            tf.Graph().as_default();
+            using (var sess = self.cached_session())
+            {
+                var global_step = tf.Variable(0, trainable: false);
+                var var0 = tf.Variable(new[] { 1.0, 2.0 }, dtype: dtype);
+                var var1 = tf.Variable(new[] { 3.0, 4.0 }, dtype: dtype);
+                var grads0 = tf.constant(new[] { 0.1, 0.1 }, dtype: dtype);
+                var grads1 = tf.constant(new[] { 0.01, 0.01 }, dtype: dtype);
+                var grads_and_vars = new[] {
+                    Tuple.Create(grads0, var0 as IVariableV1),
+                    Tuple.Create(grads1, var1 as IVariableV1)
+                };
+                var sgd_op = tf.train.GradientDescentOptimizer(3.0f)
+                    .apply_gradients(grads_and_vars, global_step: global_step);
+
+                sess.run(tf.global_variables_initializer());
+                // Fetch params to validate initial values
+                self.assertAllCloseAccordingToType(new[] { 1.0, 2.0 }, self.evaluate<T[]>(var0));
+                self.assertAllCloseAccordingToType(new[] { 3.0, 4.0 }, self.evaluate<T[]>(var1));
+                // Run 1 step of sgd
+                sgd_op.run();
+                // Validate updated params and global_step
+                self.assertAllCloseAccordingToType(new[] { 1.0 - 3.0 * 0.1, 2.0 - 3.0 * 0.1 }, self.evaluate<T[]>(var0));
+                self.assertAllCloseAccordingToType(new[] { 3.0 - 3.0 * 0.01, 4.0 - 3.0 * 0.01 }, self.evaluate<T[]>(var1));
+                Assert.AreEqual(1, self.evaluate<int>(global_step));
+            }
+
+        }
+
+        [TestMethod]
+        public void TestWithGlobalStep()
+        {
+            TestWithGlobalStep<float>();
+            TestWithGlobalStep<double>();
+        }
     }
 }
diff --git a/test/Tensorflow.UnitTest/PythonTest.cs b/test/Tensorflow.UnitTest/PythonTest.cs
index dff652933..1ccd39f02 100644
--- a/test/Tensorflow.UnitTest/PythonTest.cs
+++ b/test/Tensorflow.UnitTest/PythonTest.cs
@@ -175,8 +175,8 @@ public int Compare(object? x, object? y)
                     return 1;
                 }
 
-                var a = (double)x;
-                var b = (double)y;
+                var a = Convert.ToDouble(x);
+                var b = Convert.ToDouble(y);
 
                 double delta = Math.Abs(a - b);
                 if (delta < _epsilon)
@@ -187,6 +187,19 @@ public int Compare(object? x, object? y)
             }
         }
 
+        public void assertAllCloseAccordingToType<T>(
+            double[,] expected,
+            T[,] given,
+            double eps = 1e-6,
+            float float_eps = 1e-6f)
+        {
+            Assert.AreEqual(expected.GetLength(0), given.GetLength(0));
+            Assert.AreEqual(expected.GetLength(1), given.GetLength(1));
+
+            var flattenGiven = given.Cast<T>().ToArray();
+            assertAllCloseAccordingToType(expected, flattenGiven, eps, float_eps);
+        }
+
         public void assertAllCloseAccordingToType<T>(
             ICollection expected,
             ICollection<T> given,
@@ -267,21 +280,35 @@ public T evaluate<T>(Tensor tensor)
             {
                 var sess = tf.get_default_session();
                 var ndarray = tensor.eval(sess);
-                if (typeof(T) == typeof(double)
-                    || typeof(T) == typeof(float)
-                    || typeof(T) == typeof(int))
+
+                if (typeof(T) == typeof(int))
+                {
+                    int i = ndarray;
+                    result = i;
+                }
+                else if (typeof(T) == typeof(float))
+                {
+                    float f = ndarray;
+                    result = f;
+                }
+                else if (typeof(T) == typeof(double))
                 {
-                    result = Convert.ChangeType(ndarray, typeof(T));
+                    double d = ndarray;
+                    result = d;
                 }
-                else if (typeof(T) == typeof(double[]))
+                else if (
+                    typeof(T) == typeof(double[])
+                    || typeof(T) == typeof(double[,]))
                 {
                     result = ndarray.ToMultiDimArray<double>();
                 }
-                else if (typeof(T) == typeof(float[]))
+                else if (typeof(T) == typeof(float[])
+                    || typeof(T) == typeof(float[,]))
                 {
                     result = ndarray.ToMultiDimArray<float>();
                 }
-                else if (typeof(T) == typeof(int[]))
+                else if (typeof(T) == typeof(int[]) 
+                    || typeof(T) == typeof(int[,]))
                 {
                     result = ndarray.ToMultiDimArray<int>();
                 }

From eb0f02577290d930930349870b161e85553e967a Mon Sep 17 00:00:00 2001
From: barfeous <nzksf2wa@duck.com>
Date: Mon, 12 Feb 2024 13:28:54 -0600
Subject: [PATCH 19/33] avoid modifying collection

---
 .../Training/Saving/SavedModel/AugmentedGraphView.cs          | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/src/TensorFlowNET.Core/Training/Saving/SavedModel/AugmentedGraphView.cs b/src/TensorFlowNET.Core/Training/Saving/SavedModel/AugmentedGraphView.cs
index a91933357..c6b26ff49 100644
--- a/src/TensorFlowNET.Core/Training/Saving/SavedModel/AugmentedGraphView.cs
+++ b/src/TensorFlowNET.Core/Training/Saving/SavedModel/AugmentedGraphView.cs
@@ -88,7 +88,7 @@ private ConcreteFunction maybe_uncache_variable_captures(ConcreteFunction concre
 
     public override (IList<Trackable>, IDictionary<Trackable, IEnumerable<TrackableReference>>) breadth_first_traversal()
     {
-        Trackable get_merged_trackable(Trackable x)
+        void merged_trackable(Trackable x)
         {
             // TODO: complete it with new definitions `Asset` and `TrackableConstant`.
             return x;
@@ -100,7 +100,7 @@ Trackable get_merged_trackable(Trackable x)
             // skip the deletion of cache (maybe do it later).
             foreach(var pair in _children_cache[obj])
             {
-                _children_cache[obj][pair.Key] = get_merged_trackable(pair.Value);
+                merged_trackable(pair.Value);
             }
         }
 

From 3448b6434680270026a0f938e913ff1f08f1df9b Mon Sep 17 00:00:00 2001
From: barfeous <nzksf2wa@duck.com>
Date: Wed, 14 Feb 2024 20:25:15 -0600
Subject: [PATCH 20/33] Remove parameter return from newly void local method

---
 .../Training/Saving/SavedModel/AugmentedGraphView.cs            | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/src/TensorFlowNET.Core/Training/Saving/SavedModel/AugmentedGraphView.cs b/src/TensorFlowNET.Core/Training/Saving/SavedModel/AugmentedGraphView.cs
index c6b26ff49..3b4bbdc63 100644
--- a/src/TensorFlowNET.Core/Training/Saving/SavedModel/AugmentedGraphView.cs
+++ b/src/TensorFlowNET.Core/Training/Saving/SavedModel/AugmentedGraphView.cs
@@ -91,8 +91,8 @@ public override (IList<Trackable>, IDictionary<Trackable, IEnumerable<TrackableR
         void merged_trackable(Trackable x)
         {
             // TODO: complete it with new definitions `Asset` and `TrackableConstant`.
-            return x;
         }
+
         var trackable_objects = base.breadth_first_traversal();
 
         foreach(var obj in _children_cache.Keys)

From 27a9e912f0aea535cd3124aac8c54269bfdb05c7 Mon Sep 17 00:00:00 2001
From: Rinne <AsakusaRinne@gmail.com>
Date: Mon, 11 Mar 2024 03:05:42 +0800
Subject: [PATCH 21/33] docs: update README.md

---
 README.md | 8 ++++++++
 1 file changed, 8 insertions(+)

diff --git a/README.md b/README.md
index 0198c873c..75cad0aa7 100644
--- a/README.md
+++ b/README.md
@@ -15,6 +15,14 @@
 
 English | [中文](docs/README-CN.md)
 
+> [!IMPORTANT]
+> We're happy that our work on tensorflow.net has attracted many users. However, at this time, none of the main maintainers of this repo is available for new features and bug fix. We won't refuse PRs and will help to review them.
+> 
+> If you would like to be a contributor or maintainer of tensorflow.net, we'd like to help you to start up.
+>
+> We feel sorry for that and we'll resume the maintaining for this project once one of us has bandwidth for it.
+>   
+
 *master branch and v0.100.x is corresponding to tensorflow v2.10, v0.6x branch is from tensorflow v2.6, v0.15-tensorflow1.15 is from tensorflow1.15. Please add `https://www.myget.org/F/scisharp/api/v3/index.json` to nuget source to use nightly release.*
 
 

From 4a31621a5632c7d6b2ebca1d36561458b91367c5 Mon Sep 17 00:00:00 2001
From: barfeous <nzksf2wa@duck.com>
Date: Sun, 28 Apr 2024 13:04:07 -0500
Subject: [PATCH 22/33] Use TryGetValue instead of ContainsKey + []

---
 .../Training/Saving/SavedModel/AugmentedGraphView.cs      | 8 ++------
 1 file changed, 2 insertions(+), 6 deletions(-)

diff --git a/src/TensorFlowNET.Core/Training/Saving/SavedModel/AugmentedGraphView.cs b/src/TensorFlowNET.Core/Training/Saving/SavedModel/AugmentedGraphView.cs
index 3b4bbdc63..9d0b3f001 100644
--- a/src/TensorFlowNET.Core/Training/Saving/SavedModel/AugmentedGraphView.cs
+++ b/src/TensorFlowNET.Core/Training/Saving/SavedModel/AugmentedGraphView.cs
@@ -109,15 +109,11 @@ void merged_trackable(Trackable x)
 
     public List<(string, Trackable)> list_dependencies(Trackable obj)
     {
-        IDictionary<string, Trackable> children;
-        if (!_children_cache.ContainsKey(obj))
+        if (!_children_cache.TryGetValue(obj, out var children))
         {
             children= new Dictionary<string, Trackable>();
         }
-        else
-        {
-            children= _children_cache[obj];
-        }
+
         List<(string, Trackable)> res = new();
         foreach(var pair in obj.deserialization_dependencies(children))
         {

From f5ba382e49ab0132308739c219ea09b6ac254223 Mon Sep 17 00:00:00 2001
From: Schoen Tannenbaum <169845314+SchoenTannenbaum@users.noreply.github.com>
Date: Mon, 20 May 2024 12:09:06 -0400
Subject: [PATCH 23/33] Regularizer addition and fixes

---
 .../Keras/Regularizers/IRegularizer.cs        | 17 ++++--
 .../CustomizedRegularizerJsonConverter.cs     | 57 +++++++++++++++++++
 .../Operations/Regularizers/L1.cs             | 33 +++++++++++
 .../Operations/Regularizers/L1L2.cs           | 48 ++++++++++++++++
 .../Operations/Regularizers/L2.cs             | 33 +++++++++++
 src/TensorFlowNET.Keras/Regularizers.cs       | 19 +++++--
 src/TensorFlowNET.Keras/Regularizers/L1.cs    | 19 -------
 src/TensorFlowNET.Keras/Regularizers/L1L2.cs  | 24 --------
 src/TensorFlowNET.Keras/Regularizers/L2.cs    | 17 ------
 9 files changed, 198 insertions(+), 69 deletions(-)
 create mode 100644 src/TensorFlowNET.Core/Keras/Saving/Json/CustomizedRegularizerJsonConverter.cs
 create mode 100644 src/TensorFlowNET.Core/Operations/Regularizers/L1.cs
 create mode 100644 src/TensorFlowNET.Core/Operations/Regularizers/L1L2.cs
 create mode 100644 src/TensorFlowNET.Core/Operations/Regularizers/L2.cs
 delete mode 100644 src/TensorFlowNET.Keras/Regularizers/L1.cs
 delete mode 100644 src/TensorFlowNET.Keras/Regularizers/L1L2.cs
 delete mode 100644 src/TensorFlowNET.Keras/Regularizers/L2.cs

diff --git a/src/TensorFlowNET.Core/Keras/Regularizers/IRegularizer.cs b/src/TensorFlowNET.Core/Keras/Regularizers/IRegularizer.cs
index f4045c7b2..e5de76ddb 100644
--- a/src/TensorFlowNET.Core/Keras/Regularizers/IRegularizer.cs
+++ b/src/TensorFlowNET.Core/Keras/Regularizers/IRegularizer.cs
@@ -1,7 +1,16 @@
-﻿namespace Tensorflow.Keras
+﻿using Newtonsoft.Json;
+using System.Collections.Generic;
+using Tensorflow.Keras.Saving.Common;
+
+namespace Tensorflow.Keras
 {
-    public interface IRegularizer
-    {
-        Tensor Apply(RegularizerArgs args);
+  [JsonConverter(typeof(CustomizedRegularizerJsonConverter))]
+  public interface IRegularizer
+  {
+    [JsonProperty("class_name")]
+    string ClassName { get; }
+    [JsonProperty("config")]
+    IDictionary<string, object> Config { get; }
+    Tensor Apply(RegularizerArgs args);
     }
 }
diff --git a/src/TensorFlowNET.Core/Keras/Saving/Json/CustomizedRegularizerJsonConverter.cs b/src/TensorFlowNET.Core/Keras/Saving/Json/CustomizedRegularizerJsonConverter.cs
new file mode 100644
index 000000000..4b1790aca
--- /dev/null
+++ b/src/TensorFlowNET.Core/Keras/Saving/Json/CustomizedRegularizerJsonConverter.cs
@@ -0,0 +1,57 @@
+﻿using Newtonsoft.Json.Linq;
+using Newtonsoft.Json;
+using System;
+using System.Collections.Generic;
+using System.Text;
+using Tensorflow.Operations.Regularizers;
+
+namespace Tensorflow.Keras.Saving.Common
+{
+  class RegularizerInfo
+  {
+    public string class_name { get; set; }
+    public JObject config { get; set; }
+  }
+
+  public class CustomizedRegularizerJsonConverter : JsonConverter
+    {
+        public override bool CanConvert(Type objectType)
+        {
+            return objectType == typeof(IRegularizer);
+        }
+
+        public override bool CanRead => true;
+
+        public override bool CanWrite => true;
+
+        public override void WriteJson(JsonWriter writer, object? value, JsonSerializer serializer)
+        {
+            var regularizer = value as IRegularizer;
+            if (regularizer is null)
+            {
+                JToken.FromObject(null).WriteTo(writer);
+                return;
+            }
+            JToken.FromObject(new RegularizerInfo()
+            {
+              class_name = regularizer.ClassName,
+              config = JObject.FromObject(regularizer.Config)
+            }, serializer).WriteTo(writer);
+        }
+
+        public override object? ReadJson(JsonReader reader, Type objectType, object? existingValue, JsonSerializer serializer)
+        {
+            var info = serializer.Deserialize<RegularizerInfo>(reader);
+            if (info is null)
+            {
+                return null;
+            }
+            return info.class_name switch
+            {
+                "L1L2" => new L1L2 (info.config["l1"].ToObject<float>(), info.config["l2"].ToObject<float>()),
+                "L1" => new L1(info.config["l1"].ToObject<float>()),
+                "L2" => new L2(info.config["l2"].ToObject<float>()),
+            };
+        }
+    }
+}
diff --git a/src/TensorFlowNET.Core/Operations/Regularizers/L1.cs b/src/TensorFlowNET.Core/Operations/Regularizers/L1.cs
new file mode 100644
index 000000000..8a5c68895
--- /dev/null
+++ b/src/TensorFlowNET.Core/Operations/Regularizers/L1.cs
@@ -0,0 +1,33 @@
+﻿using System;
+
+using Tensorflow.Keras;
+
+namespace Tensorflow.Operations.Regularizers
+{
+  public class L1 : IRegularizer
+  {
+    float _l1;
+    private readonly Dictionary<string, object> _config;
+
+    public string ClassName => "L2";
+    public virtual IDictionary<string, object> Config => _config;
+
+    public L1(float l1 = 0.01f)
+    {
+      //  l1 = 0.01 if l1 is None else l1
+      //  validate_float_arg(l1, name = "l1")
+      //  self.l1 = ops.convert_to_tensor(l1)
+      this._l1 = l1;
+
+      _config = new();
+      _config["l1"] = _l1;
+    }
+
+
+    public Tensor Apply(RegularizerArgs args)
+    {
+      //return self.l1 * ops.sum(ops.absolute(x))
+      return _l1 * math_ops.reduce_sum(math_ops.abs(args.X));
+    }
+  }
+}
diff --git a/src/TensorFlowNET.Core/Operations/Regularizers/L1L2.cs b/src/TensorFlowNET.Core/Operations/Regularizers/L1L2.cs
new file mode 100644
index 000000000..e3af00eb5
--- /dev/null
+++ b/src/TensorFlowNET.Core/Operations/Regularizers/L1L2.cs
@@ -0,0 +1,48 @@
+﻿using System;
+
+using Tensorflow.Keras;
+
+namespace Tensorflow.Operations.Regularizers
+{
+  public class L1L2 : IRegularizer
+  {
+    float _l1;
+    float _l2;
+    private readonly Dictionary<string, object> _config;
+
+    public string ClassName => "L1L2";
+    public virtual IDictionary<string, object> Config => _config;
+
+    public L1L2(float l1 = 0.0f, float l2 = 0.0f)
+    {
+      //l1 = 0.0 if l1 is None else l1
+      //l2 = 0.0 if l2 is None else l2
+      //  validate_float_arg(l1, name = "l1")
+      //  validate_float_arg(l2, name = "l2")
+
+      //  self.l1 = l1
+      //  self.l2 = l2
+      this._l1 = l1;
+      this._l2 = l2;
+
+      _config = new();
+      _config["l1"] = l1;
+      _config["l2"] = l2;
+    }
+
+    public Tensor Apply(RegularizerArgs args)
+    {
+        //regularization = ops.convert_to_tensor(0.0, dtype = x.dtype)
+        //if self.l1:
+        //    regularization += self.l1 * ops.sum(ops.absolute(x))
+        //if self.l2:
+        //    regularization += self.l2 * ops.sum(ops.square(x))
+        //return regularization
+
+        Tensor regularization = tf.constant(0.0, args.X.dtype);
+        regularization += _l1 * math_ops.reduce_sum(math_ops.abs(args.X));
+        regularization += _l2 * math_ops.reduce_sum(math_ops.square(args.X));
+        return regularization;
+    }
+  }
+}
diff --git a/src/TensorFlowNET.Core/Operations/Regularizers/L2.cs b/src/TensorFlowNET.Core/Operations/Regularizers/L2.cs
new file mode 100644
index 000000000..6c0e950a9
--- /dev/null
+++ b/src/TensorFlowNET.Core/Operations/Regularizers/L2.cs
@@ -0,0 +1,33 @@
+﻿using System;
+
+using Tensorflow.Keras;
+
+namespace Tensorflow.Operations.Regularizers
+{
+  public class L2 : IRegularizer
+  {
+    float _l2;
+    private readonly Dictionary<string, object> _config;
+
+    public string ClassName => "L2";
+    public virtual IDictionary<string, object> Config => _config;
+
+    public L2(float l2 = 0.01f)
+    {
+      //  l2 = 0.01 if l2 is None else l2
+      //  validate_float_arg(l2, name = "l2")
+      //  self.l2 = l2
+      this._l2 = l2;
+
+      _config = new();
+      _config["l2"] = _l2;
+    }
+
+
+    public Tensor Apply(RegularizerArgs args)
+    {
+      //return self.l2 * ops.sum(ops.square(x))
+      return _l2 * math_ops.reduce_sum(math_ops.square(args.X));
+    }
+  }
+}
diff --git a/src/TensorFlowNET.Keras/Regularizers.cs b/src/TensorFlowNET.Keras/Regularizers.cs
index 98da27a7f..9c6d07ca6 100644
--- a/src/TensorFlowNET.Keras/Regularizers.cs
+++ b/src/TensorFlowNET.Keras/Regularizers.cs
@@ -1,8 +1,17 @@
 ﻿namespace Tensorflow.Keras
 {
-    public class Regularizers
-    {
-        public IRegularizer l2(float l2 = 0.01f)
-            => new L2(l2);
-    }
+  public class Regularizers
+  {
+    public IRegularizer l1(float l1 = 0.01f)
+        => new Tensorflow.Operations.Regularizers.L1(l1);
+    public IRegularizer l2(float l2 = 0.01f)
+        => new Tensorflow.Operations.Regularizers.L2(l2);
+
+    //From TF source
+    //# The default value for l1 and l2 are different from the value in l1_l2
+    //# for backward compatibility reason. Eg, L1L2(l2=0.1) will only have l2
+    //# and no l1 penalty.
+    public IRegularizer l1l2(float l1 = 0.00f, float l2 = 0.00f)
+        => new Tensorflow.Operations.Regularizers.L1L2(l1, l2);
+  }
 }
diff --git a/src/TensorFlowNET.Keras/Regularizers/L1.cs b/src/TensorFlowNET.Keras/Regularizers/L1.cs
deleted file mode 100644
index 0f904b6f9..000000000
--- a/src/TensorFlowNET.Keras/Regularizers/L1.cs
+++ /dev/null
@@ -1,19 +0,0 @@
-﻿using System;
-
-namespace Tensorflow.Keras
-{
-    public class L1 : IRegularizer
-    {
-        float l1;
-
-        public L1(float l1 = 0.01f)
-        {
-            this.l1 = l1;
-        }
-
-        public Tensor Apply(RegularizerArgs args)
-        {
-            return l1 * math_ops.reduce_sum(math_ops.abs(args.X));
-        }
-    }
-}
diff --git a/src/TensorFlowNET.Keras/Regularizers/L1L2.cs b/src/TensorFlowNET.Keras/Regularizers/L1L2.cs
deleted file mode 100644
index f619f1582..000000000
--- a/src/TensorFlowNET.Keras/Regularizers/L1L2.cs
+++ /dev/null
@@ -1,24 +0,0 @@
-﻿using System;
-using static Tensorflow.Binding;
-namespace Tensorflow.Keras
-{
-    public class L1L2 : IRegularizer
-    {
-        float l1;
-        float l2;
-
-        public L1L2(float l1 = 0.0f, float l2 = 0.0f)
-        {
-            this.l1 = l1;
-            this.l2 = l2;
-
-        }
-        public Tensor Apply(RegularizerArgs args)
-        {
-            Tensor regularization = tf.constant(0.0, args.X.dtype);
-            regularization += l1 * math_ops.reduce_sum(math_ops.abs(args.X));
-            regularization += l2 * math_ops.reduce_sum(math_ops.square(args.X));
-            return regularization;
-        }
-    }
-}
diff --git a/src/TensorFlowNET.Keras/Regularizers/L2.cs b/src/TensorFlowNET.Keras/Regularizers/L2.cs
deleted file mode 100644
index 034bbd236..000000000
--- a/src/TensorFlowNET.Keras/Regularizers/L2.cs
+++ /dev/null
@@ -1,17 +0,0 @@
-﻿namespace Tensorflow.Keras
-{
-    public class L2 : IRegularizer
-    {
-        float l2;
-
-        public L2(float l2 = 0.01f)
-        {
-            this.l2 = l2;
-        }
-
-        public Tensor Apply(RegularizerArgs args)
-        {
-            return l2 * math_ops.reduce_sum(math_ops.square(args.X));
-        }
-    }
-}

From 5f9fce572d07768de9c1386bf29264a345e16c8c Mon Sep 17 00:00:00 2001
From: Schoen Tannenbaum <169845314+SchoenTannenbaum@users.noreply.github.com>
Date: Mon, 20 May 2024 12:10:09 -0400
Subject: [PATCH 24/33] RegularizerAPI and UnitTest

---
 .../Keras/Regularizers/IRegularizer.cs        | 11 ++++-
 .../Operations/Regularizers/L1.cs             |  2 +-
 src/TensorFlowNET.Keras/Regularizers.cs       | 44 +++++++++++++++--
 .../Model/ModelLoadTest.cs                    | 48 +++++++++++++++++++
 4 files changed, 98 insertions(+), 7 deletions(-)

diff --git a/src/TensorFlowNET.Core/Keras/Regularizers/IRegularizer.cs b/src/TensorFlowNET.Core/Keras/Regularizers/IRegularizer.cs
index e5de76ddb..06dbb7c8c 100644
--- a/src/TensorFlowNET.Core/Keras/Regularizers/IRegularizer.cs
+++ b/src/TensorFlowNET.Core/Keras/Regularizers/IRegularizer.cs
@@ -12,5 +12,14 @@ public interface IRegularizer
     [JsonProperty("config")]
     IDictionary<string, object> Config { get; }
     Tensor Apply(RegularizerArgs args);
-    }
+  }
+
+  public interface IRegularizerApi
+  {
+    IRegularizer GetRegularizerFromName(string name);
+    IRegularizer L1 { get; }
+    IRegularizer L2 { get; }
+    IRegularizer L1L2 { get; }
+  }
+
 }
diff --git a/src/TensorFlowNET.Core/Operations/Regularizers/L1.cs b/src/TensorFlowNET.Core/Operations/Regularizers/L1.cs
index 8a5c68895..9e0619454 100644
--- a/src/TensorFlowNET.Core/Operations/Regularizers/L1.cs
+++ b/src/TensorFlowNET.Core/Operations/Regularizers/L1.cs
@@ -9,7 +9,7 @@ public class L1 : IRegularizer
     float _l1;
     private readonly Dictionary<string, object> _config;
 
-    public string ClassName => "L2";
+    public string ClassName => "L1";
     public virtual IDictionary<string, object> Config => _config;
 
     public L1(float l1 = 0.01f)
diff --git a/src/TensorFlowNET.Keras/Regularizers.cs b/src/TensorFlowNET.Keras/Regularizers.cs
index 9c6d07ca6..73b72a051 100644
--- a/src/TensorFlowNET.Keras/Regularizers.cs
+++ b/src/TensorFlowNET.Keras/Regularizers.cs
@@ -1,17 +1,51 @@
-﻿namespace Tensorflow.Keras
+﻿using Tensorflow.Operations.Regularizers;
+
+namespace Tensorflow.Keras
 {
-  public class Regularizers
+  public class Regularizers: IRegularizerApi
   {
+    private static Dictionary<string, IRegularizer> _nameActivationMap;
+
     public IRegularizer l1(float l1 = 0.01f)
-        => new Tensorflow.Operations.Regularizers.L1(l1);
+        => new L1(l1);
     public IRegularizer l2(float l2 = 0.01f)
-        => new Tensorflow.Operations.Regularizers.L2(l2);
+        => new L2(l2);
 
     //From TF source
     //# The default value for l1 and l2 are different from the value in l1_l2
     //# for backward compatibility reason. Eg, L1L2(l2=0.1) will only have l2
     //# and no l1 penalty.
     public IRegularizer l1l2(float l1 = 0.00f, float l2 = 0.00f)
-        => new Tensorflow.Operations.Regularizers.L1L2(l1, l2);
+        => new L1L2(l1, l2);
+
+    static Regularizers()
+    {
+      _nameActivationMap = new Dictionary<string, IRegularizer>();
+      _nameActivationMap["L1"] = new L1();
+      _nameActivationMap["L1"] = new L2();
+      _nameActivationMap["L1"] = new L1L2();
+    }
+
+    public IRegularizer L1 => l1();
+
+    public IRegularizer L2 => l2();
+
+    public IRegularizer L1L2 => l1l2();
+
+    public IRegularizer GetRegularizerFromName(string name)
+    {
+      if (name == null)
+      {
+        throw new Exception($"Regularizer name cannot be null");
+      }
+      if (!_nameActivationMap.TryGetValue(name, out var res))
+      {
+        throw new Exception($"Regularizer {name} not found");
+      }
+      else
+      {
+        return res;
+      }
+    }
   }
 }
diff --git a/test/TensorFlowNET.Keras.UnitTest/Model/ModelLoadTest.cs b/test/TensorFlowNET.Keras.UnitTest/Model/ModelLoadTest.cs
index 53a67cbfa..c733537e7 100644
--- a/test/TensorFlowNET.Keras.UnitTest/Model/ModelLoadTest.cs
+++ b/test/TensorFlowNET.Keras.UnitTest/Model/ModelLoadTest.cs
@@ -1,6 +1,7 @@
 ﻿using Microsoft.VisualStudio.TestPlatform.Utilities;
 using Microsoft.VisualStudio.TestTools.UnitTesting;
 using Newtonsoft.Json.Linq;
+using System.Collections.Generic;
 using System.Linq;
 using System.Xml.Linq;
 using Tensorflow.Keras.Engine;
@@ -129,6 +130,53 @@ public void TestModelBeforeTF2_5()
     }
 
 
+    [TestMethod]
+    public void BiasRegularizerSaveAndLoad()
+    {
+        var savemodel = keras.Sequential(new List<ILayer>()
+            {
+                tf.keras.layers.InputLayer((227, 227, 3)),
+                tf.keras.layers.Conv2D(96, (11, 11), (4, 4), activation:"relu", padding:"valid"),
+                tf.keras.layers.BatchNormalization(),
+                tf.keras.layers.MaxPooling2D((3, 3), strides:(2, 2)),
+
+                tf.keras.layers.Conv2D(256, (5, 5), (1, 1), "same", activation: keras.activations.Relu, bias_regularizer:keras.regularizers.L1L2),
+                tf.keras.layers.BatchNormalization(),
+
+                tf.keras.layers.Conv2D(256, (5, 5), (1, 1), "same", activation: keras.activations.Relu, bias_regularizer:keras.regularizers.L2),
+                tf.keras.layers.BatchNormalization(),
+
+                tf.keras.layers.Conv2D(256, (5, 5), (1, 1), "same", activation: keras.activations.Relu, bias_regularizer:keras.regularizers.L1),
+                tf.keras.layers.BatchNormalization(),
+                tf.keras.layers.MaxPooling2D((3, 3), (2, 2)),
+
+                tf.keras.layers.Flatten(),
+
+                tf.keras.layers.Dense(1000, activation: "linear"),
+                tf.keras.layers.Softmax(1)
+            });
+
+        savemodel.compile(tf.keras.optimizers.Adam(), tf.keras.losses.SparseCategoricalCrossentropy(from_logits: true), new string[] { "accuracy" });
+
+        var num_epochs = 1;
+        var batch_size = 8;
+
+        var trainDataset = new RandomDataSet(new Shape(227, 227, 3), 16);
+
+        savemodel.fit(trainDataset.Data, trainDataset.Labels, batch_size, num_epochs);
+
+        savemodel.save(@"./bias_regularizer_save_and_load", save_format: "tf");
+
+        var loadModel = tf.keras.models.load_model(@"./bias_regularizer_save_and_load");
+        loadModel.summary();
+
+        loadModel.compile(tf.keras.optimizers.Adam(), tf.keras.losses.SparseCategoricalCrossentropy(from_logits: true), new string[] { "accuracy" });
+
+        var fitDataset = new RandomDataSet(new Shape(227, 227, 3), 16);
+
+        loadModel.fit(fitDataset.Data, fitDataset.Labels, batch_size, num_epochs);
+    }
+
 
     [TestMethod]
     public void CreateConcatenateModelSaveAndLoad()

From b3ce158ec3304469bf776bc582b847e685a9df73 Mon Sep 17 00:00:00 2001
From: novikov-alexander <79649566+novikov-alexander@users.noreply.github.com>
Date: Fri, 14 Jun 2024 14:40:06 +0300
Subject: [PATCH 25/33] Update tensor_util.cs

---
 src/TensorFlowNET.Core/Tensors/tensor_util.cs | 40 +++++++++++++------
 1 file changed, 27 insertions(+), 13 deletions(-)

diff --git a/src/TensorFlowNET.Core/Tensors/tensor_util.cs b/src/TensorFlowNET.Core/Tensors/tensor_util.cs
index f688d4d5d..f2003c9d4 100644
--- a/src/TensorFlowNET.Core/Tensors/tensor_util.cs
+++ b/src/TensorFlowNET.Core/Tensors/tensor_util.cs
@@ -1,4 +1,4 @@
-﻿/*****************************************************************************
+/*****************************************************************************
    Copyright 2018 The TensorFlow.NET Authors. All Rights Reserved.
 
    Licensed under the Apache License, Version 2.0 (the "License");
@@ -135,6 +135,23 @@ T[] ExpandArrayToSize<T>(IList<T> src)
             TF_DataType.TF_QINT32
         };
 
+        private static TOut[,] ConvertArray2D<TIn, TOut>(TIn[,] inputArray, Func<TIn, TOut> converter)
+        {
+            var rows = inputArray.GetLength(0);
+            var cols = inputArray.GetLength(1);
+            var outputArray = new TOut[rows, cols];
+
+            for (var i = 0; i < rows; i++)
+            {
+                for (var j = 0; j < cols; j++)
+                {
+                    outputArray[i, j] = converter(inputArray[i, j]);
+                }
+            }
+
+            return outputArray;
+        }
+
         /// <summary>
         /// Create a TensorProto, invoked in graph mode
         /// </summary>
@@ -157,19 +174,16 @@ public static TensorProto make_tensor_proto(object values, TF_DataType dtype = T
             else if(origin_dtype != dtype)
             {
                 var new_system_dtype = dtype.as_system_dtype();
-                if (values is long[] long_values)
-                {
-                    if (dtype == TF_DataType.TF_INT32)
-                        values = long_values.Select(x => (int)Convert.ChangeType(x, new_system_dtype)).ToArray();
-                }
-                else if (values is double[] double_values)
+                
+                values = values switch
                 {
-                    if (dtype == TF_DataType.TF_FLOAT)
-                        values = double_values.Select(x => (float)Convert.ChangeType(x, new_system_dtype)).ToArray();
-                }
-                else
-                    values = Convert.ChangeType(values, new_system_dtype);
-
+                    long[] longValues when dtype == TF_DataType.TF_INT32 => longValues.Select(x => (int)x).ToArray(),
+                    float[] floatValues when dtype == TF_DataType.TF_DOUBLE => floatValues.Select(x => (double)x).ToArray(),
+                    float[,] float2DValues when dtype == TF_DataType.TF_DOUBLE => ConvertArray2D(float2DValues, Convert.ToDouble),
+                    double[] doubleValues when dtype == TF_DataType.TF_FLOAT => doubleValues.Select(x => (float)x).ToArray(),
+                    double[,] double2DValues when dtype == TF_DataType.TF_DOUBLE => ConvertArray2D(double2DValues, Convert.ToSingle),
+                    _ => Convert.ChangeType(values, new_system_dtype),
+                };
                 dtype = values.GetDataType();
             }
 

From 18db147eb40a07931e8421bbd63c64ce11edd558 Mon Sep 17 00:00:00 2001
From: novikov-alexander <79649566+novikov-alexander@users.noreply.github.com>
Date: Fri, 14 Jun 2024 14:40:37 +0300
Subject: [PATCH 26/33] Update GradientDescentOptimizerTests.cs

---
 .../Training/GradientDescentOptimizerTests.cs                 | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/test/TensorFlowNET.UnitTest/Training/GradientDescentOptimizerTests.cs b/test/TensorFlowNET.UnitTest/Training/GradientDescentOptimizerTests.cs
index f7062f00d..3b53ff9cd 100644
--- a/test/TensorFlowNET.UnitTest/Training/GradientDescentOptimizerTests.cs
+++ b/test/TensorFlowNET.UnitTest/Training/GradientDescentOptimizerTests.cs
@@ -1,4 +1,4 @@
-﻿using Microsoft.VisualStudio.TestTools.UnitTesting;
+using Microsoft.VisualStudio.TestTools.UnitTesting;
 using System;
 using System.Linq;
 using Tensorflow;
@@ -82,7 +82,7 @@ private void TestMinimizeResourceVariable<T>() where T : struct
 
                 var pred = math_ops.matmul(var0, x) + var1;
                 var loss = pred * pred;
-                var sgd_op = tf.train.GradientDescentOptimizer(3.0f).minimize(loss);
+                var sgd_op = tf.train.GradientDescentOptimizer(1.0f).minimize(loss);
 
                 var global_variables = tf.global_variables_initializer();
                 sess.run(global_variables);

From 483ac82cd2db273c2c0520ce6923f5951638daba Mon Sep 17 00:00:00 2001
From: novikov-alexander <79649566+novikov-alexander@users.noreply.github.com>
Date: Fri, 14 Jun 2024 15:02:17 +0300
Subject: [PATCH 27/33] Update tensor_util.cs

---
 src/TensorFlowNET.Core/Tensors/tensor_util.cs | 7 ++++++-
 1 file changed, 6 insertions(+), 1 deletion(-)

diff --git a/src/TensorFlowNET.Core/Tensors/tensor_util.cs b/src/TensorFlowNET.Core/Tensors/tensor_util.cs
index f2003c9d4..873579e42 100644
--- a/src/TensorFlowNET.Core/Tensors/tensor_util.cs
+++ b/src/TensorFlowNET.Core/Tensors/tensor_util.cs
@@ -178,10 +178,15 @@ public static TensorProto make_tensor_proto(object values, TF_DataType dtype = T
                 values = values switch
                 {
                     long[] longValues when dtype == TF_DataType.TF_INT32 => longValues.Select(x => (int)x).ToArray(),
+                    long[] longValues => values,
                     float[] floatValues when dtype == TF_DataType.TF_DOUBLE => floatValues.Select(x => (double)x).ToArray(),
+                    float[] floatValues => values,
                     float[,] float2DValues when dtype == TF_DataType.TF_DOUBLE => ConvertArray2D(float2DValues, Convert.ToDouble),
+                    float[,] float2DValues => values,
                     double[] doubleValues when dtype == TF_DataType.TF_FLOAT => doubleValues.Select(x => (float)x).ToArray(),
-                    double[,] double2DValues when dtype == TF_DataType.TF_DOUBLE => ConvertArray2D(double2DValues, Convert.ToSingle),
+                    double[] doubleValues => values,
+                    double[,] double2DValues when dtype == TF_DataType.TF_FLOAT => ConvertArray2D(double2DValues, Convert.ToSingle),
+                    double[,] double2DValues => values,
                     _ => Convert.ChangeType(values, new_system_dtype),
                 };
                 dtype = values.GetDataType();

From def57745b66d0537cdb70251584c940f327cd929 Mon Sep 17 00:00:00 2001
From: Alexander Novikov <novikov_alexander@live.ru>
Date: Wed, 19 Jun 2024 12:30:38 +0300
Subject: [PATCH 28/33] fix: more generic array cast

---
 src/TensorFlowNET.Core/Tensors/tensor_util.cs | 88 +++++++++++++------
 1 file changed, 59 insertions(+), 29 deletions(-)

diff --git a/src/TensorFlowNET.Core/Tensors/tensor_util.cs b/src/TensorFlowNET.Core/Tensors/tensor_util.cs
index 873579e42..6e5024efd 100644
--- a/src/TensorFlowNET.Core/Tensors/tensor_util.cs
+++ b/src/TensorFlowNET.Core/Tensors/tensor_util.cs
@@ -67,7 +67,7 @@ public static NDArray MakeNdarray(TensorProto tensor)
 
             T[] ExpandArrayToSize<T>(IList<T> src)
             {
-                if(src.Count == 0)
+                if (src.Count == 0)
                 {
                     return new T[0];
                 }
@@ -77,7 +77,7 @@ T[] ExpandArrayToSize<T>(IList<T> src)
                 var first_elem = src[0];
                 var last_elem = src[src.Count - 1];
                 T[] res = new T[num_elements];
-                for(long i = 0; i < num_elements; i++)
+                for (long i = 0; i < num_elements; i++)
                 {
                     if (i < pre) res[i] = first_elem;
                     else if (i >= num_elements - after) res[i] = last_elem;
@@ -121,7 +121,7 @@ T[] ExpandArrayToSize<T>(IList<T> src)
                     $"https://www.tensorflow.org/api_docs/python/tf/dtypes for supported TF dtypes.");
             }
 
-            if(values.size == 0)
+            if (values.size == 0)
             {
                 return np.zeros(shape, tensor_dtype);
             }
@@ -135,23 +135,47 @@ T[] ExpandArrayToSize<T>(IList<T> src)
             TF_DataType.TF_QINT32
         };
 
-        private static TOut[,] ConvertArray2D<TIn, TOut>(TIn[,] inputArray, Func<TIn, TOut> converter)
+        private static Array ConvertArray<TOut>(Array inputArray, Func<object, TOut> converter)
         {
-            var rows = inputArray.GetLength(0);
-            var cols = inputArray.GetLength(1);
-            var outputArray = new TOut[rows, cols];
+            if (inputArray == null)
+                throw new ArgumentNullException(nameof(inputArray));
 
-            for (var i = 0; i < rows; i++)
+            var elementType = typeof(TOut);
+            var lengths = new int[inputArray.Rank];
+            for (var i = 0; i < inputArray.Rank; i++)
             {
-                for (var j = 0; j < cols; j++)
-                {
-                    outputArray[i, j] = converter(inputArray[i, j]);
-                }
+                lengths[i] = inputArray.GetLength(i);
             }
 
+            var outputArray = Array.CreateInstance(elementType, lengths);
+
+            FillArray(inputArray, outputArray, converter, new int[inputArray.Rank], 0);
+
             return outputArray;
         }
 
+        private static void FillArray<TIn, TOut>(Array inputArray, Array outputArray, Func<TIn, TOut> converter, int[] indices, int dimension)
+        {
+            if (dimension == inputArray.Rank - 1)
+            {
+                for (int i = 0; i < inputArray.GetLength(dimension); i++)
+                {
+                    indices[dimension] = i;
+                    var inputValue = (TIn)inputArray.GetValue(indices);
+                    var convertedValue = converter(inputValue);
+                    outputArray.SetValue(convertedValue, indices);
+                }
+            }
+            else
+            {
+                for (int i = 0; i < inputArray.GetLength(dimension); i++)
+                {
+                    indices[dimension] = i;
+                    FillArray(inputArray, outputArray, converter, indices, dimension + 1);
+                }
+            }
+        }
+
         /// <summary>
         /// Create a TensorProto, invoked in graph mode
         /// </summary>
@@ -171,24 +195,30 @@ public static TensorProto make_tensor_proto(object values, TF_DataType dtype = T
             var origin_dtype = values.GetDataType();
             if (dtype == TF_DataType.DtInvalid)
                 dtype = origin_dtype;
-            else if(origin_dtype != dtype)
+            else if (origin_dtype != dtype)
             {
                 var new_system_dtype = dtype.as_system_dtype();
-                
-                values = values switch
+
+                if (dtype != TF_DataType.TF_STRING && dtype != TF_DataType.TF_VARIANT && dtype != TF_DataType.TF_RESOURCE)
+                {
+                    if (values is Array arrayValues)
+                    {
+                        values = dtype switch
+                        {
+                            TF_DataType.TF_INT32 => ConvertArray(arrayValues, Convert.ToInt32),
+                            TF_DataType.TF_FLOAT => ConvertArray(arrayValues, Convert.ToSingle),
+                            TF_DataType.TF_DOUBLE => ConvertArray(arrayValues, Convert.ToDouble),
+                            _ => values,
+                        };
+                    } else
+                    {
+                        values = Convert.ChangeType(values, new_system_dtype);
+                    }
+                    
+                } else
                 {
-                    long[] longValues when dtype == TF_DataType.TF_INT32 => longValues.Select(x => (int)x).ToArray(),
-                    long[] longValues => values,
-                    float[] floatValues when dtype == TF_DataType.TF_DOUBLE => floatValues.Select(x => (double)x).ToArray(),
-                    float[] floatValues => values,
-                    float[,] float2DValues when dtype == TF_DataType.TF_DOUBLE => ConvertArray2D(float2DValues, Convert.ToDouble),
-                    float[,] float2DValues => values,
-                    double[] doubleValues when dtype == TF_DataType.TF_FLOAT => doubleValues.Select(x => (float)x).ToArray(),
-                    double[] doubleValues => values,
-                    double[,] double2DValues when dtype == TF_DataType.TF_FLOAT => ConvertArray2D(double2DValues, Convert.ToSingle),
-                    double[,] double2DValues => values,
-                    _ => Convert.ChangeType(values, new_system_dtype),
-                };
+
+                }
                 dtype = values.GetDataType();
             }
 
@@ -306,7 +336,7 @@ bool hasattr(Graph property, string attr)
 
             if (tensor is EagerTensor eagerTensor)
             {
-                if(tensor.dtype == tf.int64)
+                if (tensor.dtype == tf.int64)
                     return new Shape(tensor.ToArray<long>());
                 else
                     return new Shape(tensor.ToArray<int>());
@@ -481,7 +511,7 @@ bool hasattr(Graph property, string attr)
                 var d_ = new int[value.size];
                 foreach (var (index, d) in enumerate(value.ToArray<int>()))
                     d_[index] = d >= 0 ? d : -1;
-                
+
                 ret = ret.merge_with(new Shape(d_));
             }
             return ret;

From 5142ad658cf9233abd2c9fe727c2daeea84a88f6 Mon Sep 17 00:00:00 2001
From: Aleksej Solomatin <aleksejsolomatin@gmail.com>
Date: Sun, 30 Jun 2024 22:06:12 +0300
Subject: [PATCH 29/33] test: Added an `evaluate` method call to a unit test
 for a multi-input model.

---
 test/TensorFlowNET.Keras.UnitTest/MultiInputModelTest.cs | 7 +++++++
 1 file changed, 7 insertions(+)

diff --git a/test/TensorFlowNET.Keras.UnitTest/MultiInputModelTest.cs b/test/TensorFlowNET.Keras.UnitTest/MultiInputModelTest.cs
index dd8ef8f91..bb293bd90 100644
--- a/test/TensorFlowNET.Keras.UnitTest/MultiInputModelTest.cs
+++ b/test/TensorFlowNET.Keras.UnitTest/MultiInputModelTest.cs
@@ -54,6 +54,13 @@ public void LeNetModel()
             var x = new NDArray[] { x1, x2 };
             model.fit(x, dataset.Train.Labels, batch_size: 8, epochs: 3);
 
+            x1 = x1["0:8"];
+            x2 = x1;
+
+            x = new NDArray[] { x1, x2 };
+            var y = dataset.Train.Labels["0:8"];
+            (model as Engine.Model).evaluate(x, y);
+
             x1 = np.ones((1, 28, 28, 1), TF_DataType.TF_FLOAT);
             x2 = np.zeros((1, 28, 28, 1), TF_DataType.TF_FLOAT);
             var pred = model.predict((x1, x2));

From f8b7bdeb9b7fa10bf49b888934683f04febfc6e2 Mon Sep 17 00:00:00 2001
From: Aleksej Solomatin <aleksejsolomatin@gmail.com>
Date: Sun, 30 Jun 2024 22:43:01 +0300
Subject: [PATCH 30/33] test: Added a unit test of training a multi-input model
 using a dataset.

---
 .../MultiInputModelTest.cs                    | 75 +++++++++++++++++++
 1 file changed, 75 insertions(+)

diff --git a/test/TensorFlowNET.Keras.UnitTest/MultiInputModelTest.cs b/test/TensorFlowNET.Keras.UnitTest/MultiInputModelTest.cs
index bb293bd90..54b76d41a 100644
--- a/test/TensorFlowNET.Keras.UnitTest/MultiInputModelTest.cs
+++ b/test/TensorFlowNET.Keras.UnitTest/MultiInputModelTest.cs
@@ -2,6 +2,7 @@
 using System;
 using Tensorflow.Keras.Optimizers;
 using Tensorflow.NumPy;
+using static Tensorflow.Binding;
 using static Tensorflow.KerasApi;
 
 namespace Tensorflow.Keras.UnitTest
@@ -66,5 +67,79 @@ public void LeNetModel()
             var pred = model.predict((x1, x2));
             Console.WriteLine(pred);
         }
+
+        [TestMethod]
+        public void LeNetModelDataset()
+        {
+            var inputs = keras.Input((28, 28, 1));
+            var conv1 = keras.layers.Conv2D(16, (3, 3), activation: "relu", padding: "same").Apply(inputs);
+            var pool1 = keras.layers.MaxPooling2D((2, 2), 2).Apply(conv1);
+            var conv2 = keras.layers.Conv2D(32, (3, 3), activation: "relu", padding: "same").Apply(pool1);
+            var pool2 = keras.layers.MaxPooling2D((2, 2), 2).Apply(conv2);
+            var flat1 = keras.layers.Flatten().Apply(pool2);
+
+            var inputs_2 = keras.Input((28, 28, 1));
+            var conv1_2 = keras.layers.Conv2D(16, (3, 3), activation: "relu", padding: "same").Apply(inputs_2);
+            var pool1_2 = keras.layers.MaxPooling2D((4, 4), 4).Apply(conv1_2);
+            var conv2_2 = keras.layers.Conv2D(32, (1, 1), activation: "relu", padding: "same").Apply(pool1_2);
+            var pool2_2 = keras.layers.MaxPooling2D((2, 2), 2).Apply(conv2_2);
+            var flat1_2 = keras.layers.Flatten().Apply(pool2_2);
+
+            var concat = keras.layers.Concatenate().Apply((flat1, flat1_2));
+            var dense1 = keras.layers.Dense(512, activation: "relu").Apply(concat);
+            var dense2 = keras.layers.Dense(128, activation: "relu").Apply(dense1);
+            var dense3 = keras.layers.Dense(10, activation: "relu").Apply(dense2);
+            var output = keras.layers.Softmax(-1).Apply(dense3);
+
+            var model = keras.Model((inputs, inputs_2), output);
+            model.summary();
+
+            var data_loader = new MnistModelLoader();
+
+            var dataset = data_loader.LoadAsync(new ModelLoadSetting
+            {
+                TrainDir = "mnist",
+                OneHot = false,
+                ValidationSize = 59900,
+            }).Result;
+
+            var loss = keras.losses.SparseCategoricalCrossentropy();
+            var optimizer = new Adam(0.001f);
+            model.compile(optimizer, loss, new string[] { "accuracy" });
+
+            NDArray x1 = np.reshape(dataset.Train.Data, (dataset.Train.Data.shape[0], 28, 28, 1));
+
+            var multiInputDataset = tf.data.Dataset.zip(
+                tf.data.Dataset.from_tensor_slices(x1),
+                tf.data.Dataset.from_tensor_slices(x1),
+                tf.data.Dataset.from_tensor_slices(dataset.Train.Labels)
+            ).batch(8);
+            multiInputDataset.FirstInputTensorCount = 2;
+
+            model.fit(multiInputDataset, epochs: 3);
+
+            x1 = x1["0:8"];
+
+            multiInputDataset = tf.data.Dataset.zip(
+                tf.data.Dataset.from_tensor_slices(x1),
+                tf.data.Dataset.from_tensor_slices(x1),
+                tf.data.Dataset.from_tensor_slices(dataset.Train.Labels["0:8"])
+            ).batch(8);
+            multiInputDataset.FirstInputTensorCount = 2;
+
+            (model as Engine.Model).evaluate(multiInputDataset);
+
+            x1 = np.ones((1, 28, 28, 1), TF_DataType.TF_FLOAT);
+            var x2 = np.zeros((1, 28, 28, 1), TF_DataType.TF_FLOAT);
+
+            multiInputDataset = tf.data.Dataset.zip(
+                tf.data.Dataset.from_tensor_slices(x1),
+                tf.data.Dataset.from_tensor_slices(x2)
+            ).batch(8);
+            multiInputDataset.FirstInputTensorCount = 2;
+
+            var pred = model.predict(multiInputDataset);
+            Console.WriteLine(pred);
+        }
     }
 }

From 93dda17944b6e34380897ad3480ac2218fb7398e Mon Sep 17 00:00:00 2001
From: Aleksej Solomatin <aleksejsolomatin@gmail.com>
Date: Sun, 30 Jun 2024 22:44:03 +0300
Subject: [PATCH 31/33] fix: Added support for training a multi-input model
 using a dataset.

---
 src/TensorFlowNET.Keras/Engine/Model.Evaluate.cs | 14 +++++++++++++-
 src/TensorFlowNET.Keras/Engine/Model.Fit.cs      | 13 ++++++++++++-
 2 files changed, 25 insertions(+), 2 deletions(-)

diff --git a/src/TensorFlowNET.Keras/Engine/Model.Evaluate.cs b/src/TensorFlowNET.Keras/Engine/Model.Evaluate.cs
index b3264429e..ec99d7ef9 100644
--- a/src/TensorFlowNET.Keras/Engine/Model.Evaluate.cs
+++ b/src/TensorFlowNET.Keras/Engine/Model.Evaluate.cs
@@ -112,7 +112,19 @@ public Dictionary<string, float> evaluate(IDatasetV2 x, int verbose = 1, bool is
                 Steps = data_handler.Inferredsteps
             });
 
-            return evaluate(data_handler, callbacks, is_val, test_function);
+            Func<DataHandler, OwnedIterator, Dictionary<string, float>> testFunction;
+
+            if (data_handler.DataAdapter.GetDataset().structure.Length > 2 ||
+                data_handler.DataAdapter.GetDataset().FirstInputTensorCount > 1)
+            {
+                testFunction = test_step_multi_inputs_function;
+            }
+            else
+            {
+                testFunction = test_function;
+            }
+
+            return evaluate(data_handler, callbacks, is_val, testFunction);
         }
 
         /// <summary>
diff --git a/src/TensorFlowNET.Keras/Engine/Model.Fit.cs b/src/TensorFlowNET.Keras/Engine/Model.Fit.cs
index 13a1b63bc..e1303513e 100644
--- a/src/TensorFlowNET.Keras/Engine/Model.Fit.cs
+++ b/src/TensorFlowNET.Keras/Engine/Model.Fit.cs
@@ -179,9 +179,20 @@ public ICallback fit(IDatasetV2 dataset,
                 StepsPerExecution = _steps_per_execution
             });
 
+            Func<DataHandler, OwnedIterator, Dictionary<string, float>> trainStepFunction;
+
+            if (data_handler.DataAdapter.GetDataset().structure.Length > 2 ||
+                data_handler.DataAdapter.GetDataset().FirstInputTensorCount > 1)
+            {
+                trainStepFunction = train_step_multi_inputs_function;
+            }
+            else
+            {
+                trainStepFunction = train_step_function;
+            }
 
             return FitInternal(data_handler, epochs, validation_step, verbose, callbacks, validation_data: validation_data,
-                    train_step_func: train_step_function);
+                    train_step_func: trainStepFunction);
         }
 
         History FitInternal(DataHandler data_handler, int epochs, int validation_step, int verbose, List<ICallback> callbackList, IDatasetV2 validation_data, 

From b6c5d26fab9a5eab72c0c81c554fec8412d86771 Mon Sep 17 00:00:00 2001
From: Leonardo Doherty <73901464+eLDoherty@users.noreply.github.com>
Date: Mon, 13 Jan 2025 23:29:04 -0500
Subject: [PATCH 32/33] fix: Resolve fixed-size array issue

Replace .ToArray() with .ToList() to allow dynamic modification of network_nodes in MapGraphNetwork()

Replaced .ToArray() with .ToList() to resolve the issue where .Add() was called on a fixed-size array.

This preventing the "Collection was of a fixed size" error when called something like this var model = keras.Model(new Tensors(new Tensor[] { encoder_inputs, decoder_inputs }), outputs: decoder_dense);
---
 src/TensorFlowNET.Keras/Engine/Functional.cs | 10 +++++-----
 1 file changed, 5 insertions(+), 5 deletions(-)

diff --git a/src/TensorFlowNET.Keras/Engine/Functional.cs b/src/TensorFlowNET.Keras/Engine/Functional.cs
index 7347585f8..75854d82c 100644
--- a/src/TensorFlowNET.Keras/Engine/Functional.cs
+++ b/src/TensorFlowNET.Keras/Engine/Functional.cs
@@ -180,7 +180,7 @@ void ComputeTensorUsageCount()
             var (nodes_in_decreasing_depth, layer_indices) = BuildMap(outputs);
             var network_nodes = nodes_in_decreasing_depth
                 .Select(node => MakeNodeKey(node.Layer.Name, node.Layer.InboundNodes.IndexOf(node)))
-                .ToArray();
+                .ToList();
 
             var nodes_depths = new Dictionary<INode, int>();
             var layers_depths = new Dictionary<ILayer, int>();
@@ -221,7 +221,7 @@ void ComputeTensorUsageCount()
                     layers_depths[input_layer] = 0;
                     layer_indices[input_layer] = -1;
                     nodes_depths[input_layer.InboundNodes[0]] = 0;
-                    network_nodes.add(MakeNodeKey(input_layer.Name, 0));
+                    network_nodes.Add(MakeNodeKey(input_layer.Name, 0));
                 }
             }
 
@@ -231,7 +231,7 @@ void ComputeTensorUsageCount()
             {
                 if (!nodes_by_depth.ContainsKey(depth))
                     nodes_by_depth[depth] = new List<INode>();
-                nodes_by_depth[depth].append(node);
+                nodes_by_depth[depth].Add(node);
             }
 
             var layers_by_depth = new Dictionary<int, List<ILayer>>();
@@ -239,7 +239,7 @@ void ComputeTensorUsageCount()
             {
                 if (!layers_by_depth.ContainsKey(depth))
                     layers_by_depth[depth] = new List<ILayer>();
-                layers_by_depth[depth].append(layer);
+                layers_by_depth[depth].Add(layer);
             }
 
             // Get sorted list of layer depths.
@@ -260,7 +260,7 @@ void ComputeTensorUsageCount()
             // Get sorted list of node depths.
             depth_keys = nodes_by_depth.Keys.OrderBy(x => x).Reverse();
 
-            return (network_nodes, nodes_by_depth, layers, layers_by_depth);
+            return (network_nodes.ToArray(), nodes_by_depth, layers, layers_by_depth);
         }
 
         string MakeNodeKey(string layer_name, int node_index)

From 6ce6066551ce80202119a121a05b006aadd9ef37 Mon Sep 17 00:00:00 2001
From: Haiping <haiping008@gmail.com>
Date: Wed, 22 Jan 2025 09:46:45 -0600
Subject: [PATCH 33/33] Update release.yml

---
 .github/workflows/release.yml | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/.github/workflows/release.yml b/.github/workflows/release.yml
index 8f862e329..02601764c 100644
--- a/.github/workflows/release.yml
+++ b/.github/workflows/release.yml
@@ -53,7 +53,7 @@ jobs:
         }
 
     - name: Upload packages artifacts
-      uses: actions/upload-artifact@v1.0.0
+      uses: actions/upload-artifact@v4.0.0
       with:
         name: "drop-ci-packages"
         path: './packages'