
Commit a7e494e

Merge pull request #44 from Sergio0694/feature_improved-serialization

Feature improved serialization

2 parents 1785522 + 024f45f, commit a7e494e

37 files changed: +948 / -929 lines
Lines changed: 38 additions & 0 deletions (new file)

@@ -0,0 +1,38 @@
+using JetBrains.Annotations;
+using NeuralNetworkNET.APIs.Delegates;
+using NeuralNetworkNET.APIs.Enums;
+using NeuralNetworkNET.APIs.Interfaces;
+using NeuralNetworkNET.Cuda.Layers;
+using System.IO;
+
+namespace NeuralNetworkNET.APIs
+{
+    /// <summary>
+    /// A static class that exposes a single deserialization method that can be used to load a saved network using the cuDNN layers
+    /// </summary>
+    public static class CuDnnNetworkLayersDeserializer
+    {
+        /// <summary>
+        /// Gets the <see cref="LayerDeserializer"/> instance to load cuDNN network layers
+        /// </summary>
+        [PublicAPI]
+        public static LayerDeserializer Deserializer { get; } = Deserialize;
+
+        /// <summary>
+        /// Deserializes a layer of the given type from the input <see cref="Stream"/>
+        /// </summary>
+        /// <param name="stream">The <see cref="Stream"/> to use to load the layer data</param>
+        /// <param name="type">The type of network layer to return</param>
+        private static INetworkLayer Deserialize([NotNull] Stream stream, LayerType type)
+        {
+            switch (type)
+            {
+                case LayerType.FullyConnected: return CuDnnFullyConnectedLayer.Deserialize(stream);
+                case LayerType.Convolutional: return CuDnnConvolutionalLayer.Deserialize(stream);
+                case LayerType.Pooling: return CuDnnPoolingLayer.Deserialize(stream);
+                case LayerType.Softmax: return CuDnnSoftmaxLayer.Deserialize(stream);
+                default: return null;
+            }
+        }
+    }
+}
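
The new Deserializer property is a ready-made LayerDeserializer that maps each supported LayerType to its cuDNN implementation. A minimal usage sketch follows, invoking the delegate directly on a stream that is assumed to be positioned at the start of a serialized convolutional layer; the wrapper class and method names are illustrative only.

using System.IO;
using NeuralNetworkNET.APIs;
using NeuralNetworkNET.APIs.Enums;
using NeuralNetworkNET.APIs.Interfaces;

static class DeserializerUsageSketch
{
    static INetworkLayer LoadConvolutionalLayer(Stream stream)
    {
        // The delegate returns null both for unsupported layer types and
        // when the stream does not contain valid data for the requested type.
        return CuDnnNetworkLayersDeserializer.Deserializer(stream, LayerType.Convolutional);
    }
}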

NeuralNetwork.NET.Cuda/Layers/CuDnnConvolutionalLayer.cs

Lines changed: 26 additions & 3 deletions
@@ -67,7 +67,7 @@ public CuDnnConvolutionalLayer(
 
         public CuDnnConvolutionalLayer(
             in TensorInfo input, in ConvolutionInfo operation, TensorInfo kernels, TensorInfo output,
-            [NotNull] float[,] weights, [NotNull] float[] biases, ActivationFunctionType activation)
+            [NotNull] float[] weights, [NotNull] float[] biases, ActivationFunctionType activation)
             : base(input, operation, kernels, output, weights, biases, activation)
             => SetupCuDnnInfo();
 

@@ -78,7 +78,7 @@ public override unsafe void Forward(in Tensor x, out Tensor z, out Tensor a)
         {
             fixed (float* pw = Weights)
             {
-                Tensor.Fix(pw, OutputInfo.Channels, KernelInfo.Size, out Tensor wTensor);
+                Tensor.Reshape(pw, OutputInfo.Channels, KernelInfo.Size, out Tensor wTensor);
                 using (DeviceMemory<float> z_gpu = DnnInstance.Gpu.AllocateDevice<float>(x.Entities * OutputInfo.Size))
                 {
                     // Tensors info setup

@@ -119,7 +119,7 @@ public override unsafe void Backpropagate(in Tensor delta_1, in Tensor z, Activa
         {
             fixed (float* pw = Weights)
             {
-                Tensor.Fix(pw, OutputInfo.Channels, KernelInfo.Size, out Tensor wTensor);
+                Tensor.Reshape(pw, OutputInfo.Channels, KernelInfo.Size, out Tensor wTensor);
                 DnnInstance.GetConvolutionBackwardDataAlgorithm(FilterDescription, OutputDescription, ConvolutionDescription, InputDescription, ConvolutionBwdDataPreference.PREFER_FASTEST, IntPtr.Zero, out ConvolutionBwdDataAlgo algorithm);
                 DnnInstance.GetConvolutionBackwardDataWorkspaceSize(FilterDescription, OutputDescription, ConvolutionDescription, InputDescription, algorithm, out IntPtr size);
                 using (DeviceMemory<float> delta_gpu = DnnInstance.Gpu.AllocateDevice<float>(z.Size))

@@ -173,7 +173,30 @@ public override void ComputeGradient(in Tensor a, in Tensor delta, out Tensor dJ
 
         #endregion
 
+        #region Misc
+
         /// <inheritdoc/>
         public override INetworkLayer Clone() => new CuDnnConvolutionalLayer(InputInfo, OperationInfo, KernelInfo, OutputInfo, Weights.BlockCopy(), Biases.BlockCopy(), ActivationFunctionType);
+
+        /// <summary>
+        /// Tries to deserialize a new <see cref="CuDnnConvolutionalLayer"/> from the input <see cref="System.IO.Stream"/>
+        /// </summary>
+        /// <param name="stream">The input <see cref="System.IO.Stream"/> to use to read the layer data</param>
+        [MustUseReturnValue, CanBeNull]
+        public new static INetworkLayer Deserialize([NotNull] System.IO.Stream stream)
+        {
+            if (!stream.TryRead(out TensorInfo input)) return null;
+            if (!stream.TryRead(out TensorInfo output)) return null;
+            if (!stream.TryRead(out ActivationFunctionType activation)) return null;
+            if (!stream.TryRead(out int wLength)) return null;
+            float[] weights = stream.ReadUnshuffled(wLength);
+            if (!stream.TryRead(out int bLength)) return null;
+            float[] biases = stream.ReadUnshuffled(bLength);
+            if (!stream.TryRead(out ConvolutionInfo operation)) return null;
+            if (!stream.TryRead(out TensorInfo kernels)) return null;
+            return new CuDnnConvolutionalLayer(input, operation, kernels, output, weights, biases, activation);
+        }
+
+        #endregion
     }
 }
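
The Deserialize method above relies on a TryRead stream extension that is not part of this diff. As a rough, self-contained sketch of what such a helper can look like for blittable value types (the name, constraint and behavior below are assumptions, not the repository's actual extension):

using System.IO;
using System.Runtime.CompilerServices;
using System.Runtime.InteropServices;

public static class StreamReadSketch
{
    // Reads a single unmanaged value (a TensorInfo, an enum, an int, ...) from the
    // stream, returning false if the stream ends before enough bytes are available.
    public static bool TryRead<T>(this Stream stream, out T value) where T : unmanaged
    {
        byte[] buffer = new byte[Unsafe.SizeOf<T>()];
        int total = 0;
        while (total < buffer.Length)
        {
            int read = stream.Read(buffer, total, buffer.Length - total);
            if (read == 0)
            {
                value = default;
                return false;
            }
            total += read;
        }
        value = MemoryMarshal.Read<T>(buffer);
        return true;
    }
}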

NeuralNetwork.NET.Cuda/Layers/CuDnnFullyConnectedLayer.cs

Lines changed: 28 additions & 6 deletions
@@ -9,6 +9,7 @@
 using NeuralNetworkNET.Networks.Implementations.Layers;
 using NeuralNetworkNET.APIs.Structs;
 using NeuralNetworkNET.APIs.Enums;
+using NeuralNetworkNET.APIs.Interfaces;
 
 namespace NeuralNetworkNET.Cuda.Layers
 {

@@ -20,18 +21,20 @@ internal class CuDnnFullyConnectedLayer : FullyConnectedLayer
         [NotNull]
         private readonly Dnn DnnInstance = DnnService.Instance;
 
-        public CuDnnFullyConnectedLayer(in TensorInfo input, int outputs, ActivationFunctionType activation, WeightsInitializationMode weightsMode, BiasInitializationMode biasMode)
-            : base(input, outputs, activation, weightsMode, biasMode) { }
+        public CuDnnFullyConnectedLayer(in TensorInfo input, int neurons, ActivationFunctionType activation, WeightsInitializationMode weightsMode, BiasInitializationMode biasMode)
+            : base(input, neurons, activation, weightsMode, biasMode) { }
 
-        public CuDnnFullyConnectedLayer([NotNull] float[,] weights, [NotNull] float[] biases, ActivationFunctionType activation)
-            : base(weights, biases, activation) { }
+        public CuDnnFullyConnectedLayer(in TensorInfo input, int neurons, [NotNull] float[] weights, [NotNull] float[] biases, ActivationFunctionType activation)
+            : base(input, neurons, weights, biases, activation) { }
+
+        #region Implementation
 
         /// <inheritdoc/>
         public override unsafe void Forward(in Tensor x, out Tensor z, out Tensor a)
         {
             fixed (float* pw = Weights)
             {
-                Tensor.Fix(pw, InputInfo.Size, OutputInfo.Size, out Tensor wTensor);
+                Tensor.Reshape(pw, InputInfo.Size, OutputInfo.Size, out Tensor wTensor);
                 using (DeviceMemory<float>
                     x_gpu = DnnInstance.Gpu.AllocateDevice(x),
                     w_gpu = DnnInstance.Gpu.AllocateDevice(wTensor),

@@ -51,7 +54,7 @@ public override unsafe void Backpropagate(in Tensor delta_1, in Tensor z, Activa
         {
             fixed (float* pw = Weights)
             {
-                Tensor.Fix(pw, InputInfo.Size, OutputInfo.Size, out Tensor wTensor);
+                Tensor.Reshape(pw, InputInfo.Size, OutputInfo.Size, out Tensor wTensor);
                 using (DeviceMemory<float>
                     delta_1_gpu = DnnInstance.Gpu.AllocateDevice(delta_1),
                     w_gpu = DnnInstance.Gpu.AllocateDevice(wTensor),

@@ -76,5 +79,24 @@ public override void ComputeGradient(in Tensor a, in Tensor delta, out Tensor dJ
             }
             delta.CompressVertically(out dJdb); // Doing this on CPU is generally faster than launching the kernels
         }
+
+        #endregion
+
+        /// <summary>
+        /// Tries to deserialize a new <see cref="CuDnnFullyConnectedLayer"/> from the input <see cref="System.IO.Stream"/>
+        /// </summary>
+        /// <param name="stream">The input <see cref="System.IO.Stream"/> to use to read the layer data</param>
+        [MustUseReturnValue, CanBeNull]
+        public new static INetworkLayer Deserialize([NotNull] System.IO.Stream stream)
+        {
+            if (!stream.TryRead(out TensorInfo input)) return null;
+            if (!stream.TryRead(out TensorInfo output)) return null;
+            if (!stream.TryRead(out ActivationFunctionType activation)) return null;
+            if (!stream.TryRead(out int wLength)) return null;
+            float[] weights = stream.ReadUnshuffled(wLength);
+            if (!stream.TryRead(out int bLength)) return null;
+            float[] biases = stream.ReadUnshuffled(bLength);
+            return new CuDnnFullyConnectedLayer(input, output.Size, weights, biases, activation);
+        }
     }
 }
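
ReadUnshuffled, used above to rebuild the weight and bias arrays, is likewise an existing extension not shown in this diff; judging by its name it also undoes a shuffled byte layout applied at write time, which the plain-reading sketch below deliberately ignores. Illustration only, not the repository's actual helper:

using System;
using System.IO;

public static class FloatArrayReadSketch
{
    // Reads 'length' floats from the stream as one contiguous block of raw bytes.
    public static float[] ReadFloats(this Stream stream, int length)
    {
        byte[] raw = new byte[sizeof(float) * length];
        int total = 0;
        while (total < raw.Length)
        {
            int read = stream.Read(raw, total, raw.Length - total);
            if (read == 0) throw new EndOfStreamException("Not enough data for the requested array");
            total += read;
        }
        float[] result = new float[length];
        Buffer.BlockCopy(raw, 0, result, 0, raw.Length);
        return result;
    }
}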

NeuralNetwork.NET.Cuda/Layers/CuDnnPoolingLayer.cs

Lines changed: 14 additions & 0 deletions
@@ -70,5 +70,19 @@ public override void Forward(in Tensor x, out Tensor z, out Tensor a)
 
         /// <inheritdoc/>
         public override INetworkLayer Clone() => new CuDnnPoolingLayer(InputInfo, OperationInfo, ActivationFunctionType);
+
+        /// <summary>
+        /// Tries to deserialize a new <see cref="CuDnnPoolingLayer"/> from the input <see cref="System.IO.Stream"/>
+        /// </summary>
+        /// <param name="stream">The input <see cref="System.IO.Stream"/> to use to read the layer data</param>
+        [MustUseReturnValue, CanBeNull]
+        public new static INetworkLayer Deserialize([NotNull] System.IO.Stream stream)
+        {
+            if (!stream.TryRead(out TensorInfo input)) return null;
+            if (!stream.TryRead(out TensorInfo _)) return null;
+            if (!stream.TryRead(out ActivationFunctionType activation)) return null;
+            if (!stream.TryRead(out PoolingInfo operation)) return null;
+            return new CuDnnPoolingLayer(input, operation, activation);
+        }
     }
 }

NeuralNetwork.NET.Cuda/Layers/CuDnnSoftmaxLayer.cs

Lines changed: 24 additions & 2 deletions
@@ -1,11 +1,15 @@
 using Alea;
 using Alea.cuDNN;
 using JetBrains.Annotations;
+using NeuralNetworkNET.Extensions;
 using NeuralNetworkNET.Cuda.Services;
 using NeuralNetworkNET.Cuda.Extensions;
 using NeuralNetworkNET.Networks.Implementations.Layers;
 using NeuralNetworkNET.APIs.Structs;
 using NeuralNetworkNET.APIs.Enums;
+using NeuralNetworkNET.APIs.Interfaces;
+using NeuralNetworkNET.Networks.Activations;
+using NeuralNetworkNET.Networks.Cost;
 
 namespace NeuralNetworkNET.Cuda.Layers
 {

@@ -30,7 +34,7 @@ internal sealed class CuDnnSoftmaxLayer : SoftmaxLayer
 
         public CuDnnSoftmaxLayer(in TensorInfo input, int outputs, WeightsInitializationMode weightsMode, BiasInitializationMode biasMode) : base(input, outputs, weightsMode, biasMode) { }
 
-        public CuDnnSoftmaxLayer([NotNull] float[,] weights, [NotNull] float[] biases) : base(weights, biases) { }
+        public CuDnnSoftmaxLayer(in TensorInfo input, int outputs, [NotNull] float[] weights, [NotNull] float[] biases) : base(input, outputs, weights, biases) { }
 
         /// <inheritdoc/>
         public override unsafe void Forward(in Tensor x, out Tensor z, out Tensor a)

@@ -40,7 +44,7 @@ public override unsafe void Forward(in Tensor x, out Tensor z, out Tensor a)
             // Linear pass
             fixed (float* pw = Weights)
             {
-                Tensor.Fix(pw, InputInfo.Size, OutputInfo.Size, out Tensor wTensor);
+                Tensor.Reshape(pw, InputInfo.Size, OutputInfo.Size, out Tensor wTensor);
                 using (DeviceMemory<float>
                     x_gpu = DnnInstance.Gpu.AllocateDevice(x),
                     w_gpu = DnnInstance.Gpu.AllocateDevice(wTensor),

@@ -60,5 +64,23 @@ public override unsafe void Forward(in Tensor x, out Tensor z, out Tensor a)
                 }
             }
         }
+
+        /// <summary>
+        /// Tries to deserialize a new <see cref="CuDnnSoftmaxLayer"/> from the input <see cref="System.IO.Stream"/>
+        /// </summary>
+        /// <param name="stream">The input <see cref="System.IO.Stream"/> to use to read the layer data</param>
+        [MustUseReturnValue, CanBeNull]
+        public new static INetworkLayer Deserialize([NotNull] System.IO.Stream stream)
+        {
+            if (!stream.TryRead(out TensorInfo input)) return null;
+            if (!stream.TryRead(out TensorInfo output)) return null;
+            if (!stream.TryRead(out ActivationFunctionType activation) || activation != ActivationFunctionType.Softmax) return null;
+            if (!stream.TryRead(out int wLength)) return null;
+            float[] weights = stream.ReadUnshuffled(wLength);
+            if (!stream.TryRead(out int bLength)) return null;
+            float[] biases = stream.ReadUnshuffled(bLength);
+            if (!stream.TryRead(out CostFunctionType cost) || cost != CostFunctionType.LogLikelyhood) return null;
+            return new CuDnnSoftmaxLayer(input, output.Size, weights, biases);
+        }
     }
 }
Lines changed: 15 additions & 0 deletions (new file)

@@ -0,0 +1,15 @@
+using System.IO;
+using JetBrains.Annotations;
+using NeuralNetworkNET.APIs.Enums;
+using NeuralNetworkNET.APIs.Interfaces;
+
+namespace NeuralNetworkNET.APIs.Delegates
+{
+    /// <summary>
+    /// A <see cref="delegate"/> that tries to deserialize a network layer from the input <see cref="Stream"/>, assuming the layer is of the given <see cref="LayerType"/>
+    /// </summary>
+    /// <param name="stream">The source <see cref="Stream"/> to load data from. If the layer type is not supported, the <see cref="Stream"/> should not be read at all</param>
+    /// <param name="type">The type of network layer to deserialize from the <see cref="Stream"/></param>
+    [CanBeNull]
+    public delegate INetworkLayer LayerDeserializer([NotNull] Stream stream, LayerType type);
+}
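
Any method matching this signature can act as a layer deserializer; per the XML docs above, the contract is to handle only the recognized layer types and to return null without reading the stream for everything else, so another loader can take over. A sketch of a custom implementation follows; MyFullyConnectedLayer is a hypothetical user-defined INetworkLayer, not a type in this repository.

using System.IO;
using NeuralNetworkNET.APIs.Delegates;
using NeuralNetworkNET.APIs.Enums;
using NeuralNetworkNET.APIs.Interfaces;

public static class CustomLayerDeserializers
{
    public static LayerDeserializer Example { get; } = (Stream stream, LayerType type) =>
    {
        switch (type)
        {
            case LayerType.FullyConnected:
                // MyFullyConnectedLayer is a placeholder for a user-defined layer type
                return MyFullyConnectedLayer.Deserialize(stream);
            default:
                // Unsupported type: decline without touching the stream
                return null;
        }
    };
}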

NeuralNetwork.NET/APIs/Enums/LayerType.cs

Lines changed: 1 addition & 1 deletion
@@ -1,4 +1,4 @@
-namespace NeuralNetworkNET.APIs.Misc
+namespace NeuralNetworkNET.APIs.Enums
 {
     /// <summary>
     /// Indicates the type of a neural network layer (for serialization purposes only)

NeuralNetwork.NET/APIs/Enums/TrainingStopReason.cs

Lines changed: 1 addition & 1 deletion
@@ -1,4 +1,4 @@
-namespace NeuralNetworkNET.APIs.Misc
+namespace NeuralNetworkNET.APIs.Enums
 {
     /// <summary>
     /// Indicates the reason why a network training session has stopped

NeuralNetwork.NET/APIs/Interfaces/INetworkLayer.cs

Lines changed: 3 additions & 3 deletions
@@ -1,4 +1,4 @@
-using NeuralNetworkNET.APIs.Misc;
+using NeuralNetworkNET.APIs.Enums;
 using NeuralNetworkNET.APIs.Structs;
 using System;
 

@@ -17,11 +17,11 @@ public interface INetworkLayer : IEquatable<INetworkLayer>, IClonable<INetworkLa
         /// <summary>
         /// Gets the info on the layer inputs
         /// </summary>
-        TensorInfo InputInfo { get; }
+        ref readonly TensorInfo InputInfo { get; }
 
         /// <summary>
        /// Gets the info on the layer outputs
         /// </summary>
-        TensorInfo OutputInfo { get; }
+        ref readonly TensorInfo OutputInfo { get; }
     }
 }
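
Switching these properties to ref readonly returns lets callers read the TensorInfo structs without taking a copy: binding with ref readonly keeps that benefit, while an ordinary assignment still compiles and simply copies the value. A small illustration, assuming any INetworkLayer instance:

using NeuralNetworkNET.APIs.Interfaces;
using NeuralNetworkNET.APIs.Structs;

static class RefReadonlyUsage
{
    static int InputSize(INetworkLayer layer)
    {
        // Bind to the returned reference: no struct copy is made
        ref readonly TensorInfo input = ref layer.InputInfo;
        return input.Size;
    }
}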

NeuralNetwork.NET/APIs/Interfaces/INeuralNetwork.cs

Lines changed: 1 addition & 1 deletion
@@ -98,7 +98,7 @@ public interface INeuralNetwork : IEquatable<INeuralNetwork>, IClonable<INeuralN
         /// <summary>
         /// Saves the network to the target file
         /// </summary>
-        /// <param name="FileInfo">The <see cref="FileInfo"/> instance for the target file (it may not exist yet)</param>
+        /// <param name="target">The <see cref="FileInfo"/> instance for the target file (it may not exist yet)</param>
         void Save([NotNull] FileInfo target);
 
         /// <summary>
