@@ -40,6 +40,7 @@ import (
 // Resources:
 // http://neuralnetworksanddeeplearning.com
 // https://www.youtube.com/watch?v=fNk_zzaMoSs
+// http://www.inf.fu-berlin.de/lehre/WS06/Musterererkennung/Paper/rprop.pdf
 //
 // Matrix: A
 // Description: A is set of calculated neuron activations after sigmoid correction
@@ -94,18 +95,19 @@ import (
 // s' = Sizes[l-1] - Previous neural network layer size
 // L = len(Sizes) - Number of neural network layers
 
-type BackProp struct {
+type NeuralNetwork struct {
 	Count          int
 	Sizes          []int
 	Biases         []*mat.Dense
 	Weights        []*mat.Dense
 	A              []*mat.Dense
 	Z              []*mat.Dense
-	alpha          float64
+	WGradient      []Gradient
+	BGradient      []Gradient
 	trainingCycles int
 }
 
-func NewBackProp(sizes []int, nu float64, trainingCycles int) (nn *BackProp, err error) {
+func NewNeuralNetwork(sizes []int, nu float64, trainingCycles int) (nn *NeuralNetwork, err error) {
 	err = nil
 	if len(sizes) < 3 {
 		fmt.Printf("Invalid network configuration: %v\n", sizes)
@@ -133,42 +135,48 @@ func NewBackProp(sizes []int, nu float64, trainingCycles int) (nn *BackProp, err
 		fmt.Println("Training cycles number probably is too small")
 	}
 
-	nn = &BackProp{}
+	nn = &NeuralNetwork{}
 	nn.Sizes = sizes
 	nn.Count = len(sizes)
 	nn.Weights = make([]*mat.Dense, nn.Count)
 	nn.Biases = make([]*mat.Dense, nn.Count)
+	nn.WGradient = make([]Gradient, nn.Count)
+	nn.BGradient = make([]Gradient, nn.Count)
+
 	nn.A = make([]*mat.Dense, nn.Count)
 	nn.Z = make([]*mat.Dense, nn.Count)
-	nn.alpha = nu / float64(nn.Sizes[0])
 	nn.trainingCycles = trainingCycles
 
+	alpha := nu / float64(nn.Sizes[0])
 	for i := 1; i < nn.Count; i++ {
 		nn.Weights[i] = generateRandomDense(nn.Sizes[i], nn.Sizes[i-1])
 		nn.Biases[i] = generateRandomDense(nn.Sizes[i], 1)
+		nn.WGradient[i] = &BackPropGradient{alpha}
+		nn.BGradient[i] = &BackPropGradient{alpha}
+		// nn.WGradient[i] = NewRPropGradient(nn.Sizes[i], nn.Sizes[i-1])
+		// nn.BGradient[i] = NewRPropGradient(nn.Sizes[i], 1)
 	}
 	return
 }
 
-func (nn *BackProp) Copy() (out *BackProp) {
-	out = &BackProp{}
+func (nn *NeuralNetwork) Copy() (out *NeuralNetwork) {
+	out = &NeuralNetwork{}
 	out.Sizes = nn.Sizes
 	out.Count = nn.Count
 	out.Weights = make([]*mat.Dense, nn.Count)
 	out.Biases = make([]*mat.Dense, nn.Count)
 	out.A = make([]*mat.Dense, nn.Count)
 	out.Z = make([]*mat.Dense, nn.Count)
-	out.alpha = nn.alpha
 	out.trainingCycles = nn.trainingCycles
 
 	for i := 1; i < out.Count; i++ {
-		nn.Weights[i] = mat.DenseCopyOf(out.Weights[i])
-		nn.Biases[i] = mat.DenseCopyOf(out.Biases[i])
+		out.Weights[i] = mat.DenseCopyOf(nn.Weights[i])
+		out.Biases[i] = mat.DenseCopyOf(nn.Biases[i])
 	}
 	return
 }
 
-func (nn *BackProp) Predict(aIn mat.Matrix) (maxIndex int, max float64) {
+func (nn *NeuralNetwork) Predict(aIn mat.Matrix) (maxIndex int, max float64) {
 	r, _ := aIn.Dims()
 	if r != nn.Sizes[0] {
 		fmt.Printf("Invalid rows number of input matrix size: %v\n", r)
@@ -189,7 +197,7 @@ func (nn *BackProp) Predict(aIn mat.Matrix) (maxIndex int, max float64) {
 	return
 }
 
-func (nn *BackProp) Teach(teacher teach.Teacher) {
+func (nn *NeuralNetwork) Teach(teacher teach.Teacher) {
 	for i := 0; i < nn.trainingCycles; i++ {
 		for teacher.NextData() {
 			nn.backward(teacher.GetData())
@@ -197,7 +205,7 @@ func (nn *BackProp) Teach(teacher teach.Teacher) {
 	}
 }
 
-func (nn *BackProp) SaveState(writer io.Writer) {
+func (nn *NeuralNetwork) SaveState(writer io.Writer) {
 	//save input array count
 	bufferSize := make([]byte, 4)
 	binary.LittleEndian.PutUint32(bufferSize[0:], uint32(nn.Count))
@@ -229,7 +237,7 @@ func (nn *BackProp) SaveState(writer io.Writer) {
 	}
 }
 
-func (nn *BackProp) LoadState(reader io.Reader) {
-	// Reade count
+func (nn *NeuralNetwork) LoadState(reader io.Reader) {
+	// Read count
 	nn.Count = readInt(reader)
 
@@ -265,7 +273,7 @@ func (nn *BackProp) LoadState(reader io.Reader) {
 	// fmt.Printf("\nLoadState end\n")
 }
 
-func (nn *BackProp) forward(aIn mat.Matrix) {
+func (nn *NeuralNetwork) forward(aIn mat.Matrix) {
 	nn.A[0] = mat.DenseCopyOf(aIn)
 
 	for i := 1; i < nn.Count; i++ {
@@ -290,15 +298,15 @@ func (nn *BackProp) forward(aIn mat.Matrix) {
 	}
 }
 
-func (nn *BackProp) backward(aIn, aOut mat.Matrix) {
+func (nn *NeuralNetwork) backward(aIn, aOut mat.Matrix) {
 	nn.forward(aIn)
 
 	lastLayerNum := nn.Count - 1
 
 	// To calculate new values of weights and biases
 	// following formulas are used:
-	// W[l] = A[l−1]*δ[l]
-	// B[l] = δ[l]
+	// ∂E/∂W[l] = A[l−1]*δ[l]
+	// ∂E/∂B[l] = δ[l]
 
 	// For last layer δ value is calculated by following:
 	// δ = (A[L]−y)⊙σ'(Z[L])
@@ -317,23 +325,31 @@ func (nn *BackProp) backward(aIn, aOut mat.Matrix) {
 	delta := &mat.Dense{}
 	delta.MulElem(err, sigmoidsPrime)
 
-	// B[L] = δ[L]
+	// ∂E/∂B[L] = δ[L]
 	biases := mat.DenseCopyOf(delta)
 
-	// W[L] = A[L−1]*δ[L]
+	// ∂E/∂W[L] = A[L−1]*δ[L]
 	weights := &mat.Dense{}
 	weights.Mul(delta, nn.A[lastLayerNum-1].T())
 
-	// Initialize new weights and biases values with last layer values
-	newBiases := []*mat.Dense{makeBackGradient(biases, nn.Biases[lastLayerNum], nn.alpha)}
-	newWeights := []*mat.Dense{makeBackGradient(weights, nn.Weights[lastLayerNum], nn.alpha)}
+	// fmt.Printf("Prev biases[%v]:\n%v\n\n", lastLayerNum, mat.Formatted(nn.Biases[lastLayerNum], mat.Prefix(""), mat.Excerpt(0)))
+	// fmt.Printf("Prev weights[%v]:\n%v\n\n", lastLayerNum, mat.Formatted(nn.Weights[lastLayerNum], mat.Prefix(""), mat.Excerpt(0)))
 
-	// Save calculated delta value temporary error variable
-	err = delta
+	// fmt.Printf("Expect[%v]:\n%v\n\n", lastLayerNum, mat.Formatted(aOut, mat.Prefix(""), mat.Excerpt(0)))
+	// fmt.Printf("Result[%v]:\n%v\n\n", lastLayerNum, mat.Formatted(nn.result(), mat.Prefix(""), mat.Excerpt(0)))
+	// fmt.Printf("nn.Z[%v]:\n%v\n\n", lastLayerNum, mat.Formatted(nn.Z[lastLayerNum], mat.Prefix(""), mat.Excerpt(0)))
+	// fmt.Printf("sigmoidsPrime[%v]:\n%v\n\n", lastLayerNum, mat.Formatted(sigmoidsPrime, mat.Prefix(""), mat.Excerpt(0)))
+	// fmt.Printf("Err[%v]:\n%v\n\n", lastLayerNum, mat.Formatted(err, mat.Prefix(""), mat.Excerpt(0)))
+	// fmt.Printf("Biases gradient[%v]:\n%v\n\n", lastLayerNum, mat.Formatted(biases, mat.Prefix(""), mat.Excerpt(0)))
+	// fmt.Printf("Weights gradient[%v]:\n%v\n\n", lastLayerNum, mat.Formatted(weights, mat.Prefix(""), mat.Excerpt(0)))
+
+	// Initialize new weights and biases values with last layer values
+	newBiases := []*mat.Dense{nn.BGradient[lastLayerNum].ApplyDelta(nn.Biases[lastLayerNum], biases)}
+	newWeights := []*mat.Dense{nn.WGradient[lastLayerNum].ApplyDelta(nn.Weights[lastLayerNum], weights)}
 
 	// Next layer Weights and Biases are calculated using same formulas:
-	// W[l] = A[l−1]*δ[l]
-	// B[l] = δ[l]
+	// ∂E/∂W[l] = A[l−1]*δ[l]
+	// ∂E/∂B[l] = δ[l]
 
 	// But δ[l] is calculated using different formula:
 	// δ[l] = ((Wt[l+1])*δ[l+1])⊙σ'(Z[l])
@@ -346,19 +362,18 @@ func (nn *BackProp) backward(aIn, aOut mat.Matrix) {
 
 		// (Wt[l+1])*δ[l+1]
-		// err bellow is delta from previous step(l+1)
-		delta := &mat.Dense{}
+		// delta below is δ from the previous step (l+1)
 		wdelta := &mat.Dense{}
-		wdelta.Mul(nn.Weights[l+1].T(), err)
+		wdelta.Mul(nn.Weights[l+1].T(), delta)
 
-		// Calculate new delta and store it to temporary variable err
+		// Calculate new delta
 		// δ[l] = ((Wt[l+1])*δ[l+1])⊙σ'(Z[l])
+		delta = &mat.Dense{}
 		delta.MulElem(wdelta, sigmoidsPrime)
-		err = delta
 
-		// B[l] = δ[l]
+		// ∂E/∂B[l] = δ[l]
 		biases := mat.DenseCopyOf(delta)
 
-		// W[l] = A[l−1]*δ[l]
+		// ∂E/∂W[l] = A[l−1]*δ[l]
 		// At this point it's required to give explanation for inaccuracy
 		// in the formula
 
@@ -391,9 +406,12 @@ func (nn *BackProp) backward(aIn, aOut mat.Matrix) {
 		weights := &mat.Dense{}
 		weights.Mul(delta, nn.A[l-1].T())
 
+		// fmt.Printf("Weights gradient[%v]:\n%v\n\n", l, mat.Formatted(weights, mat.Prefix(""), mat.Excerpt(0)))
+		// fmt.Printf("Biases gradient[%v]:\n%v\n\n", l, mat.Formatted(biases, mat.Prefix(""), mat.Excerpt(0)))
+
 		// !Prepend! new Biases and Weights
-		newBiases = append([]*mat.Dense{makeBackGradient(biases, nn.Biases[l], nn.alpha)}, newBiases...)
-		newWeights = append([]*mat.Dense{makeBackGradient(weights, nn.Weights[l], nn.alpha)}, newWeights...)
+		newBiases = append([]*mat.Dense{nn.BGradient[l].ApplyDelta(nn.Biases[l], biases)}, newBiases...)
+		newWeights = append([]*mat.Dense{nn.WGradient[l].ApplyDelta(nn.Weights[l], weights)}, newWeights...)
 	}
 
 	newBiases = append([]*mat.Dense{&mat.Dense{}}, newBiases...)
@@ -403,6 +421,6 @@ func (nn *BackProp) backward(aIn, aOut mat.Matrix) {
 	nn.Weights = newWeights
 }
 
-func (nn *BackProp) result() *mat.Dense {
+func (nn *NeuralNetwork) result() *mat.Dense {
 	return nn.A[nn.Count-1]
}
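
// The hunks above call nn.WGradient[i].ApplyDelta(...) and construct
// BackPropGradient values, but the Gradient interface itself lies outside
// this diff. Below is a minimal sketch of what the call sites imply it looks
// like: the interface name, method signature, field name, and package name
// are inferred from the diff, not copied from the repository.

package neuralnetwork // placeholder package name

import "gonum.org/v1/gonum/mat"

// Gradient turns a raw gradient matrix into an updated weights or biases
// matrix. Implementations decide how the gradient is applied (plain
// backpropagation, RProp, ...).
type Gradient interface {
	ApplyDelta(m mat.Matrix, gradient mat.Matrix) *mat.Dense
}

// BackPropGradient is plain gradient descent with a fixed learning rate:
// new = old − alpha*gradient. This matches the old makeBackGradient
// behavior the diff removes, assuming that helper scaled by nn.alpha.
type BackPropGradient struct {
	alpha float64
}

func (g *BackPropGradient) ApplyDelta(m mat.Matrix, gradient mat.Matrix) *mat.Dense {
	scaled := &mat.Dense{}
	result := &mat.Dense{}
	scaled.Scale(g.alpha, gradient) // scaled = alpha * gradient
	result.Sub(m, scaled)           // result = m - scaled
	return result
}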
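
// The commented-out NewRPropGradient(...) lines and the rprop.pdf link point
// at a resilient-propagation alternative. The following is only an
// illustrative sketch of classic RProp (Riedmiller & Braun) behind the same
// assumed interface; the repository's real implementation and constants may
// differ.

package neuralnetwork // placeholder package name

import (
	"math"

	"gonum.org/v1/gonum/mat"
)

// RPropGradient keeps a per-element step size and the previous gradient,
// and adapts each step from the sign of gradient(t)*gradient(t-1).
type RPropGradient struct {
	steps     *mat.Dense // per-element step sizes Δ
	prevGrads *mat.Dense // previous gradient, for sign comparison
}

func NewRPropGradient(r, c int) *RPropGradient {
	steps := mat.NewDense(r, c, nil)
	steps.Apply(func(_, _ int, _ float64) float64 { return 0.1 }, steps) // Δ0 = 0.1
	return &RPropGradient{steps: steps, prevGrads: mat.NewDense(r, c, nil)}
}

func (g *RPropGradient) ApplyDelta(m mat.Matrix, gradient mat.Matrix) *mat.Dense {
	const (
		etaPlus  = 1.2 // grow the step while the gradient keeps its sign
		etaMinus = 0.5 // shrink it after a sign change
		stepMax  = 50.0
		stepMin  = 1e-6
	)
	result := mat.DenseCopyOf(m)
	r, c := result.Dims()
	for i := 0; i < r; i++ {
		for j := 0; j < c; j++ {
			grad := gradient.At(i, j)
			step := g.steps.At(i, j)
			switch product := grad * g.prevGrads.At(i, j); {
			case product > 0:
				step = math.Min(step*etaPlus, stepMax)
			case product < 0:
				step = math.Max(step*etaMinus, stepMin)
				grad = 0 // classic RProp skips the update after a sign change
			}
			g.steps.Set(i, j, step)
			g.prevGrads.Set(i, j, grad)
			switch {
			case grad > 0:
				result.Set(i, j, result.At(i, j)-step)
			case grad < 0:
				result.Set(i, j, result.At(i, j)+step)
			}
		}
	}
	return result
}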
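
// A usage sketch for the renamed API. The layer sizes, learning rate, cycle
// count, and the teacher value are hypothetical; only the signatures come
// from the diff (teacher must implement teach.Teacher):
//
//	nn, err := NewNeuralNetwork([]int{784, 30, 10}, 0.1, 100)
//	if err != nil {
//		// handle invalid configuration
//	}
//	nn.Teach(teacher)               // runs trainingCycles passes over the data
//	index, max := nn.Predict(input) // input is a Sizes[0]x1 column vector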
|