iRprop+ implementation

2016-11-01 21:38:56 +01:00
parent 913a5cc41f
commit 173cfc9789
2 changed files with 116 additions and 0 deletions

View File: NeuralNetwork/Learning/iRPropPlus.h

@@ -0,0 +1,64 @@
#pragma once

#include "BatchPropagation.h"

#include <algorithm>
#include <cstddef>
#include <memory>
#include <vector>

namespace NeuralNetwork {
namespace Learning {

/** @class iRPropPlus
 *  @brief Resilient propagation with weight backtracking (iRprop+).
 */
class iRPropPlus : public BatchPropagation {
public:
    iRPropPlus(FeedForward::Network &feedForwardNetwork, std::shared_ptr<CorrectionFunction::CorrectionFunction> correction = std::make_shared<CorrectionFunction::Linear>()) :
        BatchPropagation(feedForwardNetwork, correction) {
    }

    iRPropPlus(const iRPropPlus&) = delete;
    iRPropPlus& operator=(const iRPropPlus&) = delete;

    void setInitialWeightChange(float initVal) {
        initialWeightChange = initVal;
    }

    /// iRprop+ derives its step sizes from the gradient signs alone, so the
    /// learning coefficient of the base interface is intentionally ignored.
    void setLearningCoefficient(float) {
    }

protected:
    virtual inline void resize() override {
        BatchPropagation::resize();

        // Mirror the gradient structure for the per-weight state kept between batches.
        _lastGradients = _gradients;

        // Per-weight step sizes, initialised to the configured starting value.
        _changesOfWeightChanges = _lastGradients;
        for (std::size_t i = 1; i < _network.size(); i++) {
            for (std::size_t j = 0; j < _changesOfWeightChanges[i].size(); j++) {
                std::fill(_changesOfWeightChanges[i][j].begin(), _changesOfWeightChanges[i][j].end(), initialWeightChange);
            }
        }

        // Last applied weight changes, needed for the backtracking step.
        _lastWeightChanges = _lastGradients;
        for (std::size_t i = 1; i < _network.size(); i++) {
            for (std::size_t j = 0; j < _lastWeightChanges[i].size(); j++) {
                std::fill(_lastWeightChanges[i][j].begin(), _lastWeightChanges[i][j].end(), 0.1f);
            }
        }
    }

    void updateWeightsAndEndBatch() override;

    std::vector<std::vector<std::vector<float>>> _lastGradients = {};
    std::vector<std::vector<std::vector<float>>> _lastWeightChanges = {};
    std::vector<std::vector<std::vector<float>>> _changesOfWeightChanges = {};

    float _prevError = 0;
    float maxChangeOfWeights = 5;
    float minChangeOfWeights = 0.0001;
    float initialWeightChange = 0.02;
    float weightChangePlus = 1.2;
    float weightChangeMinus = 0.5;
};

}
}
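
As an aside, the constants above (1.2, 0.5, 5, 0.0001, 0.02) drive the per-weight step-size adaptation that the update routine in the second file applies. A minimal self-contained sketch of just that adaptation, with illustrative names that are not part of the class:

#include <algorithm>
#include <iostream>

// Illustrative helper mirroring the step-size adaptation used by iRPropPlus:
// grow the step while the gradient keeps its sign, shrink it on a sign flip.
float adaptStepSize(float step, float gradient, float lastGradient) {
    const float plus = 1.2f, minus = 0.5f, maxStep = 5.0f, minStep = 0.0001f;
    if (gradient * lastGradient > 0)
        return std::min(step * plus, maxStep);
    if (gradient * lastGradient < 0)
        return std::max(step * minus, minStep);
    return step; // one of the gradients is zero: keep the step unchanged
}

int main() {
    float step = 0.02f;                       // same starting value as initialWeightChange
    step = adaptStepSize(step, -0.3f, -0.1f); // stable sign -> 0.024
    step = adaptStepSize(step, 0.2f, -0.3f);  // sign flip   -> 0.012
    std::cout << step << "\n";
    return 0;
}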

View File

@@ -0,0 +1,52 @@
#include <NeuralNetwork/Learning/iRPropPlus.h>

#include <algorithm>
#include <cmath>
#include <cstddef>

void NeuralNetwork::Learning::iRPropPlus::updateWeightsAndEndBatch() {
    // Average the output-layer slopes into the batch error used for backtracking.
    float error = 0.0f;
    const auto &outputLayer = _network[_network.size() - 1];
    for (std::size_t j = 1; j < outputLayer.size(); j++) {
        error += _slopes[_network.size() - 1][j];
    }
    error /= outputLayer.size();

    for (std::size_t layerIndex = 1; layerIndex < _network.size(); layerIndex++) {
        auto &layer = _network[layerIndex];
        auto &prevLayer = _network[layerIndex - 1];
        std::size_t prevLayerSize = prevLayer.size();
        std::size_t layerSize = layer.size();

        for (std::size_t j = 1; j < layerSize; j++) {
            for (std::size_t k = 0; k < prevLayerSize; k++) {
                float gradient = _gradients[layerIndex][j][k];
                float lastGradient = _lastGradients[layerIndex][j][k];
                _lastGradients[layerIndex][j][k] = gradient;

                float weightChangeDelta = _changesOfWeightChanges[layerIndex][j][k];
                float delta;

                if (gradient * lastGradient > 0) {
                    // Gradient kept its sign: enlarge the step size and apply the step.
                    weightChangeDelta = std::min(weightChangeDelta * weightChangePlus, maxChangeOfWeights);
                    delta = (std::signbit(gradient) ? 1.0f : -1.0f) * weightChangeDelta;
                    layer[j].weight(k) -= delta;
                } else if (gradient * lastGradient < 0) {
                    // Sign flip: shrink the step size and, if the batch error grew, revert the previous step.
                    weightChangeDelta = std::max(weightChangeDelta * weightChangeMinus, minChangeOfWeights);
                    delta = _lastWeightChanges[layerIndex][j][k];
                    if (error > _prevError) {
                        layer[j].weight(k) += delta;
                    }
                    // Zero the stored gradient so the next batch takes the neutral branch.
                    _lastGradients[layerIndex][j][k] = 0;
                } else {
                    // One of the gradients is zero: apply the step with an unchanged step size.
                    delta = (std::signbit(gradient) ? 1.0f : -1.0f) * weightChangeDelta;
                    layer[j].weight(k) -= delta;
                }

                _changesOfWeightChanges[layerIndex][j][k] = weightChangeDelta;
                _lastWeightChanges[layerIndex][j][k] = delta;
            }
        }
    }

    _prevError = error;
}
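
For reference, the same three-branch rule can be exercised in isolation. The sketch below minimizes f(w) = (w - 3)^2 for a single weight; it illustrates iRprop+ with backtracking and is not part of the library. It uses the textbook sign convention (step against the derivative), whereas the sign handling of _gradients above is specific to this code base.

#include <algorithm>
#include <iostream>

// Standalone iRprop+ on a single weight, minimizing f(w) = (w - 3)^2.
// Step against the derivative; revert the last step when the derivative
// changes sign and the error grew (the backtracking part of iRprop+).
int main() {
    float w = 0.0f, step = 0.02f, lastGrad = 0.0f, lastDelta = 0.0f, prevError = 1e30f;
    const float plus = 1.2f, minus = 0.5f, maxStep = 5.0f, minStep = 0.0001f;

    for (int it = 0; it < 200; ++it) {
        float error = (w - 3.0f) * (w - 3.0f);
        float grad = 2.0f * (w - 3.0f);      // df/dw
        float delta = 0.0f;

        if (grad * lastGrad > 0) {           // stable sign: grow step, move against the gradient
            step = std::min(step * plus, maxStep);
            delta = (grad > 0 ? -1.0f : 1.0f) * step;
            w += delta;
        } else if (grad * lastGrad < 0) {    // sign flip: shrink step, maybe revert the last move
            step = std::max(step * minus, minStep);
            if (error > prevError) w -= lastDelta;
            delta = 0.0f;
            grad = 0.0f;                     // forces the neutral branch next iteration
        } else {                             // neutral branch (first iteration or after a flip)
            delta = (grad > 0 ? -1.0f : (grad < 0 ? 1.0f : 0.0f)) * step;
            w += delta;
        }

        lastGrad = grad;
        lastDelta = delta;
        prevError = error;
    }

    std::cout << "w converged near " << w << "\n"; // expected: close to 3
    return 0;
}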