Added layer backpropagation

This commit is contained in:
LeLeLeLeto 2024-12-31 17:21:57 +01:00
parent 9a1810775b
commit fb49c794b2

33
layer.h

@@ -15,12 +15,20 @@ class Layer {
Matrix activated_output;
Matrix biases;
// Planning for back propagation
// Each layer needs the derivative of Z with respect to W, the derivative of A with respect to Z, and the derivative of the loss with respect to A
// Let's call them dzw, daz and dca
Matrix daz;
static inline float Sigmoid(float);
static inline float SigmoidPrime(float);
inline void Forward(); // Forward Pass with sigmoid
inline void Forward(float (*activation)(float)); // Forward Pass with custom activation function
inline void BackPropagate(Matrix);
inline void BackPropagate(Matrix, Matrix, float (*activation)(float)); // To backpropagate, we need dzw, the derivative of the loss with respect to A, and the derivative of the activation function used
inline void Feed(Matrix);
// Constructors
@@ -29,6 +37,31 @@ class Layer {
Layer();
};
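The three derivatives named in the comments above are the factors of the chain rule for this layer's weights. A minimal worked form, assuming the forward pass computes Z = W x + b and A = sigma(Z) (so dzw is the layer input and daz is the activation derivative):

\frac{\partial C}{\partial w_{ij}}
  = \underbrace{\frac{\partial C}{\partial a_i}}_{\text{dca}_i}
    \cdot \underbrace{\sigma'(z_i)}_{\text{daz}_i}
    \cdot \underbrace{x_j}_{\text{dzw}_j}
\qquad\Longleftrightarrow\qquad
\frac{\partial C}{\partial W} = (\text{dca} \odot \text{daz})\, x^{\top}

The Transpose, ExtendDown and ExtendRight calls in the implementation below build exactly this outer product out of element-wise (Hadamard) multiplications.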
void Layer::BackPropagate(Matrix dzw, Matrix dca, float (*derivative)(float)){
// Calculate daz: the derivative of the activation function, evaluated on the activated output
this->daz = this->activated_output.Function(derivative);
// this->daz.Print("daz");
// We need to transpose dzw and extend it down to match dca's size
// dzw.Print("dzw");
dzw = dzw.Transpose().ExtendDown(dca.values.size());
// dzw.Print("dzw extended transposed");
Matrix dcw = this->daz.Hadamard(&dca).ExtendRight(this->input.values.size());
// dcw.Print("daz . dca");
dcw = dcw.Hadamard(&dzw);
// dcw.Print("daz . dca . dzw : DCW");
// this->weights.Print("weights");
// Apply dcw to weights
float learning_rate = 0.1F;
Matrix reduced_dcw = dcw.Multiply(learning_rate);
// We SUBTRACT the derivative of the loss with respect to the weights.
this->weights = this->weights.Substract(&reduced_dcw);
// this->weights.Print("New weights");
}
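For reference, a self-contained sketch of the same per-weight update written with plain loops and hypothetical sizes and values (independent of the repository's Matrix class), showing that the transposes, extensions and Hadamard products above reduce to dca_i * daz_i * x_j followed by a gradient-descent step:

#include <cstdio>
#include <vector>

int main() {
    // Hypothetical layer: 2 outputs, 3 inputs (values chosen only for illustration)
    std::vector<float> x   = {0.5f, -1.0f, 2.0f};   // layer input  -> dzw
    std::vector<float> a   = {0.7f, 0.3f};          // activated outputs A = sigmoid(Z)
    std::vector<float> dca = {0.2f, -0.4f};         // dC/dA coming from the loss (or the next layer)
    std::vector<std::vector<float>> w = {{0.1f, 0.2f, 0.3f},
                                         {0.4f, 0.5f, 0.6f}};
    const float learning_rate = 0.1f;

    for (std::size_t i = 0; i < w.size(); ++i) {
        const float daz = a[i] * (1.0f - a[i]);      // sigmoid'(z) expressed through a = sigmoid(z)
        for (std::size_t j = 0; j < w[i].size(); ++j) {
            const float dcw = dca[i] * daz * x[j];   // chain rule: dC/dA * dA/dZ * dZ/dW
            w[i][j] -= learning_rate * dcw;          // subtract the scaled gradient (the Substract call)
        }
    }

    for (std::size_t i = 0; i < w.size(); ++i)
        for (std::size_t j = 0; j < w[i].size(); ++j)
            std::printf("w[%zu][%zu] = %f\n", i, j, w[i][j]);
    return 0;
}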
Layer::Layer(){
}