Documentation: clarify comments in matrix.c, neuralnet_impl.h, and train.c.

author: 3gg <3gg@shellblade.net> 2023-11-23 10:02:33 -0800
committer: 3gg <3gg@shellblade.net> 2023-11-23 10:02:33 -0800
commit: 3df7b6fb0c65295eed4590e6f166d60e89b3c68e (patch)
tree: 51c53d0b55e4fdff0facc5c4624b1102a40a13f0
parent: 6ca8a31143f087f3bc470d39eb3c00156443802a (diff)
3 files changed, 11 insertions, 8 deletions
diff --git a/src/lib/src/matrix.c b/src/lib/src/matrix.c
index 174504f..d98c8bb 100644
--- a/src/lib/src/matrix.c
+++ b/src/lib/src/matrix.c
@@ -6,7 +6,7 @@
 nnMatrix nnMatrixMake(int rows, int cols) {
  R* values = calloc(rows * cols, sizeof(R));
-  assert(values != 0);
+  assert(values != 0); // TODO: Make it a hard assert.
  return (nnMatrix){
      .rows   = rows,
diff --git a/src/lib/src/neuralnet_impl.h b/src/lib/src/neuralnet_impl.h
index 18694f4..f5a9c63 100644
--- a/src/lib/src/neuralnet_impl.h
+++ b/src/lib/src/neuralnet_impl.h
@@ -30,7 +30,7 @@ typedef struct nnNeuralNetwork {
 /// |network_outputs| points to the last output matrix in |layer_outputs| for
 /// convenience.
 typedef struct nnQueryObject {
-  int       num_layers;
+  int       num_layers;      // Same as nnNeuralNetwork::num_layers.
  nnMatrix* layer_outputs;   // Output matrices, one output per layer.
  nnMatrix* network_outputs; // Points to the last output matrix.
 } nnTrainingQueryObject;
diff --git a/src/lib/src/train.c b/src/lib/src/train.c
index 9244907..dc93f0f 100644
--- a/src/lib/src/train.c
+++ b/src/lib/src/train.c
@@ -219,13 +219,15 @@ void nnTrain(
      // Assuming one training input per iteration for now.
      nnMatrixTranspose(&training_inputs, &training_inputs_T);
-      // Run a forward pass and compute the output layer error.
+      // Run a forward pass and compute the output layer error relevant to the
-      // We don't square the error here; instead, we just compute t-o, which is
+      // derivative: o-t.
-      // part of the derivative, -2(t-o). Also, we compute o-t instead to
+      //   Error: (t-o)^2
-      // remove that outer negative sign.
+      //   dE/do = -2(t-o)
+      //         = +2(o-t)
+      // Note that we compute o-t instead to remove that outer negative sign.
+      // The 2 is dropped because we are only interested in the direction of the
+      // gradient. The learning rate controls the magnitude.
      nnQuery(net, query, &training_inputs);
-      // nnMatrixSub(&training_targets, training_outputs,
-      // &errors[net->num_layers - 1]);
      nnMatrixSub(
          training_outputs, &training_targets, &errors[net->num_layers - 1]);
@@ -328,6 +330,7 @@ void nnTrain(
        params->max_iterations, ComputeMSE(&errors[net->num_layers - 1]));
  }
+  // Clean up.
  for (int l = 0; l < net->num_layers; ++l) {
    nnMatrixDel(&errors[l]);
    nnMatrixDel(&outputs_T[l]);
author	3gg <3gg@shellblade.net>	2023-11-23 10:02:33 -0800
committer	3gg <3gg@shellblade.net>	2023-11-23 10:02:33 -0800
commit	3df7b6fb0c65295eed4590e6f166d60e89b3c68e (patch)
tree	51c53d0b55e4fdff0facc5c4624b1102a40a13f0
parent	6ca8a31143f087f3bc470d39eb3c00156443802a (diff)