Diffstat (limited to 'src/lib/src/train.c')
 src/lib/src/train.c | 28 +++-------------------------
 1 file changed, 3 insertions(+), 25 deletions(-)
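The change below drops the explicit transpose buffers that backpropagation used to maintain. For a layer whose input is the row vector $x \in \mathbb{R}^{1 \times n}$ and whose back-propagated gradient is the row vector $g \in \mathbb{R}^{1 \times m}$ (the diff allocates errors[l] as 1 x layer_output_size), the weight delta is the outer product

$$\Delta W = x^{\top} g, \qquad (\Delta W)_{ij} = x_i \, g_j, \qquad \Delta W \in \mathbb{R}^{n \times m}.$$

Forming $(\Delta W)_{ij} = x_i g_j$ directly from the two row vectors is equivalent to transposing $x$ into a column vector and calling a general matrix multiply, which is all the deleted training_inputs_T and outputs_T copies existed for; a sketch of such an outer-product routine follows the diff.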
diff --git a/src/lib/src/train.c b/src/lib/src/train.c
index ccff553..fe9f598 100644
--- a/src/lib/src/train.c
+++ b/src/lib/src/train.c
@@ -153,14 +153,9 @@ void nnTrain(
   nnGradientElements* gradient_elems =
       calloc(net->num_layers, sizeof(nnGradientElements));
 
-  // Allocate the output transpose vectors for weight delta calculation.
-  // This is one column vector per layer.
-  nnMatrix* outputs_T = calloc(net->num_layers, sizeof(nnMatrix));
-
   assert(errors != 0);
   assert(weight_deltas != 0);
   assert(gradient_elems);
-  assert(outputs_T);
 
   for (int l = 0; l < net->num_layers; ++l) {
     const int layer_input_size = nnLayerInputSize(net, l);
@@ -169,7 +164,6 @@ void nnTrain(
 
     errors[l] = nnMatrixMake(1, layer_output_size);
     weight_deltas[l] = nnMatrixMake(layer_input_size, layer_output_size);
-    outputs_T[l] = nnMatrixMake(layer_output_size, 1);
 
     // Allocate the gradient elements and vectors for weight delta calculation.
     nnGradientElements* elems = &gradient_elems[l];
@@ -199,9 +193,6 @@ void nnTrain(
   // the outputs.
   const nnMatrix* const training_outputs = query->network_outputs;
 
-  // A vector to store the training input transposed.
-  nnMatrix training_inputs_T = nnMatrixMake(inputs->cols, 1);
-
   // If debug mode is requested, we will show progress every Nth iteration.
   const int progress_frame =
       (params->max_iterations < PROGRESS_THRESHOLD)
@@ -223,10 +214,6 @@
       const nnMatrix training_targets =
          nnMatrixBorrowRows((nnMatrix*)targets, sample, 1);
 
-      // Will need the input transposed for backpropagation.
-      // Assuming one training input per iteration for now.
-      nnMatrixTranspose(&training_inputs, &training_inputs_T);
-
      // Forward pass.
      nnQuery(net, query, &training_inputs);
 
@@ -240,14 +227,11 @@
      nnMatrixSub(
          training_outputs, &training_targets, &errors[net->num_layers - 1]);
 
-      // Update outputs_T, which we need during weight updates.
-      for (int l = 0; l < net->num_layers; ++l) {
-        nnMatrixTranspose(&query->layer_outputs[l], &outputs_T[l]);
-      }
-
      // Update weights and biases for each internal layer, back-propagating
      // errors along the way.
      for (int l = net->num_layers - 1; l >= 0; --l) {
+        const nnMatrix* layer_input =
+            (l == 0) ? &training_inputs : &query->layer_outputs[l - 1];
        const nnMatrix* layer_output = &query->layer_outputs[l];
        nnGradientElements* elems = &gradient_elems[l];
        nnMatrix* gradient = &elems->gradient;
@@ -310,10 +294,7 @@
        nnMatrix* layer_biases = &linear->biases;
 
        // Outer product to compute the weight deltas.
-        // This layer's input is the previous layer's output.
-        const nnMatrix* input_T =
-            (l == 0) ? &training_inputs_T : &outputs_T[l - 1];
-        nnMatrixMul(input_T, gradient, &weight_deltas[l]);
+        nnMatrixMulOuter(layer_input, gradient, &weight_deltas[l]);
 
        // Update weights.
        nnMatrixScale(&weight_deltas[l], params->learning_rate);
@@ -360,7 +341,6 @@
   // Clean up.
   for (int l = 0; l < net->num_layers; ++l) {
     nnMatrixDel(&errors[l]);
-    nnMatrixDel(&outputs_T[l]);
     nnMatrixDel(&weight_deltas[l]);
 
     nnGradientElements* elems = &gradient_elems[l];
@@ -378,9 +358,7 @@
      break;
    }
  }
-  nnMatrixDel(&training_inputs_T);
  free(errors);
-  free(outputs_T);
  free(weight_deltas);
  free(gradient_elems);
 }
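For illustration, a minimal sketch of an outer-product routine matching the nnMatrixMulOuter call site above. Only the call's shape contract is taken from the diff; the nnMatrix definition here (rows, cols, row-major float storage) is an assumption made for the sketch, not the repository's actual type.

#include <assert.h>

// Hypothetical stand-in for the library's matrix type; the real definition
// lives elsewhere in src/lib and may differ (e.g. in element type).
typedef struct nnMatrix {
  int    rows;
  int    cols;
  float* values;  // Row-major: element (i, j) is values[i * cols + j].
} nnMatrix;

// Outer product of two row vectors: out[i][j] = left[0][i] * right[0][j].
// Equivalent to transposing `left` into a column vector and doing a general
// matrix multiply, but with no transposed copy to allocate, update, or free.
void nnMatrixMulOuter(
    const nnMatrix* left, const nnMatrix* right, nnMatrix* out) {
  assert(left->rows == 1);
  assert(right->rows == 1);
  assert(out->rows == left->cols);
  assert(out->cols == right->cols);

  for (int i = 0; i < left->cols; ++i) {
    for (int j = 0; j < right->cols; ++j) {
      out->values[i * out->cols + j] = left->values[i] * right->values[j];
    }
  }
}

Under this contract, the call in the diff fills the layer_input_size x layer_output_size matrix allocated earlier with nnMatrixMake(layer_input_size, layer_output_size), whether the layer input is training_inputs (l == 0) or the previous layer's output.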