forward method - TransformerEncoderBlock class - aft_transformer_encoder_block library

dart_cuda package
documentation
aft_transformer_encoder_block.dart
TransformerEncoderBlock
forward method

forward method

Tensor forward(

Tensor x,
List<Tensor> tracker

)

`x`: input tensor of shape `[T, embedSize]`.

Implementation

/// Runs [x] through this encoder block and returns the block's output.
///
/// Two pre-norm residual sub-layers are applied in sequence:
///
/// 1. `ln1` -> `attention`, with the result added back onto [x].
/// 2. `ln2` -> `ffn`, with the result added back onto the first sum.
///
/// The tensors created directly in this method (the attention output, the
/// first residual sum, and the feed-forward output) are appended to
/// [tracker], in that order. The returned tensor is deliberately left out of
/// [tracker]; the caller is expected to take care of it.
///
/// NOTE(review): the layer-norm outputs are not appended here. Whether
/// `ln1`/`ln2` register their own results on [tracker] is not visible from
/// this method - confirm against their implementations.
Tensor forward(Tensor x, List<Tensor> tracker) {
  // Sub-layer 1: normalise, attend, then add the skip connection.
  final attended = attention.forward(ln1.forward(x, tracker), tracker);
  final afterAttention = x + attended;
  tracker
    ..add(attended)
    ..add(afterAttention);

  // Sub-layer 2: normalise, feed forward, then add the skip connection.
  final fedForward = ffn.forward(ln2.forward(afterAttention, tracker), tracker);
  final result = afterAttention + fedForward;

  // Only the feed-forward output is tracked; `result` is handed back to the
  // caller untracked.
  tracker.add(fedForward);
  return result;
}