PolicyGradient constructor

PolicyGradient({
  required int nActions,
  required List<int> policyLayers,
  int? seed,
  bool useBaseline = false,
})

Implementation

/// Creates a policy-gradient learner.
///
/// * [nActions] is stored on the instance as given.
///   (NOTE(review): presumably the size of the action space — confirm
///   against the rest of the class.)
/// * [policyLayers] is forwarded to the [ANN] that backs [policy]; it must
///   not be empty.
/// * [seed], when non-null, seeds both the internal [Random] and the policy
///   [ANN]; when null, an unseeded [Random] is used and `null` is forwarded
///   to [ANN].
/// * [useBaseline] is stored on the instance; it defaults to `false`.
///
/// The running `baseline` starts at `0.0`.
///
/// Throws an [ArgumentError] if [policyLayers] is empty. The check lives in
/// the initializer list (as a `throw` expression) so that it fires *before*
/// the [ANN] is constructed; a check in the constructor body would only run
/// after the network had already been built from the invalid layer list.
PolicyGradient({
  required this.nActions,
  required List<int> policyLayers,
  int? seed,
  this.useBaseline = false,
}) : _rand = seed != null ? Random(seed) : Random(),
     policy = ANN(
       // Validate first: initializers run before the constructor body.
       layers: policyLayers.isEmpty
           ? throw ArgumentError('policyLayers required')
           : policyLayers,
       seed: seed,
     ),
     baseline = 0.0;