Classic Control Environments Benchmarks

Segway

Run Parameters

n_runs: 25
n_epochs: 50
n_episodes: 100
n_episodes_test: 10

ConstrainedREPS:
  eps: 0.5
  kappa: 0.1
  n_episodes_per_fit: 25
PGPE:
  alpha: 0.3
  n_episodes_per_fit: 25
REPS:
  eps: 0.5
  n_episodes_per_fit: 25
RWR:
  beta: 0.01
  n_episodes_per_fit: 25
../../../_images/J11.png ../../../_images/R11.png

LQR

Run Parameters

n_runs: 25
n_epochs: 100
n_episodes: 100
n_episodes_test: 10

GPOMDP:
  alpha: 0.01
  n_episodes_per_fit: 25
REINFORCE:
  alpha: 0.01
  n_episodes_per_fit: 25
eNAC:
  alpha: 0.01
  n_episodes_per_fit: 25
../../../_images/J12.png ../../../_images/R12.png