| 0 | CartPole | { $s^0$, -4.8, push cart to the right } |
| 1 | CartPole | { $s^1$, 100, push cart to the right } |
| 2 | CartPole | { $s^2$, -0.42, push cart to the left } |
| 3 | CartPole | { $s^3$, -100, push cart to the left } |
| 4 | Acrobot | { $s^0$, -1, apply -1 torque } |
| 5 | Acrobot | { $s^1$, -1, apply 0 torque } |
| 6 | Acrobot | { $s^2$, -1, apply 1 torque } |
| 7 | Acrobot | { $s^3$, -1, apply -1 torque } |
| 8 | Acrobot | { $s^4$, 12.57, apply 0 torque } |
| 9 | Acrobot | { $s^5$, 28.27, apply 1 torque } |
| 10 | MountainCar | { $s^0$, -0.07, not accelerate } |
| 11 | MountainCar | { $s^1$, 0.07, accelerate to the right } |
| 12 | Pendulum | { $s^2$, 8, maximum left torque } |
| 13 | Pendulum | { $s^1$, -1, maximum right torque } |
| 14 | Pendulum | { $s^2$, -8, maximum right torque } |
| 15 | CartPole | { $s^0$, -4.8, push cart to the right }, { $s^2$, -0.42, push cart to the left } |
| 16 | CartPole | { $s^1$, 100, push cart to the right }, { $s^3$, -100, push cart to the left } |
| 17 | CartPole | { $s^0$, -4.8, push cart to the right }, { $s^3$, -100, push cart to the left } |
| 18 | CartPole | { $s^1$, 100, push cart to the right }, { $s^2$, -0.42, push cart to the left } |
| 19 | CartPole | { $s^0$, -4.8, push cart to the right }, { $s^1$, 100, push cart to the right }, { $s^2$, -0.42, push cart to the left }, { $s^3$, -100, push cart to the left } |
| 20 | Acrobot | { $s^3$, -1, apply -1 torque }, { $s^4$, 12.57, apply 0 torque }, { $s^5$, 28.27, apply 1 torque } |
| 21 | MountainCar | { $s^0$, -0.07, not accelerate }, { $s^1$, 0.07, accelerate to the right } |
| 22 | Pendulum | { $s^2$, 8, maximum left torque }, { $s^1$, -1, maximum right torque } |
| 23 | Pendulum | { $s^2$, 8, maximum left torque }, { $s^2$, -8, maximum right torque } |
| 24 | Pendulum | { $s^1$, -1, maximum right torque }, { $s^2$, -8, maximum right torque } |
| 25 | Pendulum | { $s^2$, 8, maximum left torque }, { $s^1$, -1, maximum right torque }, { $s^2$, -8, maximum right torque } |
| 26 | Lunar Lander | { $s^0$, 1.5, do nothing } |
| 27 | Lunar Lander | { $s^2$, -5, fire left orientation engine } |
| 28 | Lunar Lander | { $s^4$, 3.14, fire main engine } |
| 29 | Lunar Lander | { $s^6$, 0, fire right orientation engine } |
| 30 | Bipedal Walker | { $s^0$, 3.14, maximum forward speed } |
| 31 | Bipedal Walker | { $s^1$, 5, maximum backward speed } |
| 32 | Lunar Lander | { $s^0$, 1.5, do nothing }, { $s^4$, 3.14, fire main engine } |
| 33 | Lunar Lander | { $s^2$, -5, fire left orientation engine }, { $s^6$, 0, fire right orientation engine } |
| 34 | Lunar Lander | { $s^0$, 1.5, do nothing }, { $s^6$, 0, fire right orientation engine } |
| 35 | Lunar Lander | { $s^2$, -5, fire left orientation engine }, { $s^4$, 3.14, fire main engine } |
| 36 | Lunar Lander | { $s^0$, 1.5, do nothing }, { $s^2$, -5, fire left orientation engine }, { $s^4$, 3.14, fire main engine }, { $s^6$, 0, fire right orientation engine } |
| 37 | Bipedal Walker | { $s^0$, 3.14, maximum forward speed }, { $s^1$, 5, maximum backward speed } |
| 38 | Half Cheetah | { $s^1$, 5, apply a torque of 1 to all rotors } |
| 39 | Half Cheetah | { $s^2$, 5, apply a torque of -1 to all rotors } |
| 40 | Hopper | { $s^1$, 5, apply a torque of 1 to all rotors } |
| 41 | Hopper | { $s^2$, -5, apply a torque of -1 to all rotors } |
| 42 | Reacher | { $s^0$, 5, apply a torque of 1 to all rotors } |
| 43 | Reacher | { $s^1$, -5, apply a torque of -1 to all rotors } |
| 44 | Half Cheetah | { $s^1$, 5, apply a torque of 1 to all rotors }, { $s^2$, 5, apply a torque of -1 to all rotors } |
| 45 | Hopper | { $s^1$, 5, apply a torque of 1 to all rotors }, { $s^2$, -5, apply a torque of -1 to all rotors } |
| 46 | Reacher | { $s^0$, 5, apply a torque of 1 to all rotors }, { $s^1$, -5, apply a torque of -1 to all rotors } |