Furuta Pendulum

DP rFVI

Δm = -5g

Δm = -5g

Δm = -5g

Δm = -2g

Δm = -2g

Δm = -2g

Δm = 0g

Δm = 0g

Δm = 0g

Δm = +1g

Δm = +1g

Δm = +1g

Δm = +3g

Δm = +3g

Δm = +3g

Δm = +5g

Δm = +5g

Δm = +5g

DP cFVI

Δm = -5g

Δm = -5g

Δm = -5g

Δm = -2g

Δm = -2g

Δm = -2g

Δm = 0g

Δm = 0g

Δm = 0g

Δm = +1g

Δm = +1g

Δm = +1g

Δm = +3g

Δm = +3g

Δm = +3g

Δm = +5g

Δm = +5g

Δm = +5g

SAC-U UDR

Δm = -5g

Δm = -5g

Δm = -5g

Δm = -2g

Δm = -2g

Δm = -2g

Δm = 0g

Δm = 0g

Δm = 0g

Δm = +1g

Δm = +1g

Δm = +1g

Δm = +3g

Δm = +3g

Δm = +3g

Δm = +5g

Δm = +5g

Δm = +5g

PPO-U UDR

Δm = -5g

Δm = -5g

Δm = -5g

Δm = -2g

Δm = -2g

Δm = -2g

Δm = 0g

Δm = 0g

Δm = 0g

Δm = +1g

Δm = +1g

Δm = +1g

Δm = +3g

Δm = +3g

Δm = +3g

Δm = +5g

Δm = +5g

Δm = +5g

DDPG-U UDR

Δm = -5g

Δm = -5g

Δm = -5g

Δm = -2g

Δm = -2g

Δm = -2g

Δm = 0g

Δm = 0g

Δm = 0g

Δm = +1g

Δm = +1g

Δm = +1g

Δm = +3g

Δm = +3g

Δm = +3g

Δm = +5g

Δm = +5g

Δm = +5g