Furuta Pendulum
DP rFVI
Δm = -5g
Δm = -5g
Δm = -5g
Δm = -2g
Δm = -2g
Δm = -2g
Δm = 0g
Δm = 0g
Δm = 0g
Δm = +1g
Δm = +1g
Δm = +1g
Δm = +3g
Δm = +3g
Δm = +3g
Δm = +5g
Δm = +5g
Δm = +5g
DP cFVI
Δm = -5g
Δm = -5g
Δm = -5g
Δm = -2g
Δm = -2g
Δm = -2g
Δm = 0g
Δm = 0g
Δm = 0g
Δm = +1g
Δm = +1g
Δm = +1g
Δm = +3g
Δm = +3g
Δm = +3g
Δm = +5g
Δm = +5g
Δm = +5g
SAC-U UDR
Δm = -5g
Δm = -5g
Δm = -5g
Δm = -2g
Δm = -2g
Δm = -2g
Δm = 0g
Δm = 0g
Δm = 0g
Δm = +1g
Δm = +1g
Δm = +1g
Δm = +3g
Δm = +3g
Δm = +3g
Δm = +5g
Δm = +5g
Δm = +5g
PPO-U UDR
Δm = -5g
Δm = -5g
Δm = -5g
Δm = -2g
Δm = -2g
Δm = -2g
Δm = 0g
Δm = 0g
Δm = 0g
Δm = +1g
Δm = +1g
Δm = +1g
Δm = +3g
Δm = +3g
Δm = +3g
Δm = +5g
Δm = +5g
Δm = +5g
DDPG-U UDR
Δm = -5g
Δm = -5g
Δm = -5g
Δm = -2g
Δm = -2g
Δm = -2g
Δm = 0g
Δm = 0g
Δm = 0g
Δm = +1g
Δm = +1g
Δm = +1g
Δm = +3g
Δm = +3g
Δm = +3g
Δm = +5g
Δm = +5g
Δm = +5g