45 lines
782 B
Python
45 lines
782 B
Python
|
|
from enum import Enum, unique
|
|
|
|
@unique
class ClipType(Enum):
    """Integer-valued identifiers for the available clip types.

    Values are assigned explicitly and ``@unique`` guarantees that no two
    members share a value. The numbering is not contiguous: members are
    grouped into numeric ranges by name prefix and the gaps between the
    ranges are left unused. Several member names are referenced as plain
    strings by ``alg2cliptype`` in this module, so renaming a member
    requires updating that mapping as well.
    """

    # ratio* members
    ratio = 0
    ratio_rollback = 1
    ratio_strict = 2
    ratio_rollback_constant = 3

    a2c = 5

    # kl* members
    kl = 20
    kl_strict = 21
    kl_ratiorollback = 22
    kl_klrollback_constant = 23
    kl_klrollback = 24
    kl_klrollback_constant_withratio = 25

    # kl2clip* members
    kl2clip = 31
    kl2clip_rollback = 32

    adaptivekl = 40

    adaptiverange_advantage = 50

    # wasserstein* members
    wasserstein = 60
    wasserstein_rollback_constant = 61

    # totalvariation* members (note: 71 is intentionally left as in the
    # original numbering; the rollback variant uses 72)
    totalvariation = 70
    totalvariation_rollback_constant = 72
|
|
|
|
# String identifiers, presumably naming the supported environment
# families (verify against callers).
MUJOCO = 'mujoco'
ATARI = 'atari'
|
|
|
|
# Maps a short name (presumably an algorithm name -- verify against callers)
# to the *name* of a ClipType member. The values are plain strings, not
# ClipType members; resolve one with ``ClipType[alg2cliptype[name]]``.
alg2cliptype = {
    'ppo': 'ratio',
    'trgppo': 'kl2clip',
    'pporb': 'ratio_rollback',
    'trppo': 'kl',
    'trpporb': 'kl_ratiorollback',
    'trulyppo': 'kl_klrollback_constant_withratio',
}