16 lines
479 B
Python
16 lines
479 B
Python
import datetime
|
|
from typing import NamedTuple, Optional
|
|
|
|
|
|
class PPOConfig(NamedTuple):
    """Immutable bundle of PPO settings; every field has a default.

    ``PPOConfig()`` is therefore valid on its own. Override individual
    values with keyword arguments or with ``_replace``.

    NOTE(review): all defaults are evaluated once, when this class is
    defined, which has two consequences:

    * ``NNShape``'s default is a single list object shared by every instance
      that does not pass its own value, so mutating it in place (for example
      with ``append``) leaks into later instances. Treat it as read-only.
    * ``saveDir``'s timestamp reflects the moment the module was imported,
      not the moment a ``PPOConfig`` is created.
    """

    # Presumably the hidden-layer widths of the networks -- confirm against
    # the code that builds the model.
    NNShape: list = [256, 256, 128]

    actorLR: float = 2e-3  # Actor network learning rate.
    criticLR: float = 2e-3  # Critic network learning rate.

    gamma: float = 0.99  # Presumably the reward discount factor -- confirm.
    lmbda: float = 0.95  # Presumably the GAE lambda -- confirm.
    clipRange: float = 0.20
    entropyWeight: float = 1e-2
    trainEpochs: int = 8

    # "PPO-Model/<MMDD-HHMM>/", stamped with the local time at class
    # definition (see the note in the class docstring).
    saveDir: str = "PPO-Model/" + datetime.datetime.now().strftime("%m%d-%H%M") + "/"

    # None by default; presumably means "do not load an existing model" --
    # confirm with the consumer of this field.
    loadModelDir: Optional[str] = None
|