Safe Haskell | None |
---|---|
Language | Haskell2010 |
Soft Actor Critic Algorithm Defaults
Synopsis
- algorithm :: Algorithm
- verbose :: Bool
- bufferType :: BufferType
- numSteps :: Int
- numEpochs :: Int
- numIterations :: Int
- earlyStop :: Tensor
- minReward :: Float
- batchSize :: Int
- rngSeed :: Int
- maxTime :: Float
- aceId :: String
- aceBackend :: String
- aceVariant :: Int
- γ :: Tensor
- τ :: Tensor
- εNoise :: Tensor
- αLearned :: Bool
- αInit :: Tensor
- σMin :: Float
- σMax :: Float
- rewardScale :: Tensor
- ρ :: Tensor
- d :: Int
- εConst :: Tensor
- wInit :: Float
- ηπ :: Tensor
- ηq :: Tensor
- ηα :: Tensor
- β1 :: Float
- β2 :: Float
- bufferSize :: Int
- αStart :: Float
- βStart :: Float
- βFrames :: Int
- η0 :: Float
- ηT :: Float
- cMin :: Int
- strategy :: Strategy
- k :: Int
- relTol :: Tensor
Documentation
bufferType :: BufferType Source #
Replay Buffer Type
numIterations :: Int Source #
Total number of iterations; depends on `bufferType`.
aceBackend :: String Source #
PDK/Technology backend of the ACE Environment
aceVariant :: Int Source #
ACE Environment variant
rewardScale :: Tensor Source #
Reward Scaling Factor
bufferSize :: Int Source #
Maximum size of Replay Buffer