Safe Haskell | None |
---|---|
Language | Haskell2010 |
Soft Actor Critic Algorithm Defaults
Synopsis
- algorithm :: Algorithm
- data ActorNetSpec = ActorNetSpec {}
- data CriticNetSpec = CriticNetSpec {}
- data ActorNet = ActorNet {}
- data CriticNet = CriticNet {}
- data Agent = Agent {}
- mkAgent :: Int -> Int -> IO Agent
- saveAgent :: String -> Agent -> IO ()
- saveAgent' :: String -> Agent -> IO Agent
- loadAgent :: String -> Int -> Int -> Int -> IO Agent
- π :: ActorNet -> Tensor -> (Tensor, Tensor)
- q :: CriticNet -> Tensor -> Tensor -> Tensor
- q' :: CriticNet -> CriticNet -> Tensor -> Tensor -> Tensor
- actRandom :: Agent -> Tensor -> IO Tensor
- act :: Agent -> Tensor -> IO Tensor
- evaluate :: Agent -> Tensor -> Tensor -> IO (Tensor, Tensor)
- train :: Int -> Int -> HymURL -> TrackingURI -> IO Agent
Documentation
data ActorNetSpec Source #
Actor Network Specification
Instances
Eq ActorNetSpec Source # | |
Defined in SAC (==) :: ActorNetSpec -> ActorNetSpec -> Bool # (/=) :: ActorNetSpec -> ActorNetSpec -> Bool # | |
Show ActorNetSpec Source # | |
Defined in SAC showsPrec :: Int -> ActorNetSpec -> ShowS # show :: ActorNetSpec -> String # showList :: [ActorNetSpec] -> ShowS # | |
Randomizable ActorNetSpec ActorNet Source # | Actor Network Weight initialization |
data CriticNetSpec Source #
Critic Network Specification
Instances
Eq CriticNetSpec Source # | |
Defined in SAC (==) :: CriticNetSpec -> CriticNetSpec -> Bool # (/=) :: CriticNetSpec -> CriticNetSpec -> Bool # | |
Show CriticNetSpec Source # | |
Defined in SAC showsPrec :: Int -> CriticNetSpec -> ShowS # show :: CriticNetSpec -> String # showList :: [CriticNetSpec] -> ShowS # | |
Randomizable CriticNetSpec CriticNet Source # | Critic Network Weight initialization |
data ActorNet Source #
Actor Network Architecture
Instances
Show ActorNet Source # | |
Generic ActorNet Source # | |
Parameterized ActorNet Source # | |
Defined in SAC flattenParameters :: ActorNet -> [Parameter] # | |
Randomizable ActorNetSpec ActorNet Source # | Actor Network Weight initialization |
type Rep ActorNet Source # | |
Defined in SAC type Rep ActorNet = D1 ('MetaData "ActorNet" "SAC" "edelwace-0.1.0.0-NlkYKOSwr4E6F4MQQAmdJ" 'False) (C1 ('MetaCons "ActorNet" 'PrefixI 'True) ((S1 ('MetaSel ('Just "pLayer0") 'NoSourceUnpackedness 'NoSourceStrictness 'DecidedLazy) (Rec0 Linear) :*: S1 ('MetaSel ('Just "pLayer1") 'NoSourceUnpackedness 'NoSourceStrictness 'DecidedLazy) (Rec0 Linear)) :*: (S1 ('MetaSel ('Just "pLayerμ") 'NoSourceUnpackedness 'NoSourceStrictness 'DecidedLazy) (Rec0 Linear) :*: S1 ('MetaSel ('Just "pLayerσ") 'NoSourceUnpackedness 'NoSourceStrictness 'DecidedLazy) (Rec0 Linear)))) |
data CriticNet Source #
Critic Network Architecture
Instances
Show CriticNet Source # | |
Generic CriticNet Source # | |
Parameterized CriticNet Source # | |
Defined in SAC flattenParameters :: CriticNet -> [Parameter] # | |
Randomizable CriticNetSpec CriticNet Source # | Critic Network Weight initialization |
type Rep CriticNet Source # | |
Defined in SAC type Rep CriticNet = D1 ('MetaData "CriticNet" "SAC" "edelwace-0.1.0.0-NlkYKOSwr4E6F4MQQAmdJ" 'False) (C1 ('MetaCons "CriticNet" 'PrefixI 'True) (S1 ('MetaSel ('Just "qLayer0") 'NoSourceUnpackedness 'NoSourceStrictness 'DecidedLazy) (Rec0 Linear) :*: (S1 ('MetaSel ('Just "qLayer1") 'NoSourceUnpackedness 'NoSourceStrictness 'DecidedLazy) (Rec0 Linear) :*: S1 ('MetaSel ('Just "qLayer2") 'NoSourceUnpackedness 'NoSourceStrictness 'DecidedLazy) (Rec0 Linear)))) |
data Agent Source #
SAC Agent
Agent | |
|
Instances
actRandom :: Agent -> Tensor -> IO Tensor Source #
Perform a completely random action for a given state