Safe Haskell | None |
---|---|
Language | Haskell2010 |
Proximal Policy Optimization Algorithm
Synopsis
- algorithm :: Algorithm
- data ActorNetSpec = ActorNetSpec {}
- newtype CriticNetSpec = CriticNetSpec {}
- data ActorNet = ActorNet {}
- data CriticNet = CriticNet {}
- data Agent = Agent {}
- mkAgent :: Int -> Int -> IO Agent
- saveAgent :: String -> Agent -> IO ()
- saveAgent' :: String -> Agent -> IO Agent
- loadAgent :: String -> Int -> Int -> Int -> IO Agent
- π :: ActorNet -> Tensor -> Tensor
- q :: CriticNet -> Tensor -> Tensor
- train :: Int -> Int -> HymURL -> TrackingURI -> IO Agent
Documentation
data ActorNetSpec Source #
Actor Network Specification
Instances
Eq ActorNetSpec Source # | |
Defined in PPO (==) :: ActorNetSpec -> ActorNetSpec -> Bool # (/=) :: ActorNetSpec -> ActorNetSpec -> Bool # | |
Show ActorNetSpec Source # | |
Defined in PPO showsPrec :: Int -> ActorNetSpec -> ShowS # show :: ActorNetSpec -> String # showList :: [ActorNetSpec] -> ShowS # | |
Randomizable ActorNetSpec ActorNet Source # | Actor Network Weight initialization |
newtype CriticNetSpec Source #
Critic Network Specification
Instances
Eq CriticNetSpec Source # | |
Defined in PPO (==) :: CriticNetSpec -> CriticNetSpec -> Bool # (/=) :: CriticNetSpec -> CriticNetSpec -> Bool # | |
Show CriticNetSpec Source # | |
Defined in PPO showsPrec :: Int -> CriticNetSpec -> ShowS # show :: CriticNetSpec -> String # showList :: [CriticNetSpec] -> ShowS # | |
Randomizable CriticNetSpec CriticNet Source # | Critic Network Weight initialization |
data ActorNet Source #
Actor Network Architecture
Instances
Show ActorNet Source # | |
Generic ActorNet Source # | |
Parameterized ActorNet Source # | |
Defined in PPO flattenParameters :: ActorNet -> [Parameter] # | |
Randomizable ActorNetSpec ActorNet Source # | Actor Network Weight initialization |
type Rep ActorNet Source # | |
Defined in PPO type Rep ActorNet = D1 ('MetaData "ActorNet" "PPO" "edelwace-0.1.0.0-NlkYKOSwr4E6F4MQQAmdJ" 'False) (C1 ('MetaCons "ActorNet" 'PrefixI 'True) (S1 ('MetaSel ('Just "pLayer0") 'NoSourceUnpackedness 'NoSourceStrictness 'DecidedLazy) (Rec0 Linear) :*: (S1 ('MetaSel ('Just "pLayer1") 'NoSourceUnpackedness 'NoSourceStrictness 'DecidedLazy) (Rec0 Linear) :*: S1 ('MetaSel ('Just "pLayer2") 'NoSourceUnpackedness 'NoSourceStrictness 'DecidedLazy) (Rec0 Linear)))) |
data CriticNet Source #
Critic Network Architecture
Instances
Show CriticNet Source # | |
Generic CriticNet Source # | |
Parameterized CriticNet Source # | |
Defined in PPO flattenParameters :: CriticNet -> [Parameter] # | |
Randomizable CriticNetSpec CriticNet Source # | Critic Network Weight initialization |
type Rep CriticNet Source # | |
Defined in PPO type Rep CriticNet = D1 ('MetaData "CriticNet" "PPO" "edelwace-0.1.0.0-NlkYKOSwr4E6F4MQQAmdJ" 'False) (C1 ('MetaCons "CriticNet" 'PrefixI 'True) (S1 ('MetaSel ('Just "qLayer0") 'NoSourceUnpackedness 'NoSourceStrictness 'DecidedLazy) (Rec0 Linear) :*: (S1 ('MetaSel ('Just "qLayer1") 'NoSourceUnpackedness 'NoSourceStrictness 'DecidedLazy) (Rec0 Linear) :*: S1 ('MetaSel ('Just "qLayer2") 'NoSourceUnpackedness 'NoSourceStrictness 'DecidedLazy) (Rec0 Linear)))) |
data Agent Source #
PPO Agent
Instances
Show Agent Source # | |
Generic Agent Source # | |
type Rep Agent Source # | |
Defined in PPO type Rep Agent = D1 ('MetaData "Agent" "PPO" "edelwace-0.1.0.0-NlkYKOSwr4E6F4MQQAmdJ" 'False) (C1 ('MetaCons "Agent" 'PrefixI 'True) ((S1 ('MetaSel ('Just "φ") 'NoSourceUnpackedness 'NoSourceStrictness 'DecidedLazy) (Rec0 ActorNet) :*: S1 ('MetaSel ('Just "θ") 'NoSourceUnpackedness 'NoSourceStrictness 'DecidedLazy) (Rec0 CriticNet)) :*: (S1 ('MetaSel ('Just "logStd") 'NoSourceUnpackedness 'NoSourceStrictness 'DecidedLazy) (Rec0 IndependentTensor) :*: S1 ('MetaSel ('Just "optim") 'NoSourceUnpackedness 'NoSourceStrictness 'DecidedLazy) (Rec0 Adam)))) |