Safe Haskell | None |
---|---|
Language | Haskell2010 |
Twin Delayed Deep Deterministic Policy Gradient Algorithm
Synopsis
- algorithm :: Algorithm
- data ActorNetSpec = ActorNetSpec {}
- data CriticNetSpec = CriticNetSpec {}
- data ActorNet = ActorNet {}
- data CriticNet = CriticNet {}
- data Agent = Agent {}
- mkAgent :: Int -> Int -> IO Agent
- saveAgent :: String -> Agent -> IO ()
- saveAgent' :: String -> Agent -> IO Agent
- loadAgent :: String -> Int -> Int -> Int -> IO Agent
- π :: ActorNet -> Tensor -> Tensor
- q :: CriticNet -> Tensor -> Tensor -> (Tensor, Tensor)
- q' :: CriticNet -> Tensor -> Tensor -> Tensor
- act :: Agent -> Tensor -> IO Tensor
- act' :: Int -> Agent -> Tensor -> IO Tensor
- evaluate :: Agent -> Tensor -> IO Tensor
- train :: Int -> Int -> HymURL -> TrackingURI -> IO Agent
- updatePolicy :: Int -> Agent -> Tracker -> Buffer Tensor -> Int -> IO Agent
Documentation
data ActorNetSpec Source #
Actor Network Specification
Instances
Eq ActorNetSpec Source # | |
Defined in TD3 (==) :: ActorNetSpec -> ActorNetSpec -> Bool # (/=) :: ActorNetSpec -> ActorNetSpec -> Bool # | |
Show ActorNetSpec Source # | |
Defined in TD3 showsPrec :: Int -> ActorNetSpec -> ShowS # show :: ActorNetSpec -> String # showList :: [ActorNetSpec] -> ShowS # | |
Randomizable ActorNetSpec ActorNet Source # | Actor Network Weight initialization |
data CriticNetSpec Source #
Critic Network Specification
Instances
Eq CriticNetSpec Source # | |
Defined in TD3 (==) :: CriticNetSpec -> CriticNetSpec -> Bool # (/=) :: CriticNetSpec -> CriticNetSpec -> Bool # | |
Show CriticNetSpec Source # | |
Defined in TD3 showsPrec :: Int -> CriticNetSpec -> ShowS # show :: CriticNetSpec -> String # showList :: [CriticNetSpec] -> ShowS # | |
Randomizable CriticNetSpec CriticNet Source # | Critic Network Weight initialization |
data ActorNet Source #
Actor Network Architecture
Instances
Show ActorNet Source # | |
Generic ActorNet Source # | |
Parameterized ActorNet Source # | |
Defined in TD3 flattenParameters :: ActorNet -> [Parameter] # | |
Randomizable ActorNetSpec ActorNet Source # | Actor Network Weight initialization |
type Rep ActorNet Source # | |
Defined in TD3 type Rep ActorNet = D1 ('MetaData "ActorNet" "TD3" "edelwace-0.1.0.0-NlkYKOSwr4E6F4MQQAmdJ" 'False) (C1 ('MetaCons "ActorNet" 'PrefixI 'True) (S1 ('MetaSel ('Just "pLayer0") 'NoSourceUnpackedness 'NoSourceStrictness 'DecidedLazy) (Rec0 Linear) :*: (S1 ('MetaSel ('Just "pLayer1") 'NoSourceUnpackedness 'NoSourceStrictness 'DecidedLazy) (Rec0 Linear) :*: S1 ('MetaSel ('Just "pLayer2") 'NoSourceUnpackedness 'NoSourceStrictness 'DecidedLazy) (Rec0 Linear)))) |
data CriticNet Source #
Critic Network Architecture
Instances
data Agent Source #
TD3 Agent
Instances
Show Agent Source # | |
Generic Agent Source # | |
type Rep Agent Source # | |
Defined in TD3 type Rep Agent = D1 ('MetaData "Agent" "TD3" "edelwace-0.1.0.0-NlkYKOSwr4E6F4MQQAmdJ" 'False) (C1 ('MetaCons "Agent" 'PrefixI 'True) ((S1 ('MetaSel ('Just "\966") 'NoSourceUnpackedness 'NoSourceStrictness 'DecidedLazy) (Rec0 ActorNet) :*: (S1 ('MetaSel ('Just "\966'") 'NoSourceUnpackedness 'NoSourceStrictness 'DecidedLazy) (Rec0 ActorNet) :*: S1 ('MetaSel ('Just "\952") 'NoSourceUnpackedness 'NoSourceStrictness 'DecidedLazy) (Rec0 CriticNet))) :*: (S1 ('MetaSel ('Just "\952'") 'NoSourceUnpackedness 'NoSourceStrictness 'DecidedLazy) (Rec0 CriticNet) :*: (S1 ('MetaSel ('Just "\966Optim") 'NoSourceUnpackedness 'NoSourceStrictness 'DecidedLazy) (Rec0 Adam) :*: S1 ('MetaSel ('Just "\952Optim") 'NoSourceUnpackedness 'NoSourceStrictness 'DecidedLazy) (Rec0 Adam))))) |
q' :: CriticNet -> Tensor -> Tensor -> Tensor Source #
Convenience Function, takes the minimum of both online critics
act :: Agent -> Tensor -> IO Tensor Source #
Get action from online policy with naive / static Exploration Noise
act' :: Int -> Agent -> Tensor -> IO Tensor Source #
Get action from online policy with dynamic Exploration Noise