protovoices-rl-0.1.0.0
Safe Haskell: None
Language: GHC2021

RL

Documentation

trainDQN :: forall (dev :: (DeviceType, Nat)) gen tr tr' slc slc' s f h. (IsValidDevice dev, StatefulGen gen IO, Show s, Show f, Show h, s ~ Split SPitch, f ~ Freeze SPitch, h ~ Spread SPitch, Show slc, Show tr) => gen -> Eval tr tr' slc slc' h (Leftmost s f h) -> (GreedyState tr tr' slc (Leftmost s f h) -> Action slc tr s f h -> QEncoding dev ('[] :: [Nat])) -> (Analysis s f h tr slc -> IO QType) -> (Action slc tr s f h -> Maybe Bool -> IO QType) -> [Path slc' tr'] -> Int -> IO ([QType], [QType], QModel dev) Source #

trainA2C Source #

Arguments

:: forall (dev :: (DeviceType, Nat)) label. IsValidDevice dev 
=> Eval (Edges SPitch) [Edge SPitch] (Notes SPitch) [Note SPitch] (Spread SPitch) (PVLeftmost SPitch) 
-> IOGenM StdGen 
-> PVRewardFn label 
-> (QType -> QType)

learning rate schedule

-> (QType -> QType)

temperature schedule

-> Maybe [QType] 
-> QModel dev 
-> QModel dev 
-> [(Path [Note SPitch] [Edge SPitch], label)] 
-> Int 
-> IO ([[QType]], [QType], QModel dev, QModel dev) 

module RL.Model