| Safe Haskell | None |
|---|---|
| Language | GHC2021 |

# RL

## Documentation

- `module RL.ModelTypes`
- `module RL.Callbacks`

```haskell
trainDQN
  :: forall (dev :: (DeviceType, Nat)) gen tr tr' slc slc' s f h
   . ( IsValidDevice dev
     , StatefulGen gen IO
     , Show s
     , Show f
     , Show h
     , s ~ Split SPitch
     , f ~ Freeze SPitch
     , h ~ Spread SPitch
     , Show slc
     , Show tr
     )
  => gen
  -> Eval tr tr' slc slc' h (Leftmost s f h)
  -> (GreedyState tr tr' slc (Leftmost s f h) -> Action slc tr s f h -> QEncoding dev ('[] :: [Nat]))
  -> (Analysis s f h tr slc -> IO QType)
  -> (Action slc tr s f h -> Maybe Bool -> IO QType)
  -> [Path slc' tr']
  -> Int
  -> IO ([QType], [QType], QModel dev)
```

Arguments

| Type | Description |
|---|---|
| `:: forall (dev :: (DeviceType, Nat)) label. IsValidDevice dev` | |
| `=> Eval (Edges SPitch) [Edge SPitch] (Notes SPitch) [Note SPitch] (Spread SPitch) (PVLeftmost SPitch)` | |
| `-> IOGenM StdGen` | |
| `-> PVRewardFn label` | |
| `-> (QType -> QType)` | learning rate schedule |
| `-> (QType -> QType)` | temperature schedule |
| `-> Maybe [QType]` | |
| `-> QModel dev` | |
| `-> QModel dev` | |
| `-> [(Path [Note SPitch] [Edge SPitch], label)]` | |
| `-> Int` | |
| `-> IO ([[QType]], [QType], QModel dev, QModel dev)` | |


- `module RL.Encoding`
- `module RL.Model`
- `module RL.Plotting`