object Episode
- Source: Episode.scala
- Linear supertypes: AnyRef, Any
Type Members
- case class Moment[Obs, A, R, M[_]](policy: Policy[Obs, A, R, M, M], state: State[Obs, A, R, M]) extends Product with Serializable
  Wrapper around a combination of state and policy. A moment in time; this wraps up a common thing that we interact with...
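For illustration, a hedged sketch of constructing one. `Board`, `Move`, `myPolicy`, and `startingBoard` are hypothetical names, with cats.Id standing in for the effect type M; any concrete Policy/State pair with matching type parameters would do:

```scala
import cats.Id

// Hypothetical stand-ins: any concrete Policy[Obs, A, R, M, M] and
// State[Obs, A, R, M] pair works. `Board` and `Move` are invented names.
val policy: Policy[Board, Move, Double, Id, Id] = myPolicy      // assumed to exist
val state: State[Board, Move, Double, Id] = startingBoard       // assumed to exist

// A Moment pairs the two so they can be threaded through an episode together.
val moment: Episode.Moment[Board, Move, Double, Id] =
  Episode.Moment(policy, state)
```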
Value Members
- def firstVisit[Obs, A, R, M[_]](moment: Moment[Obs, A, R, M])(implicit arg0: Monad[M]): M[(Moment[Obs, A, R, M], Trajectory[Obs, A, R, M])]
  Specialized version of playEpisode that only performs an update the first time each state is seen during the episode.
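A sketch using the hypothetical moment from the Moment example above:

```scala
// First-visit variant of playEpisode: an update fires only on the first
// occurrence of each state, as in first-visit Monte Carlo methods.
// With M = cats.Id, the wrapped result is just the pair itself.
val (endMoment, trajectory) = Episode.firstVisit(moment)
```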
- def playEpisode[Obs, A, R, M[_], T](moment: Moment[Obs, A, R, M], tracker: Tracker[Obs, A, R, T, M])(implicit arg0: Monad[M]): M[(Moment[Obs, A, R, M], Trajectory[Obs, A, R, M])]
  Takes a policy and a starting state and returns an M containing the final policy, the final state, and the trajectory that got us there.
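A sketch under the same hypothetical setup as the Moment example; the `tracker` value is a stand-in, since its constructors are not documented on this page:

```scala
// One full episode: the tracker (a hypothetical
// Tracker[Board, Move, Double, T, Id] value) observes each step, and the
// returned trajectory records how we reached the final state.
val (endMoment, trajectory) = Episode.playEpisode(moment, tracker)
```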
- def playMany[Obs, A, R, M[_]](moments: List[Moment[Obs, A, R, M]])(rewardSum: (List[SARS[Obs, A, R, M]]) ⇒ R)(implicit arg0: Monad[M]): M[(List[Moment[Obs, A, R, M]], R)]
  Takes a list of (policy, initial state) pairs and plays a single episode of a game with each of them.
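A sketch reusing the hypothetical setup above; note that the `reward` accessor on SARS is a guess, not a documented field:

```scala
// One episode per starting moment; each episode's SARS transitions are
// folded into a single reward by the supplied function. Summing is one
// obvious choice when R = Double.
val (endMoments, totalReward) =
  Episode.playMany(List(momentA, momentB))(sars => sars.map(_.reward).sum)
```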
- def playManyN[Obs, A, R, M[_]](moments: List[Moment[Obs, A, R, M]], nTimes: Int)(rewardSum: (List[SARS[Obs, A, R, M]]) ⇒ R)(implicit arg0: Monad[M]): M[(List[Moment[Obs, A, R, M]], List[R])]
  Takes an initial set of policies and a state... We could definitely adapt this to do some serious learning on the policies, and use the MonoidAggregator stuff.
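A similar sketch; again the `reward` accessor is an assumption, and the returned List[R] presumably holds one aggregated reward per round:

```scala
// Like playMany, but repeated nTimes; the per-round rewards make it
// easy to watch learning progress across rounds.
val (endMoments, rewardPerRound) =
  Episode.playManyN(List(momentA, momentB), nTimes = 100)(sars => sars.map(_.reward).sum)
```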
ScalaRL
This is the API documentation for the ScalaRL functional reinforcement learning library.
Further documentation for ScalaRL can be found at the documentation site.
Check out the ScalaRL package list for all the goods.