UCB

Companion object UCB

case class UCB[Obs, A, R, T, S[_]](config: Config[R, T], valueFn: ActionValueFn[Obs, A, Choice[T]], time: Time) extends Policy[Obs, A, R, Cat, S] with Product with Serializable

Source: UCB.scala

Linear Supertypes

scala.Serializable, java.io.Serializable, Product, Equals, Policy[Obs, A, R, Cat, S], AnyRef, Any

Ordering

Alphabetic
By Inheritance

Inherited

UCB
Serializable
Serializable
Product
Equals
Policy
AnyRef
Any

Hide All
Show All

Visibility

Public
All

Instance Constructors

new UCB(config: Config[R, T], valueFn: ActionValueFn[Obs, A, Choice[T]], time: Time)

Type Members

type This = Policy[Obs, A, R, Cat, S]

Definition Classes
Policy

Value Members

final def !=(arg0: Any): Boolean

Definition Classes
AnyRef → Any
final def ##(): Int

Definition Classes
AnyRef → Any
final def ==(arg0: Any): Boolean

Definition Classes
AnyRef → Any
final def asInstanceOf[T0]: T0

Definition Classes
Any
def choose(state: State[Obs, A, R, S]): Cat[A]

Definition Classes
UCB → Policy
def clone(): AnyRef

Attributes
protected[lang]
Definition Classes
AnyRef
Annotations
@throws( classOf[java.lang.CloneNotSupportedException] ) @native()
val config: Config[R, T]
def contramapObservation[P](f: (P) ⇒ Obs)(implicit S: Functor[S]): Policy[P, A, R, Cat, S]

Definition Classes
Policy
def contramapReward[T](f: (T) ⇒ R)(implicit S: Functor[S]): Policy[Obs, A, T, Cat, S]

Definition Classes
Policy
final def eq(arg0: AnyRef): Boolean

Definition Classes
AnyRef
def finalize(): Unit

Attributes
protected[lang]
Definition Classes
AnyRef
Annotations
@throws( classOf[java.lang.Throwable] )
final def getClass(): Class[_]

Definition Classes
AnyRef → Any
Annotations
@native()
final def isInstanceOf[T0]: Boolean

Definition Classes
Any
def learn(sars: SARS[Obs, A, R, S]): This
learn now passes directly through to the ActionValueFn; this delegation is new. Open questions: does this mean that the policy shouldn't learn at all? Should learning be delegated to an agent instead?

Definition Classes
UCB → Policy
def mapK[N[_]](f: FunctionK[Cat, N]): Policy[Obs, A, R, N, S]
Experimental: an idea to see whether stochastic deciders can be made out of deterministic deciders. We'll see how this develops.

Definition Classes
Policy
final def ne(arg0: AnyRef): Boolean

Definition Classes
AnyRef
final def notify(): Unit

Definition Classes
AnyRef
Annotations
@native()
final def notifyAll(): Unit

Definition Classes
AnyRef
Annotations
@native()
final def synchronized[T0](arg0: ⇒ T0): T0

Definition Classes
AnyRef
val time: Time
val valueFn: ActionValueFn[Obs, A, Choice[T]]
final def wait(): Unit

Definition Classes
AnyRef
Annotations
@throws( classOf[java.lang.InterruptedException] )
final def wait(arg0: Long, arg1: Int): Unit

Definition Classes
AnyRef
Annotations
@throws( classOf[java.lang.InterruptedException] )
final def wait(arg0: Long): Unit

Definition Classes
AnyRef
Annotations
@throws( classOf[java.lang.InterruptedException] ) @native()

Packages

ScalaRL

UCB

Companion object UCB

case class UCB[Obs, A, R, T, S[_]](config: Config[R, T], valueFn: ActionValueFn[Obs, A, Choice[T]], time: Time) extends Policy[Obs, A, R, Cat, S] with Product with Serializable

Instance Constructors

Type Members

Value Members

Inherited from Serializable

Inherited from Serializable

Inherited from Product

Inherited from Equals

Inherited from Policy[Obs, A, R, Cat, S]

Inherited from AnyRef

Inherited from Any

Ungrouped

Packages

ScalaRL

UCB 

Companion object UCB

case class UCB[Obs, A, R, T, S[_]](config: Config[R, T], valueFn: ActionValueFn[Obs, A, Choice[T]], time: Time) extends Policy[Obs, A, R, Cat, S] with Product with Serializable

Instance Constructors

Type Members

Value Members

Inherited from Serializable

Inherited from Serializable

Inherited from Product

Inherited from Equals

Inherited from Policy[Obs, A, R, Cat, S]

Inherited from AnyRef

Inherited from Any

Ungrouped

UCB