LSPI Python
lspi
lspi package
Submodules
lspi.basis_functions module
lspi.domains module
lspi.lspi module
lspi.policy module
lspi.sample module
lspi.solvers module
Module contents
LSPI Python
Docs » Index
_ | A | B | C | D | E | F | G | H | L | M | N | O | P | R | S
_
__copy__() (lspi.policy.Policy method)
__repr__() (lspi.sample.Sample method)
A
action_name() (lspi.domains.ChainDomain method)
action_name() (lspi.domains.Domain method)
apply_action() (lspi.domains.ChainDomain method)
apply_action() (lspi.domains.Domain method)
B
BasisFunction (class in lspi.basis_functions)
best_action() (lspi.policy.Policy method)
C
calc_q_value() (lspi.policy.Policy method)
ChainDomain (class in lspi.domains)
ChainDomain.RewardLocation (class in lspi.domains)
current_state() (lspi.domains.ChainDomain method)
current_state() (lspi.domains.Domain method)
D
Domain (class in lspi.domains)
E
Ends (lspi.domains.ChainDomain.RewardLocation attribute)
evaluate() (lspi.basis_functions.BasisFunction method)
evaluate() (lspi.basis_functions.ExactBasis method)
evaluate() (lspi.basis_functions.FakeBasis method)
evaluate() (lspi.basis_functions.OneDimensionalPolynomialBasis method)
evaluate() (lspi.basis_functions.RadialBasisFunction method)
ExactBasis (class in lspi.basis_functions)
F
FakeBasis (class in lspi.basis_functions)
FirstWins (lspi.policy.Policy.TieBreakingStrategy attribute)
G
get_state_action_index() (lspi.basis_functions.ExactBasis method)
H
HalfMiddles (lspi.domains.ChainDomain.RewardLocation attribute)
L
LastWins (lspi.policy.Policy.TieBreakingStrategy attribute)
learn() (in module lspi.lspi)
lspi (module)
lspi.basis_functions (module)
lspi.domains (module)
lspi.lspi (module)
lspi.policy (module)
lspi.sample (module)
lspi.solvers (module)
LSTDQSolver (class in lspi.solvers)
M
Middle (lspi.domains.ChainDomain.RewardLocation attribute)
N
num_actions (lspi.basis_functions.BasisFunction attribute)
num_actions (lspi.basis_functions.ExactBasis attribute)
num_actions (lspi.basis_functions.FakeBasis attribute)
num_actions (lspi.basis_functions.OneDimensionalPolynomialBasis attribute)
num_actions (lspi.basis_functions.RadialBasisFunction attribute)
num_actions (lspi.policy.Policy attribute)
num_actions() (lspi.domains.ChainDomain method)
num_actions() (lspi.domains.Domain method)
O
OneDimensionalPolynomialBasis (class in lspi.basis_functions)
P
Policy (class in lspi.policy)
Policy.TieBreakingStrategy (class in lspi.policy)
R
RadialBasisFunction (class in lspi.basis_functions)
random() (in module lspi.domains)
RandomWins (lspi.policy.Policy.TieBreakingStrategy attribute)
reset() (lspi.domains.ChainDomain method)
reset() (lspi.domains.Domain method)
S
Sample (class in lspi.sample)
select_action() (lspi.policy.Policy method)
size() (lspi.basis_functions.BasisFunction method)
size() (lspi.basis_functions.ExactBasis method)
size() (lspi.basis_functions.FakeBasis method)
size() (lspi.basis_functions.OneDimensionalPolynomialBasis method)
size() (lspi.basis_functions.RadialBasisFunction method)
solve() (lspi.solvers.LSTDQSolver method)
solve() (lspi.solvers.Solver method)
Solver (class in lspi.solvers)