ChainerRL
stable
Installation
Quickstart Guide
API Reference
ChainerRL
Docs » Index
Edit on GitHub
Index
_ | A | B | C | D | E | F | G | I | K | L | M | N | P | Q | R | S | T | U
_
__call__() (chainerrl.policy.Policy method)
__call__() (chainerrl.q_function.StateActionQFunction method)
__call__() (chainerrl.q_function.StateQFunction method)
A
A2C (class in chainerrl.agents)
A3C (class in chainerrl.agents)
ACER (class in chainerrl.agents)
act() (chainerrl.agent.Agent method)
act_and_train() (chainerrl.agent.Agent method)
ActionValue (class in chainerrl.action_value)
AdditiveGaussian (class in chainerrl.explorers)
AdditiveOU (class in chainerrl.explorers)
Agent (class in chainerrl.agent)
AL (class in chainerrl.agents)
append() (chainerrl.replay_buffer.ReplayBuffer method)
B
Boltzmann (class in chainerrl.explorers)
Branched (class in chainerrl.links)
C
CategoricalDoubleDQN (class in chainerrl.agents)
CategoricalDQN (class in chainerrl.agents)
collect_demonstrations() (in module chainerrl.experiments)
concatenate_recurrent_states() (chainerrl.links.StatelessRecurrent method)
ConstantEpsilonGreedy (class in chainerrl.explorers)
ContinuousDeterministicDistribution (class in chainerrl.distribution)
ContinuousDeterministicPolicy (class in chainerrl.policies)
copy() (chainerrl.distribution.Distribution method)
D
DDPG (class in chainerrl.agents)
DiscreteActionValue (class in chainerrl.action_value)
Distribution (class in chainerrl.distribution)
DistributionalDuelingDQN (class in chainerrl.q_functions)
DistributionalFCStateQFunctionWithDiscreteAction (class in chainerrl.q_functions)
DistributionalSingleModelStateQFunctionWithDiscreteAction (class in chainerrl.q_functions)
DoubleDQN (class in chainerrl.agents)
DoublePAL (class in chainerrl.agents)
DPP (class in chainerrl.agents)
DQN (class in chainerrl.agents)
DuelingDQN (class in chainerrl.q_functions)
E
EmpiricalNormalization (class in chainerrl.links)
entropy (chainerrl.distribution.Distribution attribute)
EpisodicReplayBuffer (class in chainerrl.replay_buffer)
evaluate_actions() (chainerrl.action_value.ActionValue method)
Explorer (class in chainerrl.explorer)
F
FactorizedNoisyLinear (class in chainerrl.links)
FCBNDeterministicPolicy (class in chainerrl.policies)
FCBNLateActionSAQFunction (class in chainerrl.q_functions)
FCBNQuadraticStateQFunction (class in chainerrl.q_functions)
FCBNSAQFunction (class in chainerrl.q_functions)
FCDeterministicPolicy (class in chainerrl.policies)
FCGaussianPolicy (class in chainerrl.policies)
FCGaussianPolicyWithFixedCovariance (class in chainerrl.policies)
FCGaussianPolicyWithStateIndependentCovariance (class in chainerrl.policies)
FCLateActionSAQFunction (class in chainerrl.q_functions)
FCLSTMDeterministicPolicy (class in chainerrl.policies)
FCLSTMSAQFunction (class in chainerrl.q_functions)
FCLSTMStateQFunction (class in chainerrl.q_functions)
FCQuadraticStateQFunction (class in chainerrl.q_functions)
FCSAQFunction (class in chainerrl.q_functions)
FCSoftmaxPolicy (class in chainerrl.policies)
FCStateQFunctionWithDiscreteAction (class in chainerrl.q_functions)
G
GaussianDistribution (class in chainerrl.distribution)
GaussianHeadWithStateIndependentCovariance (class in chainerrl.policies)
get_recurrent_state_at() (chainerrl.links.StatelessRecurrent method)
get_state() (chainerrl.recurrent.Recurrent method)
get_statistics() (chainerrl.agent.Agent method)
Greedy (class in chainerrl.explorers)
greedy_actions (chainerrl.action_value.ActionValue attribute)
I
IQN (class in chainerrl.agents)
K
kl (chainerrl.distribution.Distribution attribute)
L
LinearDecayEpsilonGreedy (class in chainerrl.explorers)
LinearInterpolationHook (class in chainerrl.experiments)
load() (chainerrl.agent.Agent method)
load() (chainerrl.replay_buffer.ReplayBuffer method)
log_prob() (chainerrl.distribution.Distribution method)
M
mask_recurrent_state_at() (chainerrl.links.StatelessRecurrent method)
max (chainerrl.action_value.ActionValue attribute)
MellowmaxDistribution (class in chainerrl.distribution)
MellowmaxPolicy (class in chainerrl.policies)
MLP (class in chainerrl.links)
MLPBN (class in chainerrl.links)
most_probable (chainerrl.distribution.Distribution attribute)
N
n_step_forward() (chainerrl.links.StatelessRecurrent method)
NatureDQNHead (class in chainerrl.links)
NIPSDQNHead (class in chainerrl.links)
NSQ (class in chainerrl.agents)
P
PAL (class in chainerrl.agents)
params (chainerrl.action_value.ActionValue attribute)
params (chainerrl.distribution.Distribution attribute)
PCL (class in chainerrl.agents)
PGT (class in chainerrl.agents)
Policy (class in chainerrl.policy)
PPO (class in chainerrl.agents)
PrioritizedEpisodicReplayBuffer (class in chainerrl.replay_buffer)
PrioritizedReplayBuffer (class in chainerrl.replay_buffer)
prob() (chainerrl.distribution.Distribution method)
Q
QuadraticActionValue (class in chainerrl.action_value)
R
Recurrent (class in chainerrl.recurrent)
REINFORCE (class in chainerrl.agents)
ReplayBuffer (class in chainerrl.replay_buffer), [1]
reset_state() (chainerrl.recurrent.Recurrent method)
ResidualDQN (class in chainerrl.agents)
S
sample() (chainerrl.distribution.Distribution method)
sample() (chainerrl.replay_buffer.ReplayBuffer method)
sample_with_log_prob() (chainerrl.distribution.Distribution method)
SARSA (class in chainerrl.agents)
save() (chainerrl.agent.Agent method)
save() (chainerrl.replay_buffer.ReplayBuffer method)
select_action() (chainerrl.explorer.Explorer method)
Sequence (class in chainerrl.links)
set_state() (chainerrl.recurrent.Recurrent method)
SingleActionValue (class in chainerrl.action_value)
SingleModelStateActionQFunction (class in chainerrl.q_functions)
SingleModelStateQFunctionWithDiscreteAction (class in chainerrl.q_functions)
SoftActorCritic (class in chainerrl.agents)
SoftmaxDistribution (class in chainerrl.distribution)
SoftmaxPolicy (class in chainerrl.policies)
state_kept() (in module chainerrl.recurrent)
state_reset() (in module chainerrl.recurrent)
StateActionQFunction (class in chainerrl.q_function)
StatelessRecurrent (class in chainerrl.links)
StatelessRecurrentBranched (class in chainerrl.links)
StatelessRecurrentChainList (class in chainerrl.links)
StatelessRecurrentSequential (class in chainerrl.links)
StateQFunction (class in chainerrl.q_function)
StepHook (class in chainerrl.experiments)
stop_episode() (chainerrl.agent.Agent method)
stop_episode_and_train() (chainerrl.agent.Agent method)
T
TD3 (class in chainerrl.agents)
to_factorized_noisy() (in module chainerrl.links)
train_agent_async() (in module chainerrl.experiments)
train_agent_batch() (in module chainerrl.experiments)
train_agent_batch_with_evaluation() (in module chainerrl.experiments)
train_agent_with_evaluation() (in module chainerrl.experiments)
TRPO (class in chainerrl.agents)
U
update_state() (chainerrl.recurrent.Recurrent method)
Read the Docs
v: stable
Versions
latest
stable
add-docs
Downloads
pdf
html
epub
On Read the Docs
Project Home
Builds
Free document hosting provided by Read the Docs.