NNablaRL
v0.9.0
Installation
Example codes
Colab demos
NNabla RL APIs
NNablaRL
»
Index
Edit on GitHub
Index
A | B | C | D | E | F | G | H | I | K | L | M | N | O | P | Q | R | S | T | V
A
A2C (class in nnabla_rl.algorithms.a2c)
A2CConfig (class in nnabla_rl.algorithms.a2c)
action_dim (nnabla_rl.environments.environment_info.EnvironmentInfo property)
action_shape (nnabla_rl.environments.environment_info.EnvironmentInfo property)
Algorithm (class in nnabla_rl.algorithm)
AlgorithmConfig (class in nnabla_rl.algorithm)
all_probs() (nnabla_rl.models.ValueDistributionFunction method)
all_q() (nnabla_rl.models.QFunction method)
all_quantile_values() (nnabla_rl.models.StateActionQuantileFunction method)
all_quantiles() (nnabla_rl.models.QuantileDistributionFunction method)
append() (nnabla_rl.replay_buffer.ReplayBuffer method)
append() (nnabla_rl.replay_buffers.MemoryEfficientAtariBuffer method)
append() (nnabla_rl.replay_buffers.PrioritizedReplayBuffer method)
append_all() (nnabla_rl.replay_buffer.ReplayBuffer method)
append_all() (nnabla_rl.replay_buffers.MemoryEfficientAtariBuffer method)
argmax_q() (nnabla_rl.models.QFunction method)
as_q_function() (nnabla_rl.models.QuantileDistributionFunction method)
as_q_function() (nnabla_rl.models.StateActionQuantileFunction method)
as_q_function() (nnabla_rl.models.ValueDistributionFunction method)
B
BCQ (class in nnabla_rl.algorithms.bcq)
BCQConfig (class in nnabla_rl.algorithms.bcq)
BEAR (class in nnabla_rl.algorithms.bear)
BEARConfig (class in nnabla_rl.algorithms.bear)
build_model() (nnabla_rl.builders.ModelBuilder method)
build_preprocessor() (nnabla_rl.builders.PreprocessorBuilder method)
build_replay_buffer() (nnabla_rl.builders.ReplayBufferBuilder method)
build_solver() (nnabla_rl.builders.SolverBuilder method)
C
capacity (nnabla_rl.replay_buffer.ReplayBuffer property)
CategoricalDQN (class in nnabla_rl.algorithms.categorical_dqn)
CategoricalDQNConfig (class in nnabla_rl.algorithms.categorical_dqn)
choose_probable() (nnabla_rl.distributions.Distribution method)
choose_probable() (nnabla_rl.distributions.Gaussian method)
choose_probable() (nnabla_rl.distributions.Softmax method)
choose_probable() (nnabla_rl.distributions.SquashedGaussian method)
compute_eval_action() (nnabla_rl.algorithm.Algorithm method)
compute_eval_action() (nnabla_rl.algorithms.ddpg.DDPG method)
D
DDPG (class in nnabla_rl.algorithms.ddpg)
DDPGConfig (class in nnabla_rl.algorithms.ddpg)
decode() (nnabla_rl.models.VariationalAutoEncoder method)
decode_multiple() (nnabla_rl.models.VariationalAutoEncoder method)
DecorableReplayBuffer (class in nnabla_rl.replay_buffers)
deepcopy() (nnabla_rl.models.model.Model method)
DeterministicPolicy (class in nnabla_rl.models)
Distribution (class in nnabla_rl.distributions)
DQN (class in nnabla_rl.algorithms.dqn)
DQNConfig (class in nnabla_rl.algorithms.dqn)
E
encode() (nnabla_rl.models.Encoder method)
encode_and_decode() (nnabla_rl.models.VariationalAutoEncoder method)
Encoder (class in nnabla_rl.models)
entropy() (nnabla_rl.distributions.Distribution method)
entropy() (nnabla_rl.distributions.Gaussian method)
entropy() (nnabla_rl.distributions.Softmax method)
EnvironmentInfo (class in nnabla_rl.environments.environment_info)
EvaluationHook (class in nnabla_rl.hooks)
F
from_env() (nnabla_rl.environments.environment_info.EnvironmentInfo static method)
G
GAIL (class in nnabla_rl.algorithms.gail)
GAILConfig (class in nnabla_rl.algorithms.gail)
Gaussian (class in nnabla_rl.distributions)
get_parameters() (nnabla_rl.models.model.Model method)
H
Hook (class in nnabla_rl.hook)
I
ICML2015TRPO (class in nnabla_rl.algorithms.icml2015_trpo)
ICML2015TRPOConfig (class in nnabla_rl.algorithms.icml2015_trpo)
ICML2018SAC (class in nnabla_rl.algorithms.icml2018_sac)
ICML2018SACConfig (class in nnabla_rl.algorithms.icml2018_sac)
IQN (class in nnabla_rl.algorithms.iqn)
IQNConfig (class in nnabla_rl.algorithms.iqn)
is_continuous_action_env() (nnabla_rl.environments.environment_info.EnvironmentInfo method)
is_discrete_action_env() (nnabla_rl.environments.environment_info.EnvironmentInfo method)
iteration_num (nnabla_rl.algorithm.Algorithm property)
IterationNumHook (class in nnabla_rl.hooks)
IterationStateHook (class in nnabla_rl.hooks)
K
kl_divergence() (nnabla_rl.distributions.Distribution method)
kl_divergence() (nnabla_rl.distributions.Gaussian method)
kl_divergence() (nnabla_rl.distributions.Softmax method)
L
latent_distribution() (nnabla_rl.models.VariationalAutoEncoder method)
latest_iteration_state (nnabla_rl.algorithm.Algorithm property)
latest_iteration_state (nnabla_rl.algorithms.a2c.A2C property)
latest_iteration_state (nnabla_rl.algorithms.bcq.BCQ property)
latest_iteration_state (nnabla_rl.algorithms.bear.BEAR property)
latest_iteration_state (nnabla_rl.algorithms.categorical_dqn.CategoricalDQN property)
latest_iteration_state (nnabla_rl.algorithms.ddpg.DDPG property)
latest_iteration_state (nnabla_rl.algorithms.dqn.DQN property)
latest_iteration_state (nnabla_rl.algorithms.gail.GAIL property)
latest_iteration_state (nnabla_rl.algorithms.icml2015_trpo.ICML2015TRPO property)
latest_iteration_state (nnabla_rl.algorithms.icml2018_sac.ICML2018SAC property)
latest_iteration_state (nnabla_rl.algorithms.iqn.IQN property)
latest_iteration_state (nnabla_rl.algorithms.munchausen_dqn.MunchausenDQN property)
latest_iteration_state (nnabla_rl.algorithms.munchausen_iqn.MunchausenIQN property)
latest_iteration_state (nnabla_rl.algorithms.ppo.PPO property)
latest_iteration_state (nnabla_rl.algorithms.qrdqn.QRDQN property)
latest_iteration_state (nnabla_rl.algorithms.reinforce.REINFORCE property)
latest_iteration_state (nnabla_rl.algorithms.sac.SAC property)
latest_iteration_state (nnabla_rl.algorithms.td3.TD3 property)
latest_iteration_state (nnabla_rl.algorithms.trpo.TRPO property)
load_parameters() (nnabla_rl.models.model.Model method)
log_prob() (nnabla_rl.distributions.Distribution method)
log_prob() (nnabla_rl.distributions.Gaussian method)
log_prob() (nnabla_rl.distributions.Softmax method)
log_prob() (nnabla_rl.distributions.SquashedGaussian method)
M
max_iterations (nnabla_rl.algorithm.Algorithm property)
max_q() (nnabla_rl.models.QFunction method)
max_q_probs() (nnabla_rl.models.ValueDistributionFunction method)
max_q_quantile_values() (nnabla_rl.models.StateActionQuantileFunction method)
max_q_quantiles() (nnabla_rl.models.QuantileDistributionFunction method)
mean() (nnabla_rl.distributions.Distribution method)
mean() (nnabla_rl.distributions.Gaussian method)
mean() (nnabla_rl.distributions.Softmax method)
MemoryEfficientAtariBuffer (class in nnabla_rl.replay_buffers)
Model (class in nnabla_rl.models.model)
ModelBuilder (class in nnabla_rl.builders)
MunchausenDQN (class in nnabla_rl.algorithms.munchausen_dqn)
MunchausenDQNConfig (class in nnabla_rl.algorithms.munchausen_dqn)
MunchausenIQN (class in nnabla_rl.algorithms.munchausen_iqn)
MunchausenIQNConfig (class in nnabla_rl.algorithms.munchausen_iqn)
N
ndim (nnabla_rl.distributions.Distribution property)
ndim (nnabla_rl.distributions.Gaussian property)
ndim (nnabla_rl.distributions.Softmax property)
ndim (nnabla_rl.distributions.SquashedGaussian property)
O
on_hook_called() (nnabla_rl.hook.Hook method)
on_hook_called() (nnabla_rl.hooks.EvaluationHook method)
on_hook_called() (nnabla_rl.hooks.IterationNumHook method)
on_hook_called() (nnabla_rl.hooks.IterationStateHook method)
on_hook_called() (nnabla_rl.hooks.SaveSnapshotHook method)
on_hook_called() (nnabla_rl.hooks.TimeMeasuringHook method)
P
Perturbator (class in nnabla_rl.models)
pi() (nnabla_rl.models.DeterministicPolicy method)
pi() (nnabla_rl.models.StochasticPolicy method)
Policy (class in nnabla_rl.models)
PPO (class in nnabla_rl.algorithms.ppo)
PPOConfig (class in nnabla_rl.algorithms.ppo)
PreprocessorBuilder (class in nnabla_rl.builders)
PrioritizedReplayBuffer (class in nnabla_rl.replay_buffers)
probs() (nnabla_rl.models.ValueDistributionFunction method)
Q
q() (nnabla_rl.models.QFunction method)
QFunction (class in nnabla_rl.models)
QRDQN (class in nnabla_rl.algorithms.qrdqn)
QRDQNConfig (class in nnabla_rl.algorithms.qrdqn)
quantile_values() (nnabla_rl.models.StateActionQuantileFunction method)
QuantileDistributionFunction (class in nnabla_rl.models)
quantiles() (nnabla_rl.models.QuantileDistributionFunction method)
R
r() (nnabla_rl.models.reward_function.RewardFunction method)
REINFORCE (class in nnabla_rl.algorithms.reinforce)
REINFORCEConfig (class in nnabla_rl.algorithms.reinforce)
ReplayBuffer (class in nnabla_rl.replay_buffer)
ReplayBufferBuilder (class in nnabla_rl.builders)
RewardFunction (class in nnabla_rl.models.reward_function)
S
SAC (class in nnabla_rl.algorithms.sac)
SACConfig (class in nnabla_rl.algorithms.sac)
sample() (nnabla_rl.distributions.Distribution method)
sample() (nnabla_rl.distributions.Gaussian method)
sample() (nnabla_rl.distributions.Softmax method)
sample() (nnabla_rl.distributions.SquashedGaussian method)
sample() (nnabla_rl.replay_buffer.ReplayBuffer method)
sample() (nnabla_rl.replay_buffers.PrioritizedReplayBuffer method)
sample_and_compute_log_prob() (nnabla_rl.distributions.Distribution method)
sample_and_compute_log_prob() (nnabla_rl.distributions.Gaussian method)
sample_and_compute_log_prob() (nnabla_rl.distributions.Softmax method)
sample_and_compute_log_prob() (nnabla_rl.distributions.SquashedGaussian method)
sample_indices() (nnabla_rl.replay_buffer.ReplayBuffer method)
sample_indices() (nnabla_rl.replay_buffers.PrioritizedReplayBuffer method)
sample_multiple() (nnabla_rl.distributions.Distribution method)
sample_multiple() (nnabla_rl.distributions.Gaussian method)
sample_multiple() (nnabla_rl.distributions.Softmax method)
sample_multiple() (nnabla_rl.distributions.SquashedGaussian method)
sample_multiple_and_compute_log_prob() (nnabla_rl.distributions.SquashedGaussian method)
sample_tau() (nnabla_rl.models.StateActionQuantileFunction method)
save_parameters() (nnabla_rl.models.model.Model method)
SaveSnapshotHook (class in nnabla_rl.hooks)
scope_name (nnabla_rl.models.model.Model property)
set_hooks() (nnabla_rl.algorithm.Algorithm method)
Softmax (class in nnabla_rl.distributions)
SolverBuilder (class in nnabla_rl.builders)
SquashedGaussian (class in nnabla_rl.distributions)
state_dim (nnabla_rl.environments.environment_info.EnvironmentInfo property)
state_shape (nnabla_rl.environments.environment_info.EnvironmentInfo property)
StateActionQuantileFunction (class in nnabla_rl.models)
StochasticPolicy (class in nnabla_rl.models)
T
TD3 (class in nnabla_rl.algorithms.td3)
TD3Config (class in nnabla_rl.algorithms.td3)
TimeMeasuringHook (class in nnabla_rl.hooks)
train() (nnabla_rl.algorithm.Algorithm method)
train_offline() (nnabla_rl.algorithm.Algorithm method)
train_online() (nnabla_rl.algorithm.Algorithm method)
TRPO (class in nnabla_rl.algorithms.trpo)
TRPOConfig (class in nnabla_rl.algorithms.trpo)
V
v() (nnabla_rl.models.VFunction method)
ValueDistributionFunction (class in nnabla_rl.models)
VariationalAutoEncoder (class in nnabla_rl.models)
VFunction (class in nnabla_rl.models)
Read the Docs
v: v0.9.0
Versions
latest
stable
v0.9.0
Downloads
html
On Read the Docs
Project Home
Builds