d3rlpy
v0.40
Tutorials
Getting Started
Jupyter Notebooks
References
API Reference
Installation
Other
License
d3rlpy
Docs
»
Index
Edit on GitHub
Index
_ | A | B | C | D | E | F | G | H | I | L | M | N | O | P | Q | R | S | T | U | V
_
__getitem__() (d3rlpy.dataset.Episode method)
(d3rlpy.dataset.MDPDataset method)
__iter__() (d3rlpy.dataset.Episode method)
(d3rlpy.dataset.MDPDataset method)
__len__() (d3rlpy.dataset.Episode method)
(d3rlpy.dataset.MDPDataset method)
(d3rlpy.online.buffers.ReplayBuffer method)
A
action (d3rlpy.dataset.Transition attribute)
action_flexibility (d3rlpy.algos.BCQ attribute)
(d3rlpy.algos.DiscreteBCQ attribute)
action_size (d3rlpy.online.buffers.ReplayBuffer attribute)
actions (d3rlpy.dataset.Episode attribute)
(d3rlpy.dataset.MDPDataset attribute)
(d3rlpy.dataset.TransitionMiniBatch attribute)
activation (d3rlpy.encoders.PixelEncoderFactory attribute)
(d3rlpy.encoders.VectorEncoderFactory attribute)
actor_encoder_factory (d3rlpy.algos.AWAC attribute)
(d3rlpy.algos.AWR attribute)
(d3rlpy.algos.BCQ attribute)
(d3rlpy.algos.BEAR attribute)
(d3rlpy.algos.CQL attribute)
(d3rlpy.algos.DDPG attribute)
(d3rlpy.algos.DiscreteAWR attribute)
(d3rlpy.algos.DiscreteSAC attribute)
(d3rlpy.algos.SAC attribute)
(d3rlpy.algos.TD3 attribute)
actor_learning_rate (d3rlpy.algos.AWAC attribute)
(d3rlpy.algos.AWR attribute)
(d3rlpy.algos.BCQ attribute)
(d3rlpy.algos.BEAR attribute)
(d3rlpy.algos.CQL attribute)
(d3rlpy.algos.DDPG attribute)
(d3rlpy.algos.DiscreteAWR attribute)
(d3rlpy.algos.DiscreteSAC attribute)
(d3rlpy.algos.SAC attribute)
(d3rlpy.algos.TD3 attribute)
actor_optim_factory (d3rlpy.algos.AWAC attribute)
(d3rlpy.algos.AWR attribute)
(d3rlpy.algos.BCQ attribute)
(d3rlpy.algos.BEAR attribute)
(d3rlpy.algos.CQL attribute)
(d3rlpy.algos.DDPG attribute)
(d3rlpy.algos.DiscreteAWR attribute)
(d3rlpy.algos.DiscreteSAC attribute)
(d3rlpy.algos.SAC attribute)
(d3rlpy.algos.TD3 attribute)
AdamFactory (class in d3rlpy.optimizers)
alpha_learning_rate (d3rlpy.algos.BEAR attribute)
(d3rlpy.algos.CQL attribute)
alpha_optim_factory (d3rlpy.algos.BEAR attribute)
(d3rlpy.algos.CQL attribute)
alpha_threshold (d3rlpy.algos.BEAR attribute)
(d3rlpy.algos.CQL attribute)
append() (d3rlpy.dataset.MDPDataset method)
(d3rlpy.online.buffers.ReplayBuffer method)
append_episode() (d3rlpy.online.buffers.ReplayBuffer method)
augmentation (d3rlpy.algos.AWAC attribute)
(d3rlpy.algos.AWR attribute)
(d3rlpy.algos.BC attribute)
(d3rlpy.algos.BCQ attribute)
(d3rlpy.algos.BEAR attribute)
(d3rlpy.algos.CQL attribute)
(d3rlpy.algos.DDPG attribute)
(d3rlpy.algos.DQN attribute)
(d3rlpy.algos.DiscreteAWR attribute)
(d3rlpy.algos.DiscreteBC attribute)
(d3rlpy.algos.DiscreteBCQ attribute)
(d3rlpy.algos.DiscreteCQL attribute)
(d3rlpy.algos.DiscreteSAC attribute)
(d3rlpy.algos.DoubleDQN attribute)
(d3rlpy.algos.SAC attribute)
(d3rlpy.algos.TD3 attribute)
average_value_estimation_scorer() (in module d3rlpy.metrics.scorer)
AWAC (class in d3rlpy.algos)
AWR (class in d3rlpy.algos)
B
batch_size (d3rlpy.algos.AWAC attribute)
(d3rlpy.algos.AWR attribute)
(d3rlpy.algos.BC attribute)
(d3rlpy.algos.BCQ attribute)
(d3rlpy.algos.BEAR attribute)
(d3rlpy.algos.CQL attribute)
(d3rlpy.algos.DDPG attribute)
(d3rlpy.algos.DQN attribute)
(d3rlpy.algos.DiscreteAWR attribute)
(d3rlpy.algos.DiscreteBC attribute)
(d3rlpy.algos.DiscreteBCQ attribute)
(d3rlpy.algos.DiscreteCQL attribute)
(d3rlpy.algos.DiscreteSAC attribute)
(d3rlpy.algos.DoubleDQN attribute)
(d3rlpy.algos.SAC attribute)
(d3rlpy.algos.TD3 attribute)
(d3rlpy.dynamics.mopo.MOPO attribute)
batch_size_per_update (d3rlpy.algos.AWR attribute)
(d3rlpy.algos.DiscreteAWR attribute)
BC (class in d3rlpy.algos)
BCQ (class in d3rlpy.algos)
BEAR (class in d3rlpy.algos)
beta (d3rlpy.algos.AWR attribute)
(d3rlpy.algos.BCQ attribute)
(d3rlpy.algos.DiscreteAWR attribute)
(d3rlpy.algos.DiscreteBC attribute)
(d3rlpy.algos.DiscreteBCQ attribute)
bootstrap (d3rlpy.algos.AWAC attribute)
(d3rlpy.algos.BCQ attribute)
(d3rlpy.algos.BEAR attribute)
(d3rlpy.algos.CQL attribute)
(d3rlpy.algos.DDPG attribute)
(d3rlpy.algos.DQN attribute)
(d3rlpy.algos.DiscreteBCQ attribute)
(d3rlpy.algos.DiscreteCQL attribute)
(d3rlpy.algos.DiscreteSAC attribute)
(d3rlpy.algos.DoubleDQN attribute)
(d3rlpy.algos.SAC attribute)
(d3rlpy.algos.TD3 attribute)
brightness (d3rlpy.augmentation.image.ColorJitter attribute)
build_episodes() (d3rlpy.dataset.MDPDataset method)
build_transitions() (d3rlpy.dataset.Episode method)
C
clear_links() (d3rlpy.dataset.Transition method)
clip_reward() (d3rlpy.dataset.MDPDataset method)
ColorJitter (class in d3rlpy.augmentation.image)
compare_continuous_action_diff() (in module d3rlpy.metrics.comparer)
compare_discrete_action_match() (in module d3rlpy.metrics.comparer)
compute_epsilon() (d3rlpy.online.explorers.LinearDecayEpsilonGreedy method)
compute_return() (d3rlpy.dataset.Episode method)
compute_stats() (d3rlpy.dataset.MDPDataset method)
continuous_action_diff_scorer() (in module d3rlpy.metrics.scorer)
contrast (d3rlpy.augmentation.image.ColorJitter attribute)
CQL (class in d3rlpy.algos)
create() (d3rlpy.encoders.DefaultEncoderFactory method)
(d3rlpy.encoders.PixelEncoderFactory method)
(d3rlpy.encoders.VectorEncoderFactory method)
(d3rlpy.optimizers.AdamFactory method)
(d3rlpy.optimizers.OptimizerFactory method)
(d3rlpy.optimizers.RMSpropFactory method)
(d3rlpy.optimizers.SGDFactory method)
create_impl() (d3rlpy.algos.AWAC method)
(d3rlpy.algos.AWR method)
(d3rlpy.algos.BC method)
(d3rlpy.algos.BCQ method)
(d3rlpy.algos.BEAR method)
(d3rlpy.algos.CQL method)
(d3rlpy.algos.DDPG method)
(d3rlpy.algos.DQN method)
(d3rlpy.algos.DiscreteAWR method)
(d3rlpy.algos.DiscreteBC method)
(d3rlpy.algos.DiscreteBCQ method)
(d3rlpy.algos.DiscreteCQL method)
(d3rlpy.algos.DiscreteSAC method)
(d3rlpy.algos.DoubleDQN method)
(d3rlpy.algos.SAC method)
(d3rlpy.algos.TD3 method)
(d3rlpy.dynamics.mopo.MOPO method)
critic_encoder_factory (d3rlpy.algos.AWAC attribute)
(d3rlpy.algos.AWR attribute)
(d3rlpy.algos.BCQ attribute)
(d3rlpy.algos.BEAR attribute)
(d3rlpy.algos.CQL attribute)
(d3rlpy.algos.DDPG attribute)
(d3rlpy.algos.DiscreteAWR attribute)
(d3rlpy.algos.DiscreteSAC attribute)
(d3rlpy.algos.SAC attribute)
(d3rlpy.algos.TD3 attribute)
critic_learning_rate (d3rlpy.algos.AWAC attribute)
(d3rlpy.algos.AWR attribute)
(d3rlpy.algos.BCQ attribute)
(d3rlpy.algos.BEAR attribute)
(d3rlpy.algos.CQL attribute)
(d3rlpy.algos.DDPG attribute)
(d3rlpy.algos.DiscreteAWR attribute)
(d3rlpy.algos.DiscreteSAC attribute)
(d3rlpy.algos.SAC attribute)
(d3rlpy.algos.TD3 attribute)
critic_optim_factory (d3rlpy.algos.AWAC attribute)
(d3rlpy.algos.AWR attribute)
(d3rlpy.algos.BCQ attribute)
(d3rlpy.algos.BEAR attribute)
(d3rlpy.algos.CQL attribute)
(d3rlpy.algos.DDPG attribute)
(d3rlpy.algos.DiscreteAWR attribute)
(d3rlpy.algos.DiscreteSAC attribute)
(d3rlpy.algos.SAC attribute)
(d3rlpy.algos.TD3 attribute)
Cutout (class in d3rlpy.augmentation.image)
D
d3rlpy (module)
d3rlpy.algos (module)
d3rlpy.augmentation (module)
d3rlpy.dataset (module)
d3rlpy.datasets (module)
d3rlpy.dynamics (module)
d3rlpy.encoders (module)
d3rlpy.metrics (module)
d3rlpy.models.torch.q_functions (module)
d3rlpy.online (module)
d3rlpy.optimizers (module)
d3rlpy.preprocessing (module)
DDPG (class in d3rlpy.algos)
DefaultEncoderFactory (class in d3rlpy.encoders)
degree (d3rlpy.augmentation.image.RandomRotation attribute)
discounted_sum_of_advantage_scorer() (in module d3rlpy.metrics.scorer)
discrete_action (d3rlpy.dynamics.mopo.MOPO attribute)
discrete_action_match_scorer() (in module d3rlpy.metrics.scorer)
DiscreteAWR (class in d3rlpy.algos)
DiscreteBC (class in d3rlpy.algos)
DiscreteBCQ (class in d3rlpy.algos)
DiscreteCQL (class in d3rlpy.algos)
DiscreteSAC (class in d3rlpy.algos)
DoubleDQN (class in d3rlpy.algos)
DQN (class in d3rlpy.algos)
dump() (d3rlpy.dataset.MDPDataset method)
duration (d3rlpy.online.explorers.LinearDecayEpsilonGreedy attribute)
dynamics (d3rlpy.algos.AWAC attribute)
(d3rlpy.algos.AWR attribute)
(d3rlpy.algos.BC attribute)
(d3rlpy.algos.BCQ attribute)
(d3rlpy.algos.BEAR attribute)
(d3rlpy.algos.CQL attribute)
(d3rlpy.algos.DDPG attribute)
(d3rlpy.algos.DQN attribute)
(d3rlpy.algos.DiscreteAWR attribute)
(d3rlpy.algos.DiscreteBC attribute)
(d3rlpy.algos.DiscreteBCQ attribute)
(d3rlpy.algos.DiscreteCQL attribute)
(d3rlpy.algos.DiscreteSAC attribute)
(d3rlpy.algos.DoubleDQN attribute)
(d3rlpy.algos.SAC attribute)
(d3rlpy.algos.TD3 attribute)
dynamics_observation_prediction_error_scorer() (in module d3rlpy.metrics.scorer)
dynamics_prediction_variance_scorer() (in module d3rlpy.metrics.scorer)
dynamics_reward_prediction_error_scorer() (in module d3rlpy.metrics.scorer)
E
encoder_factory (d3rlpy.algos.BC attribute)
(d3rlpy.algos.DQN attribute)
(d3rlpy.algos.DiscreteBC attribute)
(d3rlpy.algos.DiscreteBCQ attribute)
(d3rlpy.algos.DiscreteCQL attribute)
(d3rlpy.algos.DoubleDQN attribute)
(d3rlpy.dynamics.mopo.MOPO attribute)
end_epsilon (d3rlpy.online.explorers.LinearDecayEpsilonGreedy attribute)
Episode (class in d3rlpy.dataset)
episodes (d3rlpy.dataset.MDPDataset attribute)
eval_results_ (d3rlpy.algos.AWR attribute)
(d3rlpy.algos.BC attribute)
(d3rlpy.algos.BCQ attribute)
(d3rlpy.algos.BEAR attribute)
(d3rlpy.algos.CQL attribute)
(d3rlpy.algos.DDPG attribute)
(d3rlpy.algos.DQN attribute)
(d3rlpy.algos.DiscreteAWR attribute)
(d3rlpy.algos.DiscreteBC attribute)
(d3rlpy.algos.DiscreteBCQ attribute)
(d3rlpy.algos.DiscreteCQL attribute)
(d3rlpy.algos.DiscreteSAC attribute)
(d3rlpy.algos.SAC attribute)
(d3rlpy.algos.TD3 attribute)
(d3rlpy.dynamics.mopo.MOPO attribute)
evaluate_on_environment() (in module d3rlpy.metrics.scorer)
extend() (d3rlpy.dataset.MDPDataset method)
F
feature_size (d3rlpy.encoders.PixelEncoderFactory attribute)
filters (d3rlpy.encoders.PixelEncoderFactory attribute)
fit() (d3rlpy.algos.AWAC method)
(d3rlpy.algos.AWR method)
(d3rlpy.algos.BC method)
(d3rlpy.algos.BCQ method)
(d3rlpy.algos.BEAR method)
(d3rlpy.algos.CQL method)
(d3rlpy.algos.DDPG method)
(d3rlpy.algos.DQN method)
(d3rlpy.algos.DiscreteAWR method)
(d3rlpy.algos.DiscreteBC method)
(d3rlpy.algos.DiscreteBCQ method)
(d3rlpy.algos.DiscreteCQL method)
(d3rlpy.algos.DiscreteSAC method)
(d3rlpy.algos.DoubleDQN method)
(d3rlpy.algos.SAC method)
(d3rlpy.algos.TD3 method)
(d3rlpy.dynamics.mopo.MOPO method)
(d3rlpy.preprocessing.MinMaxScaler method)
(d3rlpy.preprocessing.PixelScaler method)
(d3rlpy.preprocessing.StandardScaler method)
fit_online() (d3rlpy.algos.AWAC method)
(d3rlpy.algos.AWR method)
(d3rlpy.algos.BC method)
(d3rlpy.algos.BCQ method)
(d3rlpy.algos.BEAR method)
(d3rlpy.algos.CQL method)
(d3rlpy.algos.DDPG method)
(d3rlpy.algos.DQN method)
(d3rlpy.algos.DiscreteAWR method)
(d3rlpy.algos.DiscreteBC method)
(d3rlpy.algos.DiscreteBCQ method)
(d3rlpy.algos.DiscreteCQL method)
(d3rlpy.algos.DiscreteSAC method)
(d3rlpy.algos.DoubleDQN method)
(d3rlpy.algos.SAC method)
(d3rlpy.algos.TD3 method)
from_json() (d3rlpy.algos.AWAC class method)
(d3rlpy.algos.AWR class method)
(d3rlpy.algos.BC class method)
(d3rlpy.algos.BCQ class method)
(d3rlpy.algos.BEAR class method)
(d3rlpy.algos.CQL class method)
(d3rlpy.algos.DDPG class method)
(d3rlpy.algos.DQN class method)
(d3rlpy.algos.DiscreteAWR class method)
(d3rlpy.algos.DiscreteBC class method)
(d3rlpy.algos.DiscreteBCQ class method)
(d3rlpy.algos.DiscreteCQL class method)
(d3rlpy.algos.DiscreteSAC class method)
(d3rlpy.algos.DoubleDQN class method)
(d3rlpy.algos.SAC class method)
(d3rlpy.algos.TD3 class method)
(d3rlpy.dynamics.mopo.MOPO class method)
G
gamma (d3rlpy.algos.AWAC attribute)
(d3rlpy.algos.AWR attribute)
(d3rlpy.algos.BCQ attribute)
(d3rlpy.algos.BEAR attribute)
(d3rlpy.algos.CQL attribute)
(d3rlpy.algos.DDPG attribute)
(d3rlpy.algos.DQN attribute)
(d3rlpy.algos.DiscreteAWR attribute)
(d3rlpy.algos.DiscreteBCQ attribute)
(d3rlpy.algos.DiscreteCQL attribute)
(d3rlpy.algos.DiscreteSAC attribute)
(d3rlpy.algos.DoubleDQN attribute)
(d3rlpy.algos.SAC attribute)
(d3rlpy.algos.TD3 attribute)
generate() (d3rlpy.dynamics.mopo.MOPO method)
get_action_size() (d3rlpy.dataset.Episode method)
(d3rlpy.dataset.MDPDataset method)
(d3rlpy.dataset.Transition method)
get_atari() (in module d3rlpy.datasets)
get_cartpole() (in module d3rlpy.datasets)
get_observation_shape() (d3rlpy.dataset.Episode method)
(d3rlpy.dataset.MDPDataset method)
(d3rlpy.dataset.Transition method)
get_params() (d3rlpy.algos.AWAC method)
(d3rlpy.algos.AWR method)
(d3rlpy.algos.BC method)
(d3rlpy.algos.BCQ method)
(d3rlpy.algos.BEAR method)
(d3rlpy.algos.CQL method)
(d3rlpy.algos.DDPG method)
(d3rlpy.algos.DQN method)
(d3rlpy.algos.DiscreteAWR method)
(d3rlpy.algos.DiscreteBC method)
(d3rlpy.algos.DiscreteBCQ method)
(d3rlpy.algos.DiscreteCQL method)
(d3rlpy.algos.DiscreteSAC method)
(d3rlpy.algos.DoubleDQN method)
(d3rlpy.algos.SAC method)
(d3rlpy.algos.TD3 method)
(d3rlpy.augmentation.image.ColorJitter method)
(d3rlpy.augmentation.image.Cutout method)
(d3rlpy.augmentation.image.HorizontalFlip method)
(d3rlpy.augmentation.image.Intensity method)
(d3rlpy.augmentation.image.RandomRotation method)
(d3rlpy.augmentation.image.RandomShift method)
(d3rlpy.augmentation.image.VerticalFlip method)
(d3rlpy.augmentation.vector.MultipleAmplitudeScaling method)
(d3rlpy.augmentation.vector.SingleAmplitudeScaling method)
(d3rlpy.dynamics.mopo.MOPO method)
(d3rlpy.encoders.DefaultEncoderFactory method)
(d3rlpy.encoders.PixelEncoderFactory method)
(d3rlpy.encoders.VectorEncoderFactory method)
(d3rlpy.optimizers.AdamFactory method)
(d3rlpy.optimizers.OptimizerFactory method)
(d3rlpy.optimizers.RMSpropFactory method)
(d3rlpy.optimizers.SGDFactory method)
(d3rlpy.preprocessing.MinMaxScaler method)
(d3rlpy.preprocessing.PixelScaler method)
(d3rlpy.preprocessing.StandardScaler method)
get_pendulum() (in module d3rlpy.datasets)
get_pybullet() (in module d3rlpy.datasets)
get_type() (d3rlpy.augmentation.image.ColorJitter method)
(d3rlpy.augmentation.image.Cutout method)
(d3rlpy.augmentation.image.HorizontalFlip method)
(d3rlpy.augmentation.image.Intensity method)
(d3rlpy.augmentation.image.RandomRotation method)
(d3rlpy.augmentation.image.RandomShift method)
(d3rlpy.augmentation.image.VerticalFlip method)
(d3rlpy.augmentation.vector.MultipleAmplitudeScaling method)
(d3rlpy.augmentation.vector.SingleAmplitudeScaling method)
(d3rlpy.encoders.DefaultEncoderFactory method)
(d3rlpy.encoders.PixelEncoderFactory method)
(d3rlpy.encoders.VectorEncoderFactory method)
(d3rlpy.preprocessing.MinMaxScaler method)
(d3rlpy.preprocessing.PixelScaler method)
(d3rlpy.preprocessing.StandardScaler method)
H
hidden_units (d3rlpy.encoders.VectorEncoderFactory attribute)
horizon (d3rlpy.dynamics.mopo.MOPO attribute)
HorizontalFlip (class in d3rlpy.augmentation.image)
hue (d3rlpy.augmentation.image.ColorJitter attribute)
I
imitator_encoder_factory (d3rlpy.algos.BCQ attribute)
(d3rlpy.algos.BEAR attribute)
imitator_learning_rate (d3rlpy.algos.BCQ attribute)
(d3rlpy.algos.BEAR attribute)
imitator_optim_factory (d3rlpy.algos.BCQ attribute)
(d3rlpy.algos.BEAR attribute)
impl (d3rlpy.algos.AWAC attribute)
(d3rlpy.algos.AWR attribute)
(d3rlpy.algos.BC attribute)
(d3rlpy.algos.BCQ attribute)
(d3rlpy.algos.BEAR attribute)
(d3rlpy.algos.CQL attribute)
(d3rlpy.algos.DDPG attribute)
(d3rlpy.algos.DQN attribute)
(d3rlpy.algos.DiscreteAWR attribute)
(d3rlpy.algos.DiscreteBC attribute)
(d3rlpy.algos.DiscreteBCQ attribute)
(d3rlpy.algos.DiscreteCQL attribute)
(d3rlpy.algos.DiscreteSAC attribute)
(d3rlpy.algos.DoubleDQN attribute)
(d3rlpy.algos.SAC attribute)
(d3rlpy.algos.TD3 attribute)
(d3rlpy.dynamics.mopo.MOPO attribute)
initial_alpha (d3rlpy.algos.BEAR attribute)
(d3rlpy.algos.CQL attribute)
initial_state_value_estimation_scorer() (in module d3rlpy.metrics.scorer)
initial_temperature (d3rlpy.algos.BEAR attribute)
(d3rlpy.algos.CQL attribute)
(d3rlpy.algos.DiscreteSAC attribute)
(d3rlpy.algos.SAC attribute)
Intensity (class in d3rlpy.augmentation.image)
is_action_discrete() (d3rlpy.dataset.MDPDataset method)
L
lam (d3rlpy.algos.AWAC attribute)
(d3rlpy.algos.AWR attribute)
(d3rlpy.algos.BCQ attribute)
(d3rlpy.algos.BEAR attribute)
(d3rlpy.algos.DiscreteAWR attribute)
(d3rlpy.dynamics.mopo.MOPO attribute)
latent_size (d3rlpy.algos.BCQ attribute)
learning_rate (d3rlpy.algos.BC attribute)
(d3rlpy.algos.DQN attribute)
(d3rlpy.algos.DiscreteBC attribute)
(d3rlpy.algos.DiscreteBCQ attribute)
(d3rlpy.algos.DiscreteCQL attribute)
(d3rlpy.algos.DoubleDQN attribute)
(d3rlpy.dynamics.mopo.MOPO attribute)
LinearDecayEpsilonGreedy (class in d3rlpy.online.explorers)
load() (d3rlpy.dataset.MDPDataset class method)
load_model() (d3rlpy.algos.AWAC method)
(d3rlpy.algos.AWR method)
(d3rlpy.algos.BC method)
(d3rlpy.algos.BCQ method)
(d3rlpy.algos.BEAR method)
(d3rlpy.algos.CQL method)
(d3rlpy.algos.DDPG method)
(d3rlpy.algos.DQN method)
(d3rlpy.algos.DiscreteAWR method)
(d3rlpy.algos.DiscreteBC method)
(d3rlpy.algos.DiscreteBCQ method)
(d3rlpy.algos.DiscreteCQL method)
(d3rlpy.algos.DiscreteSAC method)
(d3rlpy.algos.DoubleDQN method)
(d3rlpy.algos.SAC method)
(d3rlpy.algos.TD3 method)
(d3rlpy.dynamics.mopo.MOPO method)
M
max_weight (d3rlpy.algos.AWAC attribute)
(d3rlpy.algos.AWR attribute)
(d3rlpy.algos.DiscreteAWR attribute)
maximum (d3rlpy.augmentation.vector.MultipleAmplitudeScaling attribute)
(d3rlpy.augmentation.vector.SingleAmplitudeScaling attribute)
(d3rlpy.preprocessing.MinMaxScaler attribute)
MDPDataset (class in d3rlpy.dataset)
mean (d3rlpy.online.explorers.NormalNoise attribute)
(d3rlpy.preprocessing.StandardScaler attribute)
minimum (d3rlpy.augmentation.vector.MultipleAmplitudeScaling attribute)
(d3rlpy.augmentation.vector.SingleAmplitudeScaling attribute)
(d3rlpy.preprocessing.MinMaxScaler attribute)
MinMaxScaler (class in d3rlpy.preprocessing)
mmd_sigma (d3rlpy.algos.BEAR attribute)
MOPO (class in d3rlpy.dynamics.mopo)
MultipleAmplitudeScaling (class in d3rlpy.augmentation.vector)
N
n_action_samples (d3rlpy.algos.AWAC attribute)
(d3rlpy.algos.BCQ attribute)
(d3rlpy.algos.BEAR attribute)
(d3rlpy.algos.CQL attribute)
n_actor_updates (d3rlpy.algos.AWR attribute)
(d3rlpy.algos.DiscreteAWR attribute)
n_augmentations (d3rlpy.algos.AWAC attribute)
(d3rlpy.algos.AWR attribute)
(d3rlpy.algos.BC attribute)
(d3rlpy.algos.BCQ attribute)
(d3rlpy.algos.BEAR attribute)
(d3rlpy.algos.CQL attribute)
(d3rlpy.algos.DDPG attribute)
(d3rlpy.algos.DQN attribute)
(d3rlpy.algos.DiscreteAWR attribute)
(d3rlpy.algos.DiscreteBC attribute)
(d3rlpy.algos.DiscreteBCQ attribute)
(d3rlpy.algos.DiscreteCQL attribute)
(d3rlpy.algos.DiscreteSAC attribute)
(d3rlpy.algos.DoubleDQN attribute)
(d3rlpy.algos.SAC attribute)
(d3rlpy.algos.TD3 attribute)
n_critic_updates (d3rlpy.algos.AWR attribute)
(d3rlpy.algos.DiscreteAWR attribute)
n_critics (d3rlpy.algos.AWAC attribute)
(d3rlpy.algos.BCQ attribute)
(d3rlpy.algos.BEAR attribute)
(d3rlpy.algos.CQL attribute)
(d3rlpy.algos.DDPG attribute)
(d3rlpy.algos.DQN attribute)
(d3rlpy.algos.DiscreteBCQ attribute)
(d3rlpy.algos.DiscreteCQL attribute)
(d3rlpy.algos.DiscreteSAC attribute)
(d3rlpy.algos.DoubleDQN attribute)
(d3rlpy.algos.SAC attribute)
(d3rlpy.algos.TD3 attribute)
n_ensembles (d3rlpy.dynamics.mopo.MOPO attribute)
n_frames (d3rlpy.algos.AWAC attribute)
(d3rlpy.algos.AWR attribute)
(d3rlpy.algos.BC attribute)
(d3rlpy.algos.BCQ attribute)
(d3rlpy.algos.BEAR attribute)
(d3rlpy.algos.CQL attribute)
(d3rlpy.algos.DDPG attribute)
(d3rlpy.algos.DQN attribute)
(d3rlpy.algos.DiscreteAWR attribute)
(d3rlpy.algos.DiscreteBC attribute)
(d3rlpy.algos.DiscreteBCQ attribute)
(d3rlpy.algos.DiscreteCQL attribute)
(d3rlpy.algos.DiscreteSAC attribute)
(d3rlpy.algos.DoubleDQN attribute)
(d3rlpy.algos.SAC attribute)
(d3rlpy.algos.TD3 attribute)
(d3rlpy.dynamics.mopo.MOPO attribute)
n_transitions (d3rlpy.dynamics.mopo.MOPO attribute)
next_action (d3rlpy.dataset.Transition attribute)
next_actions (d3rlpy.dataset.TransitionMiniBatch attribute)
next_observation (d3rlpy.dataset.Transition attribute)
next_observations (d3rlpy.dataset.TransitionMiniBatch attribute)
next_reward (d3rlpy.dataset.Transition attribute)
next_rewards (d3rlpy.dataset.TransitionMiniBatch attribute)
next_transition (d3rlpy.dataset.Transition attribute)
NormalNoise (class in d3rlpy.online.explorers)
O
observation (d3rlpy.dataset.Transition attribute)
observation_shape (d3rlpy.online.buffers.ReplayBuffer attribute)
observations (d3rlpy.dataset.Episode attribute)
(d3rlpy.dataset.MDPDataset attribute)
(d3rlpy.dataset.TransitionMiniBatch attribute)
optim_cls (d3rlpy.optimizers.AdamFactory attribute)
(d3rlpy.optimizers.OptimizerFactory attribute)
(d3rlpy.optimizers.RMSpropFactory attribute)
(d3rlpy.optimizers.SGDFactory attribute)
optim_factory (d3rlpy.algos.BC attribute)
(d3rlpy.algos.DQN attribute)
(d3rlpy.algos.DiscreteBC attribute)
(d3rlpy.algos.DiscreteBCQ attribute)
(d3rlpy.algos.DiscreteCQL attribute)
(d3rlpy.algos.DoubleDQN attribute)
(d3rlpy.dynamics.mopo.MOPO attribute)
optim_kwargs (d3rlpy.optimizers.AdamFactory attribute)
(d3rlpy.optimizers.OptimizerFactory attribute)
(d3rlpy.optimizers.RMSpropFactory attribute)
(d3rlpy.optimizers.SGDFactory attribute)
OptimizerFactory (class in d3rlpy.optimizers)
P
PixelEncoderFactory (class in d3rlpy.encoders)
PixelScaler (class in d3rlpy.preprocessing)
predict() (d3rlpy.algos.AWAC method)
(d3rlpy.algos.AWR method)
(d3rlpy.algos.BC method)
(d3rlpy.algos.BCQ method)
(d3rlpy.algos.BEAR method)
(d3rlpy.algos.CQL method)
(d3rlpy.algos.DDPG method)
(d3rlpy.algos.DQN method)
(d3rlpy.algos.DiscreteAWR method)
(d3rlpy.algos.DiscreteBC method)
(d3rlpy.algos.DiscreteBCQ method)
(d3rlpy.algos.DiscreteCQL method)
(d3rlpy.algos.DiscreteSAC method)
(d3rlpy.algos.DoubleDQN method)
(d3rlpy.algos.SAC method)
(d3rlpy.algos.TD3 method)
(d3rlpy.dynamics.mopo.MOPO method)
predict_value() (d3rlpy.algos.AWAC method)
(d3rlpy.algos.AWR method)
(d3rlpy.algos.BC method)
(d3rlpy.algos.BCQ method)
(d3rlpy.algos.BEAR method)
(d3rlpy.algos.CQL method)
(d3rlpy.algos.DDPG method)
(d3rlpy.algos.DQN method)
(d3rlpy.algos.DiscreteAWR method)
(d3rlpy.algos.DiscreteBC method)
(d3rlpy.algos.DiscreteBCQ method)
(d3rlpy.algos.DiscreteCQL method)
(d3rlpy.algos.DiscreteSAC method)
(d3rlpy.algos.DoubleDQN method)
(d3rlpy.algos.SAC method)
(d3rlpy.algos.TD3 method)
prev_action (d3rlpy.online.buffers.ReplayBuffer attribute)
prev_observation (d3rlpy.online.buffers.ReplayBuffer attribute)
prev_reward (d3rlpy.online.buffers.ReplayBuffer attribute)
prev_transition (d3rlpy.dataset.Transition attribute)
(d3rlpy.online.buffers.ReplayBuffer attribute)
probability (d3rlpy.augmentation.image.Cutout attribute)
(d3rlpy.augmentation.image.HorizontalFlip attribute)
(d3rlpy.augmentation.image.VerticalFlip attribute)
Q
q_func_type (d3rlpy.algos.AWAC attribute)
(d3rlpy.algos.BCQ attribute)
(d3rlpy.algos.BEAR attribute)
(d3rlpy.algos.CQL attribute)
(d3rlpy.algos.DDPG attribute)
(d3rlpy.algos.DQN attribute)
(d3rlpy.algos.DiscreteBCQ attribute)
(d3rlpy.algos.DiscreteCQL attribute)
(d3rlpy.algos.DiscreteSAC attribute)
(d3rlpy.algos.DoubleDQN attribute)
(d3rlpy.algos.SAC attribute)
(d3rlpy.algos.TD3 attribute)
R
RandomRotation (class in d3rlpy.augmentation.image)
RandomShift (class in d3rlpy.augmentation.image)
reguralizing_rate (d3rlpy.algos.DDPG attribute)
(d3rlpy.algos.TD3 attribute)
ReplayBuffer (class in d3rlpy.online.buffers)
reverse_transform() (d3rlpy.preprocessing.MinMaxScaler method)
(d3rlpy.preprocessing.PixelScaler method)
(d3rlpy.preprocessing.StandardScaler method)
reward (d3rlpy.dataset.Transition attribute)
rewards (d3rlpy.dataset.Episode attribute)
(d3rlpy.dataset.MDPDataset attribute)
(d3rlpy.dataset.TransitionMiniBatch attribute)
rl_start_epoch (d3rlpy.algos.BCQ attribute)
(d3rlpy.algos.BEAR attribute)
RMSpropFactory (class in d3rlpy.optimizers)
S
SAC (class in d3rlpy.algos)
sample() (d3rlpy.online.buffers.ReplayBuffer method)
(d3rlpy.online.explorers.LinearDecayEpsilonGreedy method)
(d3rlpy.online.explorers.NormalNoise method)
sample_action() (d3rlpy.algos.AWAC method)
(d3rlpy.algos.AWR method)
(d3rlpy.algos.BC method)
(d3rlpy.algos.BCQ method)
(d3rlpy.algos.BEAR method)
(d3rlpy.algos.CQL method)
(d3rlpy.algos.DDPG method)
(d3rlpy.algos.DQN method)
(d3rlpy.algos.DiscreteAWR method)
(d3rlpy.algos.DiscreteBC method)
(d3rlpy.algos.DiscreteBCQ method)
(d3rlpy.algos.DiscreteCQL method)
(d3rlpy.algos.DiscreteSAC method)
(d3rlpy.algos.DoubleDQN method)
(d3rlpy.algos.SAC method)
(d3rlpy.algos.TD3 method)
saturation (d3rlpy.augmentation.image.ColorJitter attribute)
save_model() (d3rlpy.algos.AWAC method)
(d3rlpy.algos.AWR method)
(d3rlpy.algos.BC method)
(d3rlpy.algos.BCQ method)
(d3rlpy.algos.BEAR method)
(d3rlpy.algos.CQL method)
(d3rlpy.algos.DDPG method)
(d3rlpy.algos.DQN method)
(d3rlpy.algos.DiscreteAWR method)
(d3rlpy.algos.DiscreteBC method)
(d3rlpy.algos.DiscreteBCQ method)
(d3rlpy.algos.DiscreteCQL method)
(d3rlpy.algos.DiscreteSAC method)
(d3rlpy.algos.DoubleDQN method)
(d3rlpy.algos.SAC method)
(d3rlpy.algos.TD3 method)
(d3rlpy.dynamics.mopo.MOPO method)
save_policy() (d3rlpy.algos.AWAC method)
(d3rlpy.algos.AWR method)
(d3rlpy.algos.BC method)
(d3rlpy.algos.BCQ method)
(d3rlpy.algos.BEAR method)
(d3rlpy.algos.CQL method)
(d3rlpy.algos.DDPG method)
(d3rlpy.algos.DQN method)
(d3rlpy.algos.DiscreteAWR method)
(d3rlpy.algos.DiscreteBC method)
(d3rlpy.algos.DiscreteBCQ method)
(d3rlpy.algos.DiscreteCQL method)
(d3rlpy.algos.DiscreteSAC method)
(d3rlpy.algos.DoubleDQN method)
(d3rlpy.algos.SAC method)
(d3rlpy.algos.TD3 method)
scale (d3rlpy.augmentation.image.Intensity attribute)
scaler (d3rlpy.algos.AWAC attribute)
(d3rlpy.algos.AWR attribute)
(d3rlpy.algos.BC attribute)
(d3rlpy.algos.BCQ attribute)
(d3rlpy.algos.BEAR attribute)
(d3rlpy.algos.CQL attribute)
(d3rlpy.algos.DDPG attribute)
(d3rlpy.algos.DQN attribute)
(d3rlpy.algos.DiscreteAWR attribute)
(d3rlpy.algos.DiscreteBC attribute)
(d3rlpy.algos.DiscreteBCQ attribute)
(d3rlpy.algos.DiscreteCQL attribute)
(d3rlpy.algos.DiscreteSAC attribute)
(d3rlpy.algos.DoubleDQN attribute)
(d3rlpy.algos.SAC attribute)
(d3rlpy.algos.TD3 attribute)
(d3rlpy.dynamics.mopo.MOPO attribute)
set_params() (d3rlpy.algos.AWAC method)
(d3rlpy.algos.AWR method)
(d3rlpy.algos.BC method)
(d3rlpy.algos.BCQ method)
(d3rlpy.algos.BEAR method)
(d3rlpy.algos.CQL method)
(d3rlpy.algos.DDPG method)
(d3rlpy.algos.DQN method)
(d3rlpy.algos.DiscreteAWR method)
(d3rlpy.algos.DiscreteBC method)
(d3rlpy.algos.DiscreteBCQ method)
(d3rlpy.algos.DiscreteCQL method)
(d3rlpy.algos.DiscreteSAC method)
(d3rlpy.algos.DoubleDQN method)
(d3rlpy.algos.SAC method)
(d3rlpy.algos.TD3 method)
(d3rlpy.dynamics.mopo.MOPO method)
SGDFactory (class in d3rlpy.optimizers)
share_encoder (d3rlpy.algos.AWAC attribute)
(d3rlpy.algos.BCQ attribute)
(d3rlpy.algos.BEAR attribute)
(d3rlpy.algos.CQL attribute)
(d3rlpy.algos.DDPG attribute)
(d3rlpy.algos.DQN attribute)
(d3rlpy.algos.DiscreteBCQ attribute)
(d3rlpy.algos.DiscreteSAC attribute)
(d3rlpy.algos.DoubleDQN attribute)
(d3rlpy.algos.SAC attribute)
(d3rlpy.algos.TD3 attribute)
shift_size (d3rlpy.augmentation.image.RandomShift attribute)
SingleAmplitudeScaling (class in d3rlpy.augmentation.vector)
size() (d3rlpy.dataset.Episode method)
(d3rlpy.dataset.MDPDataset method)
(d3rlpy.dataset.TransitionMiniBatch method)
(d3rlpy.online.buffers.ReplayBuffer method)
soft_opc_scorer() (in module d3rlpy.metrics.scorer)
StandardScaler (class in d3rlpy.preprocessing)
start_epsilon (d3rlpy.online.explorers.LinearDecayEpsilonGreedy attribute)
std (d3rlpy.online.explorers.NormalNoise attribute)
(d3rlpy.preprocessing.StandardScaler attribute)
T
target_smoothing_clip (d3rlpy.algos.TD3 attribute)
target_smoothing_sigma (d3rlpy.algos.TD3 attribute)
target_update_interval (d3rlpy.algos.DiscreteBCQ attribute)
(d3rlpy.algos.DQN attribute)
(d3rlpy.algos.DiscreteCQL attribute)
(d3rlpy.algos.DoubleDQN attribute)
tau (d3rlpy.algos.AWAC attribute)
(d3rlpy.algos.BCQ attribute)
(d3rlpy.algos.BEAR attribute)
(d3rlpy.algos.CQL attribute)
(d3rlpy.algos.DDPG attribute)
(d3rlpy.algos.SAC attribute)
(d3rlpy.algos.TD3 attribute)
TD3 (class in d3rlpy.algos)
td_error_scorer() (in module d3rlpy.metrics.scorer)
temp_learning_rate (d3rlpy.algos.BEAR attribute)
(d3rlpy.algos.CQL attribute)
(d3rlpy.algos.DiscreteSAC attribute)
(d3rlpy.algos.SAC attribute)
temp_optim_factory (d3rlpy.algos.BEAR attribute)
(d3rlpy.algos.CQL attribute)
(d3rlpy.algos.DiscreteSAC attribute)
(d3rlpy.algos.SAC attribute)
terminal (d3rlpy.dataset.Transition attribute)
terminals (d3rlpy.dataset.MDPDataset attribute)
(d3rlpy.dataset.TransitionMiniBatch attribute)
train() (in module d3rlpy.online.iterators)
transform() (d3rlpy.augmentation.image.ColorJitter method)
(d3rlpy.augmentation.image.Cutout method)
(d3rlpy.augmentation.image.HorizontalFlip method)
(d3rlpy.augmentation.image.Intensity method)
(d3rlpy.augmentation.image.RandomRotation method)
(d3rlpy.augmentation.image.RandomShift method)
(d3rlpy.augmentation.image.VerticalFlip method)
(d3rlpy.augmentation.vector.MultipleAmplitudeScaling method)
(d3rlpy.augmentation.vector.SingleAmplitudeScaling method)
(d3rlpy.preprocessing.MinMaxScaler method)
(d3rlpy.preprocessing.PixelScaler method)
(d3rlpy.preprocessing.StandardScaler method)
Transition (class in d3rlpy.dataset)
TransitionMiniBatch (class in d3rlpy.dataset)
transitions (d3rlpy.dataset.Episode attribute)
(d3rlpy.dataset.TransitionMiniBatch attribute)
(d3rlpy.online.buffers.ReplayBuffer attribute)
TYPE (d3rlpy.augmentation.image.ColorJitter attribute)
(d3rlpy.augmentation.image.Cutout attribute)
(d3rlpy.augmentation.image.HorizontalFlip attribute)
(d3rlpy.augmentation.image.Intensity attribute)
(d3rlpy.augmentation.image.RandomRotation attribute)
(d3rlpy.augmentation.image.RandomShift attribute)
(d3rlpy.augmentation.image.VerticalFlip attribute)
(d3rlpy.augmentation.vector.MultipleAmplitudeScaling attribute)
(d3rlpy.augmentation.vector.SingleAmplitudeScaling attribute)
(d3rlpy.encoders.DefaultEncoderFactory attribute)
(d3rlpy.encoders.PixelEncoderFactory attribute)
(d3rlpy.encoders.VectorEncoderFactory attribute)
(d3rlpy.preprocessing.MinMaxScaler attribute)
(d3rlpy.preprocessing.PixelScaler attribute)
(d3rlpy.preprocessing.StandardScaler attribute)
U
update() (d3rlpy.algos.AWAC method)
(d3rlpy.algos.AWR method)
(d3rlpy.algos.BC method)
(d3rlpy.algos.BCQ method)
(d3rlpy.algos.BEAR method)
(d3rlpy.algos.CQL method)
(d3rlpy.algos.DDPG method)
(d3rlpy.algos.DQN method)
(d3rlpy.algos.DiscreteAWR method)
(d3rlpy.algos.DiscreteBC method)
(d3rlpy.algos.DiscreteBCQ method)
(d3rlpy.algos.DiscreteCQL method)
(d3rlpy.algos.DiscreteSAC method)
(d3rlpy.algos.DoubleDQN method)
(d3rlpy.algos.SAC method)
(d3rlpy.algos.TD3 method)
(d3rlpy.dynamics.mopo.MOPO method)
update_actor_interval (d3rlpy.algos.AWAC attribute)
(d3rlpy.algos.BCQ attribute)
(d3rlpy.algos.BEAR attribute)
(d3rlpy.algos.CQL attribute)
(d3rlpy.algos.SAC attribute)
(d3rlpy.algos.TD3 attribute)
use_batch_norm (d3rlpy.encoders.DefaultEncoderFactory attribute)
(d3rlpy.encoders.PixelEncoderFactory attribute)
(d3rlpy.encoders.VectorEncoderFactory attribute)
use_gpu (d3rlpy.algos.AWAC attribute)
(d3rlpy.algos.AWR attribute)
(d3rlpy.algos.BC attribute)
(d3rlpy.algos.BCQ attribute)
(d3rlpy.algos.BEAR attribute)
(d3rlpy.algos.CQL attribute)
(d3rlpy.algos.DDPG attribute)
(d3rlpy.algos.DQN attribute)
(d3rlpy.algos.DiscreteAWR attribute)
(d3rlpy.algos.DiscreteBC attribute)
(d3rlpy.algos.DiscreteBCQ attribute)
(d3rlpy.algos.DiscreteCQL attribute)
(d3rlpy.algos.DiscreteSAC attribute)
(d3rlpy.algos.DoubleDQN attribute)
(d3rlpy.algos.SAC attribute)
(d3rlpy.algos.TD3 attribute)
(d3rlpy.dynamics.mopo.MOPO attribute)
V
value_estimation_std_scorer() (in module d3rlpy.metrics.scorer)
VectorEncoderFactory (class in d3rlpy.encoders)
VerticalFlip (class in d3rlpy.augmentation.image)
Read the Docs
v: v0.40
Versions
latest
stable
v0.40
v0.32
v0.31
v0.30
v0.23
v0.22
v0.21
v0.2
v0.1
Downloads
pdf
html
epub
On Read the Docs
Project Home
Builds
Free document hosting provided by Read the Docs.