d3rlpy
v0.31
Tutorials
Getting Started
Jupyter Notebooks
References
API Reference
Installation
Other
License
d3rlpy
Docs » Index
Edit on GitHub
Index
_ | A | B | C | D | E | F | G | H | I | L | M | N | O | P | Q | R | S | T | U | V | W
_
__getitem__() (d3rlpy.dataset.Episode method)
(d3rlpy.dataset.MDPDataset method)
__iter__() (d3rlpy.dataset.Episode method)
(d3rlpy.dataset.MDPDataset method)
__len__() (d3rlpy.dataset.Episode method)
(d3rlpy.dataset.MDPDataset method)
(d3rlpy.online.buffers.ReplayBuffer method)
A
action (d3rlpy.dataset.Transition attribute)
action_flexibility (d3rlpy.algos.BCQ attribute)
(d3rlpy.algos.DiscreteBCQ attribute)
action_size (d3rlpy.online.buffers.ReplayBuffer attribute)
actions (d3rlpy.dataset.Episode attribute)
(d3rlpy.dataset.MDPDataset attribute)
(d3rlpy.dataset.TransitionMiniBatch attribute)
actor_learning_rate (d3rlpy.algos.AWAC attribute)
(d3rlpy.algos.AWR attribute)
(d3rlpy.algos.BCQ attribute)
(d3rlpy.algos.BEAR attribute)
(d3rlpy.algos.CQL attribute)
(d3rlpy.algos.DDPG attribute)
(d3rlpy.algos.DiscreteAWR attribute)
(d3rlpy.algos.SAC attribute)
(d3rlpy.algos.TD3 attribute)
actor_weight_decay (d3rlpy.algos.AWAC attribute)
alpha_learning_rate (d3rlpy.algos.BEAR attribute)
(d3rlpy.algos.CQL attribute)
alpha_threshold (d3rlpy.algos.BEAR attribute)
(d3rlpy.algos.CQL attribute)
append() (d3rlpy.dataset.MDPDataset method)
(d3rlpy.online.buffers.ReplayBuffer method)
append_episode() (d3rlpy.online.buffers.ReplayBuffer method)
augmentation (d3rlpy.algos.AWAC attribute)
(d3rlpy.algos.AWR attribute)
(d3rlpy.algos.BC attribute)
(d3rlpy.algos.BCQ attribute)
(d3rlpy.algos.BEAR attribute)
(d3rlpy.algos.CQL attribute)
(d3rlpy.algos.DDPG attribute)
(d3rlpy.algos.DQN attribute)
(d3rlpy.algos.DiscreteAWR attribute)
(d3rlpy.algos.DiscreteBC attribute)
(d3rlpy.algos.DiscreteBCQ attribute)
(d3rlpy.algos.DiscreteCQL attribute)
(d3rlpy.algos.DoubleDQN attribute)
(d3rlpy.algos.SAC attribute)
(d3rlpy.algos.TD3 attribute)
(d3rlpy.dynamics.mopo.MOPO attribute)
average_value_estimation_scorer() (in module d3rlpy.metrics.scorer)
AWAC (class in d3rlpy.algos)
AWR (class in d3rlpy.algos)
B
batch_size (d3rlpy.algos.AWAC attribute)
(d3rlpy.algos.AWR attribute)
(d3rlpy.algos.BC attribute)
(d3rlpy.algos.BCQ attribute)
(d3rlpy.algos.BEAR attribute)
(d3rlpy.algos.CQL attribute)
(d3rlpy.algos.DDPG attribute)
(d3rlpy.algos.DQN attribute)
(d3rlpy.algos.DiscreteAWR attribute)
(d3rlpy.algos.DiscreteBC attribute)
(d3rlpy.algos.DiscreteBCQ attribute)
(d3rlpy.algos.DiscreteCQL attribute)
(d3rlpy.algos.DoubleDQN attribute)
(d3rlpy.algos.SAC attribute)
(d3rlpy.algos.TD3 attribute)
(d3rlpy.dynamics.mopo.MOPO attribute)
batch_size_per_update (d3rlpy.algos.AWR attribute)
(d3rlpy.algos.DiscreteAWR attribute)
BC (class in d3rlpy.algos)
BCQ (class in d3rlpy.algos)
BEAR (class in d3rlpy.algos)
beta (d3rlpy.algos.AWR attribute)
(d3rlpy.algos.BCQ attribute)
(d3rlpy.algos.DiscreteAWR attribute)
(d3rlpy.algos.DiscreteBC attribute)
(d3rlpy.algos.DiscreteBCQ attribute)
bootstrap (d3rlpy.algos.AWAC attribute)
(d3rlpy.algos.BCQ attribute)
(d3rlpy.algos.BEAR attribute)
(d3rlpy.algos.CQL attribute)
(d3rlpy.algos.DDPG attribute)
(d3rlpy.algos.DQN attribute)
(d3rlpy.algos.DiscreteBCQ attribute)
(d3rlpy.algos.DiscreteCQL attribute)
(d3rlpy.algos.DoubleDQN attribute)
(d3rlpy.algos.SAC attribute)
(d3rlpy.algos.TD3 attribute)
brightness (d3rlpy.augmentation.image.ColorJitter attribute)
build_episodes() (d3rlpy.dataset.MDPDataset method)
build_transitions() (d3rlpy.dataset.Episode method)
C
clip_reward() (d3rlpy.dataset.MDPDataset method)
ColorJitter (class in d3rlpy.augmentation.image)
compare_continuous_action_diff() (in module d3rlpy.metrics.comparer)
compare_discrete_action_match() (in module d3rlpy.metrics.comparer)
compute_epsilon() (d3rlpy.online.explorers.LinearDecayEpsilonGreedy method)
compute_return() (d3rlpy.dataset.Episode method)
compute_stats() (d3rlpy.dataset.MDPDataset method)
continuous_action_diff_scorer() (in module d3rlpy.metrics.scorer)
contrast (d3rlpy.augmentation.image.ColorJitter attribute)
CQL (class in d3rlpy.algos)
create_impl() (d3rlpy.algos.AWAC method)
(d3rlpy.algos.AWR method)
(d3rlpy.algos.BC method)
(d3rlpy.algos.BCQ method)
(d3rlpy.algos.BEAR method)
(d3rlpy.algos.CQL method)
(d3rlpy.algos.DDPG method)
(d3rlpy.algos.DQN method)
(d3rlpy.algos.DiscreteAWR method)
(d3rlpy.algos.DiscreteBC method)
(d3rlpy.algos.DiscreteBCQ method)
(d3rlpy.algos.DiscreteCQL method)
(d3rlpy.algos.DoubleDQN method)
(d3rlpy.algos.SAC method)
(d3rlpy.algos.TD3 method)
(d3rlpy.dynamics.mopo.MOPO method)
critic_learning_rate (d3rlpy.algos.AWAC attribute)
(d3rlpy.algos.AWR attribute)
(d3rlpy.algos.BCQ attribute)
(d3rlpy.algos.BEAR attribute)
(d3rlpy.algos.CQL attribute)
(d3rlpy.algos.DDPG attribute)
(d3rlpy.algos.DiscreteAWR attribute)
(d3rlpy.algos.SAC attribute)
(d3rlpy.algos.TD3 attribute)
Cutout (class in d3rlpy.augmentation.image)
D
d3rlpy (module)
d3rlpy.algos (module)
d3rlpy.augmentation (module)
d3rlpy.dataset (module)
d3rlpy.datasets (module)
d3rlpy.dynamics (module)
d3rlpy.metrics (module)
d3rlpy.models.torch.q_functions (module)
d3rlpy.online (module)
d3rlpy.preprocessing (module)
DDPG (class in d3rlpy.algos)
degree (d3rlpy.augmentation.image.RandomRotation attribute)
discounted_sum_of_advantage_scorer() (in module d3rlpy.metrics.scorer)
discrete_action (d3rlpy.dynamics.mopo.MOPO attribute)
discrete_action_match_scorer() (in module d3rlpy.metrics.scorer)
DiscreteAWR (class in d3rlpy.algos)
DiscreteBC (class in d3rlpy.algos)
DiscreteBCQ (class in d3rlpy.algos)
DiscreteCQL (class in d3rlpy.algos)
DoubleDQN (class in d3rlpy.algos)
DQN (class in d3rlpy.algos)
dump() (d3rlpy.dataset.MDPDataset method)
duration (d3rlpy.online.explorers.LinearDecayEpsilonGreedy attribute)
dynamics (d3rlpy.algos.AWAC attribute)
(d3rlpy.algos.AWR attribute)
(d3rlpy.algos.BC attribute)
(d3rlpy.algos.BCQ attribute)
(d3rlpy.algos.BEAR attribute)
(d3rlpy.algos.CQL attribute)
(d3rlpy.algos.DDPG attribute)
(d3rlpy.algos.DQN attribute)
(d3rlpy.algos.DiscreteAWR attribute)
(d3rlpy.algos.DiscreteBC attribute)
(d3rlpy.algos.DiscreteBCQ attribute)
(d3rlpy.algos.DiscreteCQL attribute)
(d3rlpy.algos.DoubleDQN attribute)
(d3rlpy.algos.SAC attribute)
(d3rlpy.algos.TD3 attribute)
dynamics_observation_prediction_error_scorer() (in module d3rlpy.metrics.scorer)
dynamics_prediction_variance_scorer() (in module d3rlpy.metrics.scorer)
dynamics_reward_prediction_error_scorer() (in module d3rlpy.metrics.scorer)
E
encoder_params (d3rlpy.algos.AWAC attribute)
(d3rlpy.algos.AWR attribute)
(d3rlpy.algos.BC attribute)
(d3rlpy.algos.BCQ attribute)
(d3rlpy.algos.BEAR attribute)
(d3rlpy.algos.CQL attribute)
(d3rlpy.algos.DDPG attribute)
(d3rlpy.algos.DQN attribute)
(d3rlpy.algos.DiscreteAWR attribute)
(d3rlpy.algos.DiscreteBC attribute)
(d3rlpy.algos.DiscreteBCQ attribute)
(d3rlpy.algos.DiscreteCQL attribute)
(d3rlpy.algos.DoubleDQN attribute)
(d3rlpy.algos.SAC attribute)
(d3rlpy.algos.TD3 attribute)
end_epsilon (d3rlpy.online.explorers.LinearDecayEpsilonGreedy attribute)
Episode (class in d3rlpy.dataset)
episodes (d3rlpy.dataset.MDPDataset attribute)
eps (d3rlpy.algos.AWAC attribute)
(d3rlpy.algos.BC attribute)
(d3rlpy.algos.BCQ attribute)
(d3rlpy.algos.BEAR attribute)
(d3rlpy.algos.CQL attribute)
(d3rlpy.algos.DDPG attribute)
(d3rlpy.algos.DQN attribute)
(d3rlpy.algos.DiscreteBC attribute)
(d3rlpy.algos.DiscreteBCQ attribute)
(d3rlpy.algos.DiscreteCQL attribute)
(d3rlpy.algos.DoubleDQN attribute)
(d3rlpy.algos.SAC attribute)
(d3rlpy.algos.TD3 attribute)
(d3rlpy.dynamics.mopo.MOPO attribute)
eval_results_ (d3rlpy.algos.AWR attribute)
(d3rlpy.algos.BC attribute)
(d3rlpy.algos.BCQ attribute)
(d3rlpy.algos.BEAR attribute)
(d3rlpy.algos.CQL attribute)
(d3rlpy.algos.DDPG attribute)
(d3rlpy.algos.DQN attribute)
(d3rlpy.algos.DiscreteAWR attribute)
(d3rlpy.algos.DiscreteBC attribute)
(d3rlpy.algos.DiscreteBCQ attribute)
(d3rlpy.algos.DiscreteCQL attribute)
(d3rlpy.algos.SAC attribute)
(d3rlpy.algos.TD3 attribute)
(d3rlpy.dynamics.mopo.MOPO attribute)
evaluate_on_environment() (in module d3rlpy.metrics.scorer)
extend() (d3rlpy.dataset.MDPDataset method)
F
fit() (d3rlpy.algos.AWAC method)
(d3rlpy.algos.AWR method)
(d3rlpy.algos.BC method)
(d3rlpy.algos.BCQ method)
(d3rlpy.algos.BEAR method)
(d3rlpy.algos.CQL method)
(d3rlpy.algos.DDPG method)
(d3rlpy.algos.DQN method)
(d3rlpy.algos.DiscreteAWR method)
(d3rlpy.algos.DiscreteBC method)
(d3rlpy.algos.DiscreteBCQ method)
(d3rlpy.algos.DiscreteCQL method)
(d3rlpy.algos.DoubleDQN method)
(d3rlpy.algos.SAC method)
(d3rlpy.algos.TD3 method)
(d3rlpy.dynamics.mopo.MOPO method)
(d3rlpy.preprocessing.MinMaxScaler method)
(d3rlpy.preprocessing.PixelScaler method)
(d3rlpy.preprocessing.StandardScaler method)
fit_online() (d3rlpy.algos.AWAC method)
(d3rlpy.algos.AWR method)
(d3rlpy.algos.BC method)
(d3rlpy.algos.BCQ method)
(d3rlpy.algos.BEAR method)
(d3rlpy.algos.CQL method)
(d3rlpy.algos.DDPG method)
(d3rlpy.algos.DQN method)
(d3rlpy.algos.DiscreteAWR method)
(d3rlpy.algos.DiscreteBC method)
(d3rlpy.algos.DiscreteBCQ method)
(d3rlpy.algos.DiscreteCQL method)
(d3rlpy.algos.DoubleDQN method)
(d3rlpy.algos.SAC method)
(d3rlpy.algos.TD3 method)
from_json() (d3rlpy.algos.AWAC class method)
(d3rlpy.algos.AWR class method)
(d3rlpy.algos.BC class method)
(d3rlpy.algos.BCQ class method)
(d3rlpy.algos.BEAR class method)
(d3rlpy.algos.CQL class method)
(d3rlpy.algos.DDPG class method)
(d3rlpy.algos.DQN class method)
(d3rlpy.algos.DiscreteAWR class method)
(d3rlpy.algos.DiscreteBC class method)
(d3rlpy.algos.DiscreteBCQ class method)
(d3rlpy.algos.DiscreteCQL class method)
(d3rlpy.algos.DoubleDQN class method)
(d3rlpy.algos.SAC class method)
(d3rlpy.algos.TD3 class method)
(d3rlpy.dynamics.mopo.MOPO class method)
G
gamma (d3rlpy.algos.AWAC attribute)
(d3rlpy.algos.AWR attribute)
(d3rlpy.algos.BCQ attribute)
(d3rlpy.algos.BEAR attribute)
(d3rlpy.algos.CQL attribute)
(d3rlpy.algos.DDPG attribute)
(d3rlpy.algos.DQN attribute)
(d3rlpy.algos.DiscreteAWR attribute)
(d3rlpy.algos.DiscreteBCQ attribute)
(d3rlpy.algos.DiscreteCQL attribute)
(d3rlpy.algos.DoubleDQN attribute)
(d3rlpy.algos.SAC attribute)
(d3rlpy.algos.TD3 attribute)
generate() (d3rlpy.dynamics.mopo.MOPO method)
get_action_size() (d3rlpy.dataset.Episode method)
(d3rlpy.dataset.MDPDataset method)
(d3rlpy.dataset.Transition method)
get_atari() (in module d3rlpy.datasets)
get_cartpole() (in module d3rlpy.datasets)
get_observation_shape() (d3rlpy.dataset.Episode method)
(d3rlpy.dataset.MDPDataset method)
(d3rlpy.dataset.Transition method)
get_params() (d3rlpy.algos.AWAC method)
(d3rlpy.algos.AWR method)
(d3rlpy.algos.BC method)
(d3rlpy.algos.BCQ method)
(d3rlpy.algos.BEAR method)
(d3rlpy.algos.CQL method)
(d3rlpy.algos.DDPG method)
(d3rlpy.algos.DQN method)
(d3rlpy.algos.DiscreteAWR method)
(d3rlpy.algos.DiscreteBC method)
(d3rlpy.algos.DiscreteBCQ method)
(d3rlpy.algos.DiscreteCQL method)
(d3rlpy.algos.DoubleDQN method)
(d3rlpy.algos.SAC method)
(d3rlpy.algos.TD3 method)
(d3rlpy.augmentation.image.ColorJitter method)
(d3rlpy.augmentation.image.Cutout method)
(d3rlpy.augmentation.image.HorizontalFlip method)
(d3rlpy.augmentation.image.Intensity method)
(d3rlpy.augmentation.image.RandomRotation method)
(d3rlpy.augmentation.image.RandomShift method)
(d3rlpy.augmentation.image.VerticalFlip method)
(d3rlpy.augmentation.vector.MultipleAmplitudeScaling method)
(d3rlpy.augmentation.vector.SingleAmplitudeScaling method)
(d3rlpy.dynamics.mopo.MOPO method)
(d3rlpy.preprocessing.MinMaxScaler method)
(d3rlpy.preprocessing.PixelScaler method)
(d3rlpy.preprocessing.StandardScaler method)
get_pendulum() (in module d3rlpy.datasets)
get_pybullet() (in module d3rlpy.datasets)
get_type() (d3rlpy.augmentation.image.ColorJitter method)
(d3rlpy.augmentation.image.Cutout method)
(d3rlpy.augmentation.image.HorizontalFlip method)
(d3rlpy.augmentation.image.Intensity method)
(d3rlpy.augmentation.image.RandomRotation method)
(d3rlpy.augmentation.image.RandomShift method)
(d3rlpy.augmentation.image.VerticalFlip method)
(d3rlpy.augmentation.vector.MultipleAmplitudeScaling method)
(d3rlpy.augmentation.vector.SingleAmplitudeScaling method)
(d3rlpy.preprocessing.MinMaxScaler method)
(d3rlpy.preprocessing.PixelScaler method)
(d3rlpy.preprocessing.StandardScaler method)
H
horizon (d3rlpy.dynamics.mopo.MOPO attribute)
HorizontalFlip (class in d3rlpy.augmentation.image)
hue (d3rlpy.augmentation.image.ColorJitter attribute)
I
imitator_learning_rate (d3rlpy.algos.BCQ attribute)
(d3rlpy.algos.BEAR attribute)
impl (d3rlpy.algos.AWAC attribute)
(d3rlpy.algos.AWR attribute)
(d3rlpy.algos.BC attribute)
(d3rlpy.algos.BCQ attribute)
(d3rlpy.algos.BEAR attribute)
(d3rlpy.algos.CQL attribute)
(d3rlpy.algos.DDPG attribute)
(d3rlpy.algos.DQN attribute)
(d3rlpy.algos.DiscreteAWR attribute)
(d3rlpy.algos.DiscreteBC attribute)
(d3rlpy.algos.DiscreteBCQ attribute)
(d3rlpy.algos.DiscreteCQL attribute)
(d3rlpy.algos.DoubleDQN attribute)
(d3rlpy.algos.SAC attribute)
(d3rlpy.algos.TD3 attribute)
(d3rlpy.dynamics.mopo.MOPO attribute)
initial_alpha (d3rlpy.algos.BEAR attribute)
(d3rlpy.algos.CQL attribute)
initial_state_value_estimation_scorer() (in module d3rlpy.metrics.scorer)
initial_temperature (d3rlpy.algos.BEAR attribute)
(d3rlpy.algos.CQL attribute)
(d3rlpy.algos.SAC attribute)
Intensity (class in d3rlpy.augmentation.image)
is_action_discrete() (d3rlpy.dataset.MDPDataset method)
L
lam (d3rlpy.algos.AWAC attribute)
(d3rlpy.algos.AWR attribute)
(d3rlpy.algos.BCQ attribute)
(d3rlpy.algos.BEAR attribute)
(d3rlpy.algos.DiscreteAWR attribute)
(d3rlpy.dynamics.mopo.MOPO attribute)
latent_size (d3rlpy.algos.BCQ attribute)
learning_rate (d3rlpy.algos.BC attribute)
(d3rlpy.algos.DQN attribute)
(d3rlpy.algos.DiscreteBC attribute)
(d3rlpy.algos.DiscreteBCQ attribute)
(d3rlpy.algos.DiscreteCQL attribute)
(d3rlpy.algos.DoubleDQN attribute)
(d3rlpy.dynamics.mopo.MOPO attribute)
LinearDecayEpsilonGreedy (class in d3rlpy.online.explorers)
load() (d3rlpy.dataset.MDPDataset class method)
load_model() (d3rlpy.algos.AWAC method)
(d3rlpy.algos.AWR method)
(d3rlpy.algos.BC method)
(d3rlpy.algos.BCQ method)
(d3rlpy.algos.BEAR method)
(d3rlpy.algos.CQL method)
(d3rlpy.algos.DDPG method)
(d3rlpy.algos.DQN method)
(d3rlpy.algos.DiscreteAWR method)
(d3rlpy.algos.DiscreteBC method)
(d3rlpy.algos.DiscreteBCQ method)
(d3rlpy.algos.DiscreteCQL method)
(d3rlpy.algos.DoubleDQN method)
(d3rlpy.algos.SAC method)
(d3rlpy.algos.TD3 method)
(d3rlpy.dynamics.mopo.MOPO method)
M
max_weight (d3rlpy.algos.AWAC attribute)
(d3rlpy.algos.AWR attribute)
(d3rlpy.algos.DiscreteAWR attribute)
maximum (d3rlpy.augmentation.vector.MultipleAmplitudeScaling attribute)
(d3rlpy.augmentation.vector.SingleAmplitudeScaling attribute)
(d3rlpy.preprocessing.MinMaxScaler attribute)
MDPDataset (class in d3rlpy.dataset)
mean (d3rlpy.online.explorers.NormalNoise attribute)
(d3rlpy.preprocessing.StandardScaler attribute)
minimum (d3rlpy.augmentation.vector.MultipleAmplitudeScaling attribute)
(d3rlpy.augmentation.vector.SingleAmplitudeScaling attribute)
(d3rlpy.preprocessing.MinMaxScaler attribute)
MinMaxScaler (class in d3rlpy.preprocessing)
mmd_sigma (d3rlpy.algos.BEAR attribute)
momentum (d3rlpy.algos.AWR attribute)
(d3rlpy.algos.DiscreteAWR attribute)
MOPO (class in d3rlpy.dynamics.mopo)
MultipleAmplitudeScaling (class in d3rlpy.augmentation.vector)
N
n_action_samples (d3rlpy.algos.AWAC attribute)
(d3rlpy.algos.BCQ attribute)
(d3rlpy.algos.BEAR attribute)
(d3rlpy.algos.CQL attribute)
n_actor_updates (d3rlpy.algos.AWR attribute)
(d3rlpy.algos.DiscreteAWR attribute)
n_augmentations (d3rlpy.algos.AWAC attribute)
(d3rlpy.algos.AWR attribute)
(d3rlpy.algos.BC attribute)
(d3rlpy.algos.BCQ attribute)
(d3rlpy.algos.BEAR attribute)
(d3rlpy.algos.CQL attribute)
(d3rlpy.algos.DDPG attribute)
(d3rlpy.algos.DQN attribute)
(d3rlpy.algos.DiscreteAWR attribute)
(d3rlpy.algos.DiscreteBC attribute)
(d3rlpy.algos.DiscreteBCQ attribute)
(d3rlpy.algos.DiscreteCQL attribute)
(d3rlpy.algos.DoubleDQN attribute)
(d3rlpy.algos.SAC attribute)
(d3rlpy.algos.TD3 attribute)
n_critic_updates (d3rlpy.algos.AWR attribute)
(d3rlpy.algos.DiscreteAWR attribute)
n_critics (d3rlpy.algos.AWAC attribute)
(d3rlpy.algos.BCQ attribute)
(d3rlpy.algos.BEAR attribute)
(d3rlpy.algos.CQL attribute)
(d3rlpy.algos.DDPG attribute)
(d3rlpy.algos.DQN attribute)
(d3rlpy.algos.DiscreteBCQ attribute)
(d3rlpy.algos.DiscreteCQL attribute)
(d3rlpy.algos.DoubleDQN attribute)
(d3rlpy.algos.SAC attribute)
(d3rlpy.algos.TD3 attribute)
n_ensembles (d3rlpy.dynamics.mopo.MOPO attribute)
n_frames (d3rlpy.algos.AWAC attribute)
(d3rlpy.algos.AWR attribute)
(d3rlpy.algos.BC attribute)
(d3rlpy.algos.BCQ attribute)
(d3rlpy.algos.BEAR attribute)
(d3rlpy.algos.CQL attribute)
(d3rlpy.algos.DDPG attribute)
(d3rlpy.algos.DQN attribute)
(d3rlpy.algos.DiscreteAWR attribute)
(d3rlpy.algos.DiscreteBC attribute)
(d3rlpy.algos.DiscreteBCQ attribute)
(d3rlpy.algos.DiscreteCQL attribute)
(d3rlpy.algos.DoubleDQN attribute)
(d3rlpy.algos.SAC attribute)
(d3rlpy.algos.TD3 attribute)
(d3rlpy.dynamics.mopo.MOPO attribute)
n_transitions (d3rlpy.dynamics.mopo.MOPO attribute)
next_action (d3rlpy.dataset.Transition attribute)
next_actions (d3rlpy.dataset.TransitionMiniBatch attribute)
next_observation (d3rlpy.dataset.Transition attribute)
next_observations (d3rlpy.dataset.TransitionMiniBatch attribute)
next_reward (d3rlpy.dataset.Transition attribute)
next_rewards (d3rlpy.dataset.TransitionMiniBatch attribute)
next_transition (d3rlpy.dataset.Transition attribute)
NormalNoise (class in d3rlpy.online.explorers)
O
observation (d3rlpy.dataset.Transition attribute)
observation_shape (d3rlpy.online.buffers.ReplayBuffer attribute)
observations (d3rlpy.dataset.Episode attribute)
(d3rlpy.dataset.MDPDataset attribute)
(d3rlpy.dataset.TransitionMiniBatch attribute)
P
PixelScaler (class in d3rlpy.preprocessing)
predict() (d3rlpy.algos.AWAC method)
(d3rlpy.algos.AWR method)
(d3rlpy.algos.BC method)
(d3rlpy.algos.BCQ method)
(d3rlpy.algos.BEAR method)
(d3rlpy.algos.CQL method)
(d3rlpy.algos.DDPG method)
(d3rlpy.algos.DQN method)
(d3rlpy.algos.DiscreteAWR method)
(d3rlpy.algos.DiscreteBC method)
(d3rlpy.algos.DiscreteBCQ method)
(d3rlpy.algos.DiscreteCQL method)
(d3rlpy.algos.DoubleDQN method)
(d3rlpy.algos.SAC method)
(d3rlpy.algos.TD3 method)
(d3rlpy.dynamics.mopo.MOPO method)
predict_value() (d3rlpy.algos.AWAC method)
(d3rlpy.algos.AWR method)
(d3rlpy.algos.BC method)
(d3rlpy.algos.BCQ method)
(d3rlpy.algos.BEAR method)
(d3rlpy.algos.CQL method)
(d3rlpy.algos.DDPG method)
(d3rlpy.algos.DQN method)
(d3rlpy.algos.DiscreteAWR method)
(d3rlpy.algos.DiscreteBC method)
(d3rlpy.algos.DiscreteBCQ method)
(d3rlpy.algos.DiscreteCQL method)
(d3rlpy.algos.DoubleDQN method)
(d3rlpy.algos.SAC method)
(d3rlpy.algos.TD3 method)
prev_action (d3rlpy.online.buffers.ReplayBuffer attribute)
prev_observation (d3rlpy.online.buffers.ReplayBuffer attribute)
prev_reward (d3rlpy.online.buffers.ReplayBuffer attribute)
prev_transition (d3rlpy.dataset.Transition attribute)
(d3rlpy.online.buffers.ReplayBuffer attribute)
probability (d3rlpy.augmentation.image.Cutout attribute)
(d3rlpy.augmentation.image.HorizontalFlip attribute)
(d3rlpy.augmentation.image.VerticalFlip attribute)
Q
q_func_type (d3rlpy.algos.AWAC attribute)
(d3rlpy.algos.BCQ attribute)
(d3rlpy.algos.BEAR attribute)
(d3rlpy.algos.CQL attribute)
(d3rlpy.algos.DDPG attribute)
(d3rlpy.algos.DQN attribute)
(d3rlpy.algos.DiscreteBCQ attribute)
(d3rlpy.algos.DiscreteCQL attribute)
(d3rlpy.algos.DoubleDQN attribute)
(d3rlpy.algos.SAC attribute)
(d3rlpy.algos.TD3 attribute)
R
RandomRotation (class in d3rlpy.augmentation.image)
RandomShift (class in d3rlpy.augmentation.image)
reguralizing_rate (d3rlpy.algos.DDPG attribute)
(d3rlpy.algos.TD3 attribute)
ReplayBuffer (class in d3rlpy.online.buffers)
reverse_transform() (d3rlpy.preprocessing.MinMaxScaler method)
(d3rlpy.preprocessing.PixelScaler method)
(d3rlpy.preprocessing.StandardScaler method)
reward (d3rlpy.dataset.Transition attribute)
rewards (d3rlpy.dataset.Episode attribute)
(d3rlpy.dataset.MDPDataset attribute)
(d3rlpy.dataset.TransitionMiniBatch attribute)
rl_start_epoch (d3rlpy.algos.BCQ attribute)
(d3rlpy.algos.BEAR attribute)
S
SAC (class in d3rlpy.algos)
sample() (d3rlpy.online.buffers.ReplayBuffer method)
(d3rlpy.online.explorers.LinearDecayEpsilonGreedy method)
(d3rlpy.online.explorers.NormalNoise method)
sample_action() (d3rlpy.algos.AWAC method)
(d3rlpy.algos.AWR method)
(d3rlpy.algos.BC method)
(d3rlpy.algos.BCQ method)
(d3rlpy.algos.BEAR method)
(d3rlpy.algos.CQL method)
(d3rlpy.algos.DDPG method)
(d3rlpy.algos.DQN method)
(d3rlpy.algos.DiscreteAWR method)
(d3rlpy.algos.DiscreteBC method)
(d3rlpy.algos.DiscreteBCQ method)
(d3rlpy.algos.DiscreteCQL method)
(d3rlpy.algos.DoubleDQN method)
(d3rlpy.algos.SAC method)
(d3rlpy.algos.TD3 method)
saturation (d3rlpy.augmentation.image.ColorJitter attribute)
save_model() (d3rlpy.algos.AWAC method)
(d3rlpy.algos.AWR method)
(d3rlpy.algos.BC method)
(d3rlpy.algos.BCQ method)
(d3rlpy.algos.BEAR method)
(d3rlpy.algos.CQL method)
(d3rlpy.algos.DDPG method)
(d3rlpy.algos.DQN method)
(d3rlpy.algos.DiscreteAWR method)
(d3rlpy.algos.DiscreteBC method)
(d3rlpy.algos.DiscreteBCQ method)
(d3rlpy.algos.DiscreteCQL method)
(d3rlpy.algos.DoubleDQN method)
(d3rlpy.algos.SAC method)
(d3rlpy.algos.TD3 method)
(d3rlpy.dynamics.mopo.MOPO method)
save_policy() (d3rlpy.algos.AWAC method)
(d3rlpy.algos.AWR method)
(d3rlpy.algos.BC method)
(d3rlpy.algos.BCQ method)
(d3rlpy.algos.BEAR method)
(d3rlpy.algos.CQL method)
(d3rlpy.algos.DDPG method)
(d3rlpy.algos.DQN method)
(d3rlpy.algos.DiscreteAWR method)
(d3rlpy.algos.DiscreteBC method)
(d3rlpy.algos.DiscreteBCQ method)
(d3rlpy.algos.DiscreteCQL method)
(d3rlpy.algos.DoubleDQN method)
(d3rlpy.algos.SAC method)
(d3rlpy.algos.TD3 method)
scale (d3rlpy.augmentation.image.Intensity attribute)
scaler (d3rlpy.algos.AWAC attribute)
(d3rlpy.algos.AWR attribute)
(d3rlpy.algos.BC attribute)
(d3rlpy.algos.BCQ attribute)
(d3rlpy.algos.BEAR attribute)
(d3rlpy.algos.CQL attribute)
(d3rlpy.algos.DDPG attribute)
(d3rlpy.algos.DQN attribute)
(d3rlpy.algos.DiscreteAWR attribute)
(d3rlpy.algos.DiscreteBC attribute)
(d3rlpy.algos.DiscreteBCQ attribute)
(d3rlpy.algos.DiscreteCQL attribute)
(d3rlpy.algos.DoubleDQN attribute)
(d3rlpy.algos.SAC attribute)
(d3rlpy.algos.TD3 attribute)
(d3rlpy.dynamics.mopo.MOPO attribute)
set_params() (d3rlpy.algos.AWAC method)
(d3rlpy.algos.AWR method)
(d3rlpy.algos.BC method)
(d3rlpy.algos.BCQ method)
(d3rlpy.algos.BEAR method)
(d3rlpy.algos.CQL method)
(d3rlpy.algos.DDPG method)
(d3rlpy.algos.DQN method)
(d3rlpy.algos.DiscreteAWR method)
(d3rlpy.algos.DiscreteBC method)
(d3rlpy.algos.DiscreteBCQ method)
(d3rlpy.algos.DiscreteCQL method)
(d3rlpy.algos.DoubleDQN method)
(d3rlpy.algos.SAC method)
(d3rlpy.algos.TD3 method)
(d3rlpy.dynamics.mopo.MOPO method)
share_encoder (d3rlpy.algos.AWAC attribute)
(d3rlpy.algos.BCQ attribute)
(d3rlpy.algos.BEAR attribute)
(d3rlpy.algos.CQL attribute)
(d3rlpy.algos.DDPG attribute)
(d3rlpy.algos.DQN attribute)
(d3rlpy.algos.DiscreteBCQ attribute)
(d3rlpy.algos.DoubleDQN attribute)
(d3rlpy.algos.SAC attribute)
(d3rlpy.algos.TD3 attribute)
shift_size (d3rlpy.augmentation.image.RandomShift attribute)
SingleAmplitudeScaling (class in d3rlpy.augmentation.vector)
size() (d3rlpy.dataset.Episode method)
(d3rlpy.dataset.MDPDataset method)
(d3rlpy.dataset.TransitionMiniBatch method)
(d3rlpy.online.buffers.ReplayBuffer method)
soft_opc_scorer() (in module d3rlpy.metrics.scorer)
StandardScaler (class in d3rlpy.preprocessing)
start_epsilon (d3rlpy.online.explorers.LinearDecayEpsilonGreedy attribute)
std (d3rlpy.online.explorers.NormalNoise attribute)
(d3rlpy.preprocessing.StandardScaler attribute)
T
target_smoothing_clip (d3rlpy.algos.TD3 attribute)
target_smoothing_sigma (d3rlpy.algos.TD3 attribute)
target_update_interval (d3rlpy.algos.DiscreteBCQ attribute)
(d3rlpy.algos.DQN attribute)
(d3rlpy.algos.DiscreteCQL attribute)
(d3rlpy.algos.DoubleDQN attribute)
tau (d3rlpy.algos.AWAC attribute)
(d3rlpy.algos.BCQ attribute)
(d3rlpy.algos.BEAR attribute)
(d3rlpy.algos.CQL attribute)
(d3rlpy.algos.DDPG attribute)
(d3rlpy.algos.SAC attribute)
(d3rlpy.algos.TD3 attribute)
TD3 (class in d3rlpy.algos)
td_error_scorer() (in module d3rlpy.metrics.scorer)
temp_learning_rate (d3rlpy.algos.BEAR attribute)
(d3rlpy.algos.CQL attribute)
(d3rlpy.algos.SAC attribute)
terminal (d3rlpy.dataset.Transition attribute)
terminals (d3rlpy.dataset.MDPDataset attribute)
(d3rlpy.dataset.TransitionMiniBatch attribute)
train() (in module d3rlpy.online.iterators)
transform() (d3rlpy.augmentation.image.ColorJitter method)
(d3rlpy.augmentation.image.Cutout method)
(d3rlpy.augmentation.image.HorizontalFlip method)
(d3rlpy.augmentation.image.Intensity method)
(d3rlpy.augmentation.image.RandomRotation method)
(d3rlpy.augmentation.image.RandomShift method)
(d3rlpy.augmentation.image.VerticalFlip method)
(d3rlpy.augmentation.vector.MultipleAmplitudeScaling method)
(d3rlpy.augmentation.vector.SingleAmplitudeScaling method)
(d3rlpy.preprocessing.MinMaxScaler method)
(d3rlpy.preprocessing.PixelScaler method)
(d3rlpy.preprocessing.StandardScaler method)
Transition (class in d3rlpy.dataset)
TransitionMiniBatch (class in d3rlpy.dataset)
transitions (d3rlpy.dataset.Episode attribute)
(d3rlpy.dataset.TransitionMiniBatch attribute)
(d3rlpy.online.buffers.ReplayBuffer attribute)
U
update() (d3rlpy.algos.AWAC method)
(d3rlpy.algos.AWR method)
(d3rlpy.algos.BC method)
(d3rlpy.algos.BCQ method)
(d3rlpy.algos.BEAR method)
(d3rlpy.algos.CQL method)
(d3rlpy.algos.DDPG method)
(d3rlpy.algos.DQN method)
(d3rlpy.algos.DiscreteAWR method)
(d3rlpy.algos.DiscreteBC method)
(d3rlpy.algos.DiscreteBCQ method)
(d3rlpy.algos.DiscreteCQL method)
(d3rlpy.algos.DoubleDQN method)
(d3rlpy.algos.SAC method)
(d3rlpy.algos.TD3 method)
(d3rlpy.dynamics.mopo.MOPO method)
update_actor_interval (d3rlpy.algos.AWAC attribute)
(d3rlpy.algos.BCQ attribute)
(d3rlpy.algos.BEAR attribute)
(d3rlpy.algos.CQL attribute)
(d3rlpy.algos.SAC attribute)
(d3rlpy.algos.TD3 attribute)
use_batch_norm (d3rlpy.algos.AWAC attribute)
(d3rlpy.algos.AWR attribute)
(d3rlpy.algos.BC attribute)
(d3rlpy.algos.BCQ attribute)
(d3rlpy.algos.BEAR attribute)
(d3rlpy.algos.CQL attribute)
(d3rlpy.algos.DDPG attribute)
(d3rlpy.algos.DQN attribute)
(d3rlpy.algos.DiscreteAWR attribute)
(d3rlpy.algos.DiscreteBC attribute)
(d3rlpy.algos.DiscreteBCQ attribute)
(d3rlpy.algos.DiscreteCQL attribute)
(d3rlpy.algos.DoubleDQN attribute)
(d3rlpy.algos.SAC attribute)
(d3rlpy.algos.TD3 attribute)
(d3rlpy.dynamics.mopo.MOPO attribute)
use_gpu (d3rlpy.algos.AWAC attribute)
(d3rlpy.algos.AWR attribute)
(d3rlpy.algos.BC attribute)
(d3rlpy.algos.BCQ attribute)
(d3rlpy.algos.BEAR attribute)
(d3rlpy.algos.CQL attribute)
(d3rlpy.algos.DDPG attribute)
(d3rlpy.algos.DQN attribute)
(d3rlpy.algos.DiscreteAWR attribute)
(d3rlpy.algos.DiscreteBC attribute)
(d3rlpy.algos.DiscreteBCQ attribute)
(d3rlpy.algos.DiscreteCQL attribute)
(d3rlpy.algos.DoubleDQN attribute)
(d3rlpy.algos.SAC attribute)
(d3rlpy.algos.TD3 attribute)
(d3rlpy.dynamics.mopo.MOPO attribute)
V
value_estimation_std_scorer() (in module d3rlpy.metrics.scorer)
VerticalFlip (class in d3rlpy.augmentation.image)
W
weight_decay (d3rlpy.dynamics.mopo.MOPO attribute)
Read the Docs
v: v0.31
Versions
latest
stable
v0.31
v0.30
v0.23
v0.22
v0.21
v0.2
v0.1
Downloads
pdf
html
epub
On Read the Docs
Project Home
Builds
Free document hosting provided by Read the Docs.