d3rlpy
v0.22
Tutorials
Jupyter Notebooks
References
API Reference
Installation
Other
License
d3rlpy
Docs
»
Index
Edit on GitHub
Index
_
|
A
|
B
|
C
|
D
|
E
|
F
|
G
|
H
|
I
|
L
|
M
|
N
|
O
|
P
|
Q
|
R
|
S
|
T
|
U
|
V
|
W
_
__getitem__() (d3rlpy.dataset.Episode method)
(d3rlpy.dataset.MDPDataset method)
(d3rlpy.dataset.TransitionMiniBatch method)
__iter__() (d3rlpy.dataset.Episode method)
(d3rlpy.dataset.MDPDataset method)
(d3rlpy.dataset.TransitionMiniBatch method)
__len__() (d3rlpy.dataset.Episode method)
(d3rlpy.dataset.MDPDataset method)
(d3rlpy.dataset.TransitionMiniBatch method)
(d3rlpy.online.buffers.ReplayBuffer method)
A
action (d3rlpy.dataset.Transition attribute)
action_flexibility (d3rlpy.algos.BCQ attribute)
(d3rlpy.algos.DiscreteBCQ attribute)
action_size (d3rlpy.online.buffers.ReplayBuffer attribute)
actions (d3rlpy.dataset.Episode attribute)
(d3rlpy.dataset.MDPDataset attribute)
(d3rlpy.dataset.TransitionMiniBatch attribute)
(d3rlpy.online.buffers.ReplayBuffer attribute)
actor_learning_rate (d3rlpy.algos.BCQ attribute)
(d3rlpy.algos.BEAR attribute)
(d3rlpy.algos.CQL attribute)
(d3rlpy.algos.DDPG attribute)
(d3rlpy.algos.SAC attribute)
(d3rlpy.algos.TD3 attribute)
alpha_learning_rate (d3rlpy.algos.BEAR attribute)
(d3rlpy.algos.CQL attribute)
alpha_threshold (d3rlpy.algos.BEAR attribute)
(d3rlpy.algos.CQL attribute)
append() (d3rlpy.dataset.MDPDataset method)
(d3rlpy.online.buffers.ReplayBuffer method)
augmentation (d3rlpy.algos.BC attribute)
(d3rlpy.algos.BCQ attribute)
(d3rlpy.algos.BEAR attribute)
(d3rlpy.algos.CQL attribute)
(d3rlpy.algos.DDPG attribute)
(d3rlpy.algos.DQN attribute)
(d3rlpy.algos.DiscreteBC attribute)
(d3rlpy.algos.DiscreteBCQ attribute)
(d3rlpy.algos.DiscreteCQL attribute)
(d3rlpy.algos.DoubleDQN attribute)
(d3rlpy.algos.SAC attribute)
(d3rlpy.algos.TD3 attribute)
(d3rlpy.dynamics.mopo.MOPO attribute)
average_value_estimation_scorer() (in module d3rlpy.metrics.scorer)
B
batch_size (d3rlpy.algos.BC attribute)
(d3rlpy.algos.BCQ attribute)
(d3rlpy.algos.BEAR attribute)
(d3rlpy.algos.CQL attribute)
(d3rlpy.algos.DDPG attribute)
(d3rlpy.algos.DQN attribute)
(d3rlpy.algos.DiscreteBC attribute)
(d3rlpy.algos.DiscreteBCQ attribute)
(d3rlpy.algos.DiscreteCQL attribute)
(d3rlpy.algos.DoubleDQN attribute)
(d3rlpy.algos.SAC attribute)
(d3rlpy.algos.TD3 attribute)
(d3rlpy.dynamics.mopo.MOPO attribute)
BC (class in d3rlpy.algos)
BCQ (class in d3rlpy.algos)
BEAR (class in d3rlpy.algos)
beta (d3rlpy.algos.BCQ attribute)
(d3rlpy.algos.DiscreteBC attribute)
(d3rlpy.algos.DiscreteBCQ attribute)
bootstrap (d3rlpy.algos.BCQ attribute)
(d3rlpy.algos.BEAR attribute)
(d3rlpy.algos.CQL attribute)
(d3rlpy.algos.DDPG attribute)
(d3rlpy.algos.DQN attribute)
(d3rlpy.algos.DiscreteBCQ attribute)
(d3rlpy.algos.DiscreteCQL attribute)
(d3rlpy.algos.DoubleDQN attribute)
(d3rlpy.algos.SAC attribute)
(d3rlpy.algos.TD3 attribute)
brightness (d3rlpy.augmentation.image.ColorJitter attribute)
C
clip_reward() (d3rlpy.dataset.MDPDataset method)
ColorJitter (class in d3rlpy.augmentation.image)
compare_continuous_action_diff() (in module d3rlpy.metrics.comparer)
compare_discrete_action_match() (in module d3rlpy.metrics.comparer)
compute_epsilon() (d3rlpy.online.explorers.LinearDecayEpsilonGreedy method)
compute_return() (d3rlpy.dataset.Episode method)
compute_stats() (d3rlpy.dataset.MDPDataset method)
continuous_action_diff_scorer() (in module d3rlpy.metrics.scorer)
contrast (d3rlpy.augmentation.image.ColorJitter attribute)
CQL (class in d3rlpy.algos)
create_impl() (d3rlpy.algos.BC method)
(d3rlpy.algos.BCQ method)
(d3rlpy.algos.BEAR method)
(d3rlpy.algos.CQL method)
(d3rlpy.algos.DDPG method)
(d3rlpy.algos.DQN method)
(d3rlpy.algos.DiscreteBC method)
(d3rlpy.algos.DiscreteBCQ method)
(d3rlpy.algos.DiscreteCQL method)
(d3rlpy.algos.DoubleDQN method)
(d3rlpy.algos.SAC method)
(d3rlpy.algos.TD3 method)
(d3rlpy.dynamics.mopo.MOPO method)
critic_learning_rate (d3rlpy.algos.BCQ attribute)
(d3rlpy.algos.BEAR attribute)
(d3rlpy.algos.CQL attribute)
(d3rlpy.algos.DDPG attribute)
(d3rlpy.algos.SAC attribute)
(d3rlpy.algos.TD3 attribute)
cursor (d3rlpy.online.buffers.ReplayBuffer attribute)
Cutout (class in d3rlpy.augmentation.image)
D
d3rlpy (module)
d3rlpy.algos (module)
d3rlpy.augmentation (module)
d3rlpy.dataset (module)
d3rlpy.datasets (module)
d3rlpy.dynamics (module)
d3rlpy.metrics (module)
d3rlpy.models.torch.q_functions (module)
d3rlpy.online (module)
d3rlpy.preprocessing (module)
DDPG (class in d3rlpy.algos)
degree (d3rlpy.augmentation.image.RandomRotation attribute)
discounted_sum_of_advantage_scorer() (in module d3rlpy.metrics.scorer)
discrete_action (d3rlpy.dynamics.mopo.MOPO attribute)
discrete_action_match_scorer() (in module d3rlpy.metrics.scorer)
DiscreteBC (class in d3rlpy.algos)
DiscreteBCQ (class in d3rlpy.algos)
DiscreteCQL (class in d3rlpy.algos)
DoubleDQN (class in d3rlpy.algos)
DQN (class in d3rlpy.algos)
dump() (d3rlpy.dataset.MDPDataset method)
duration (d3rlpy.online.explorers.LinearDecayEpsilonGreedy attribute)
dynamics (d3rlpy.algos.BC attribute)
(d3rlpy.algos.BCQ attribute)
(d3rlpy.algos.BEAR attribute)
(d3rlpy.algos.CQL attribute)
(d3rlpy.algos.DDPG attribute)
(d3rlpy.algos.DQN attribute)
(d3rlpy.algos.DiscreteBC attribute)
(d3rlpy.algos.DiscreteBCQ attribute)
(d3rlpy.algos.DiscreteCQL attribute)
(d3rlpy.algos.DoubleDQN attribute)
(d3rlpy.algos.SAC attribute)
(d3rlpy.algos.TD3 attribute)
dynamics_observation_prediction_error_scorer() (in module d3rlpy.metrics.scorer)
dynamics_prediction_variance_scorer() (in module d3rlpy.metrics.scorer)
dynamics_reward_prediction_error_scorer() (in module d3rlpy.metrics.scorer)
E
encoder_params (d3rlpy.algos.BC attribute)
(d3rlpy.algos.BCQ attribute)
(d3rlpy.algos.BEAR attribute)
(d3rlpy.algos.CQL attribute)
(d3rlpy.algos.DDPG attribute)
(d3rlpy.algos.DQN attribute)
(d3rlpy.algos.DiscreteBC attribute)
(d3rlpy.algos.DiscreteBCQ attribute)
(d3rlpy.algos.DiscreteCQL attribute)
(d3rlpy.algos.DoubleDQN attribute)
(d3rlpy.algos.SAC attribute)
(d3rlpy.algos.TD3 attribute)
end_epsilon (d3rlpy.online.explorers.LinearDecayEpsilonGreedy attribute)
Episode (class in d3rlpy.dataset)
episodes (d3rlpy.dataset.MDPDataset attribute)
eps (d3rlpy.algos.BC attribute)
(d3rlpy.algos.BCQ attribute)
(d3rlpy.algos.BEAR attribute)
(d3rlpy.algos.CQL attribute)
(d3rlpy.algos.DDPG attribute)
(d3rlpy.algos.DQN attribute)
(d3rlpy.algos.DiscreteBC attribute)
(d3rlpy.algos.DiscreteBCQ attribute)
(d3rlpy.algos.DiscreteCQL attribute)
(d3rlpy.algos.DoubleDQN attribute)
(d3rlpy.algos.SAC attribute)
(d3rlpy.algos.TD3 attribute)
(d3rlpy.dynamics.mopo.MOPO attribute)
evaluate_on_environment() (in module d3rlpy.metrics.scorer)
F
fit() (d3rlpy.algos.BC method)
(d3rlpy.algos.BCQ method)
(d3rlpy.algos.BEAR method)
(d3rlpy.algos.CQL method)
(d3rlpy.algos.DDPG method)
(d3rlpy.algos.DQN method)
(d3rlpy.algos.DiscreteBC method)
(d3rlpy.algos.DiscreteBCQ method)
(d3rlpy.algos.DiscreteCQL method)
(d3rlpy.algos.DoubleDQN method)
(d3rlpy.algos.SAC method)
(d3rlpy.algos.TD3 method)
(d3rlpy.dynamics.mopo.MOPO method)
(d3rlpy.preprocessing.MinMaxScaler method)
(d3rlpy.preprocessing.PixelScaler method)
(d3rlpy.preprocessing.StandardScaler method)
from_json() (d3rlpy.algos.BC class method)
(d3rlpy.algos.BCQ class method)
(d3rlpy.algos.BEAR class method)
(d3rlpy.algos.CQL class method)
(d3rlpy.algos.DDPG class method)
(d3rlpy.algos.DQN class method)
(d3rlpy.algos.DiscreteBC class method)
(d3rlpy.algos.DiscreteBCQ class method)
(d3rlpy.algos.DiscreteCQL class method)
(d3rlpy.algos.DoubleDQN class method)
(d3rlpy.algos.SAC class method)
(d3rlpy.algos.TD3 class method)
(d3rlpy.dynamics.mopo.MOPO class method)
G
gamma (d3rlpy.algos.BCQ attribute)
(d3rlpy.algos.BEAR attribute)
(d3rlpy.algos.CQL attribute)
(d3rlpy.algos.DDPG attribute)
(d3rlpy.algos.DQN attribute)
(d3rlpy.algos.DiscreteBCQ attribute)
(d3rlpy.algos.DiscreteCQL attribute)
(d3rlpy.algos.DoubleDQN attribute)
(d3rlpy.algos.SAC attribute)
(d3rlpy.algos.TD3 attribute)
generate() (d3rlpy.dynamics.mopo.MOPO method)
get_action_size() (d3rlpy.dataset.Episode method)
(d3rlpy.dataset.MDPDataset method)
(d3rlpy.dataset.Transition method)
get_atari() (in module d3rlpy.datasets)
get_cartpole() (in module d3rlpy.datasets)
get_observation_shape() (d3rlpy.dataset.Episode method)
(d3rlpy.dataset.MDPDataset method)
(d3rlpy.dataset.Transition method)
get_params() (d3rlpy.algos.BC method)
(d3rlpy.algos.BCQ method)
(d3rlpy.algos.BEAR method)
(d3rlpy.algos.CQL method)
(d3rlpy.algos.DDPG method)
(d3rlpy.algos.DQN method)
(d3rlpy.algos.DiscreteBC method)
(d3rlpy.algos.DiscreteBCQ method)
(d3rlpy.algos.DiscreteCQL method)
(d3rlpy.algos.DoubleDQN method)
(d3rlpy.algos.SAC method)
(d3rlpy.algos.TD3 method)
(d3rlpy.augmentation.image.ColorJitter method)
(d3rlpy.augmentation.image.Cutout method)
(d3rlpy.augmentation.image.HorizontalFlip method)
(d3rlpy.augmentation.image.Intensity method)
(d3rlpy.augmentation.image.RandomRotation method)
(d3rlpy.augmentation.image.RandomShift method)
(d3rlpy.augmentation.image.VerticalFlip method)
(d3rlpy.augmentation.vector.MultipleAmplitudeScaling method)
(d3rlpy.augmentation.vector.SingleAmplitudeScaling method)
(d3rlpy.dynamics.mopo.MOPO method)
(d3rlpy.preprocessing.MinMaxScaler method)
(d3rlpy.preprocessing.PixelScaler method)
(d3rlpy.preprocessing.StandardScaler method)
get_pendulum() (in module d3rlpy.datasets)
get_pybullet() (in module d3rlpy.datasets)
get_type() (d3rlpy.augmentation.image.ColorJitter method)
(d3rlpy.augmentation.image.Cutout method)
(d3rlpy.augmentation.image.HorizontalFlip method)
(d3rlpy.augmentation.image.Intensity method)
(d3rlpy.augmentation.image.RandomRotation method)
(d3rlpy.augmentation.image.RandomShift method)
(d3rlpy.augmentation.image.VerticalFlip method)
(d3rlpy.augmentation.vector.MultipleAmplitudeScaling method)
(d3rlpy.augmentation.vector.SingleAmplitudeScaling method)
(d3rlpy.preprocessing.MinMaxScaler method)
(d3rlpy.preprocessing.PixelScaler method)
(d3rlpy.preprocessing.StandardScaler method)
H
horizon (d3rlpy.dynamics.mopo.MOPO attribute)
HorizontalFlip (class in d3rlpy.augmentation.image)
hue (d3rlpy.augmentation.image.ColorJitter attribute)
I
imitator_learning_rate (d3rlpy.algos.BCQ attribute)
(d3rlpy.algos.BEAR attribute)
impl (d3rlpy.algos.BC attribute)
(d3rlpy.algos.BCQ attribute)
(d3rlpy.algos.BEAR attribute)
(d3rlpy.algos.CQL attribute)
(d3rlpy.algos.DDPG attribute)
(d3rlpy.algos.DQN attribute)
(d3rlpy.algos.DiscreteBC attribute)
(d3rlpy.algos.DiscreteBCQ attribute)
(d3rlpy.algos.DiscreteCQL attribute)
(d3rlpy.algos.DoubleDQN attribute)
(d3rlpy.algos.SAC attribute)
(d3rlpy.algos.TD3 attribute)
(d3rlpy.dynamics.mopo.MOPO attribute)
initial_alpha (d3rlpy.algos.BEAR attribute)
(d3rlpy.algos.CQL attribute)
initial_temperature (d3rlpy.algos.BEAR attribute)
(d3rlpy.algos.CQL attribute)
(d3rlpy.algos.SAC attribute)
Intensity (class in d3rlpy.augmentation.image)
is_action_discrete() (d3rlpy.dataset.MDPDataset method)
L
lam (d3rlpy.algos.BCQ attribute)
(d3rlpy.algos.BEAR attribute)
(d3rlpy.dynamics.mopo.MOPO attribute)
latent_size (d3rlpy.algos.BCQ attribute)
learning_rate (d3rlpy.algos.BC attribute)
(d3rlpy.algos.DQN attribute)
(d3rlpy.algos.DiscreteBC attribute)
(d3rlpy.algos.DiscreteBCQ attribute)
(d3rlpy.algos.DiscreteCQL attribute)
(d3rlpy.algos.DoubleDQN attribute)
(d3rlpy.dynamics.mopo.MOPO attribute)
LinearDecayEpsilonGreedy (class in d3rlpy.online.explorers)
load() (d3rlpy.dataset.MDPDataset class method)
load_model() (d3rlpy.algos.BC method)
(d3rlpy.algos.BCQ method)
(d3rlpy.algos.BEAR method)
(d3rlpy.algos.CQL method)
(d3rlpy.algos.DDPG method)
(d3rlpy.algos.DQN method)
(d3rlpy.algos.DiscreteBC method)
(d3rlpy.algos.DiscreteBCQ method)
(d3rlpy.algos.DiscreteCQL method)
(d3rlpy.algos.DoubleDQN method)
(d3rlpy.algos.SAC method)
(d3rlpy.algos.TD3 method)
(d3rlpy.dynamics.mopo.MOPO method)
M
maximum (d3rlpy.augmentation.vector.MultipleAmplitudeScaling attribute)
(d3rlpy.augmentation.vector.SingleAmplitudeScaling attribute)
(d3rlpy.preprocessing.MinMaxScaler attribute)
maxlen (d3rlpy.online.buffers.ReplayBuffer attribute)
MDPDataset (class in d3rlpy.dataset)
mean (d3rlpy.online.explorers.NormalNoise attribute)
(d3rlpy.preprocessing.StandardScaler attribute)
minimum (d3rlpy.augmentation.vector.MultipleAmplitudeScaling attribute)
(d3rlpy.augmentation.vector.SingleAmplitudeScaling attribute)
(d3rlpy.preprocessing.MinMaxScaler attribute)
MinMaxScaler (class in d3rlpy.preprocessing)
mmd_sigma (d3rlpy.algos.BEAR attribute)
MOPO (class in d3rlpy.dynamics.mopo)
MultipleAmplitudeScaling (class in d3rlpy.augmentation.vector)
N
n_action_samples (d3rlpy.algos.BCQ attribute)
(d3rlpy.algos.BEAR attribute)
(d3rlpy.algos.CQL attribute)
n_augmentations (d3rlpy.algos.BC attribute)
(d3rlpy.algos.BCQ attribute)
(d3rlpy.algos.BEAR attribute)
(d3rlpy.algos.CQL attribute)
(d3rlpy.algos.DDPG attribute)
(d3rlpy.algos.DQN attribute)
(d3rlpy.algos.DiscreteBC attribute)
(d3rlpy.algos.DiscreteBCQ attribute)
(d3rlpy.algos.DiscreteCQL attribute)
(d3rlpy.algos.DoubleDQN attribute)
(d3rlpy.algos.SAC attribute)
(d3rlpy.algos.TD3 attribute)
n_critics (d3rlpy.algos.BCQ attribute)
(d3rlpy.algos.BEAR attribute)
(d3rlpy.algos.CQL attribute)
(d3rlpy.algos.DDPG attribute)
(d3rlpy.algos.DQN attribute)
(d3rlpy.algos.DiscreteBCQ attribute)
(d3rlpy.algos.DiscreteCQL attribute)
(d3rlpy.algos.DoubleDQN attribute)
(d3rlpy.algos.SAC attribute)
(d3rlpy.algos.TD3 attribute)
n_ensembles (d3rlpy.dynamics.mopo.MOPO attribute)
n_epochs (d3rlpy.algos.BC attribute)
(d3rlpy.algos.BCQ attribute)
(d3rlpy.algos.BEAR attribute)
(d3rlpy.algos.CQL attribute)
(d3rlpy.algos.DDPG attribute)
(d3rlpy.algos.DQN attribute)
(d3rlpy.algos.DiscreteBC attribute)
(d3rlpy.algos.DiscreteBCQ attribute)
(d3rlpy.algos.DiscreteCQL attribute)
(d3rlpy.algos.DoubleDQN attribute)
(d3rlpy.algos.SAC attribute)
(d3rlpy.algos.TD3 attribute)
(d3rlpy.dynamics.mopo.MOPO attribute)
n_transitions (d3rlpy.dynamics.mopo.MOPO attribute)
next_action (d3rlpy.dataset.Transition attribute)
next_actions (d3rlpy.dataset.TransitionMiniBatch attribute)
next_observation (d3rlpy.dataset.Transition attribute)
next_observations (d3rlpy.dataset.TransitionMiniBatch attribute)
next_reward (d3rlpy.dataset.Transition attribute)
next_rewards (d3rlpy.dataset.TransitionMiniBatch attribute)
NormalNoise (class in d3rlpy.online.explorers)
O
observation (d3rlpy.dataset.Transition attribute)
observation_shape (d3rlpy.online.buffers.ReplayBuffer attribute)
observations (d3rlpy.dataset.Episode attribute)
(d3rlpy.dataset.MDPDataset attribute)
(d3rlpy.dataset.TransitionMiniBatch attribute)
(d3rlpy.online.buffers.ReplayBuffer attribute)
P
PixelScaler (class in d3rlpy.preprocessing)
predict() (d3rlpy.algos.BC method)
(d3rlpy.algos.BCQ method)
(d3rlpy.algos.BEAR method)
(d3rlpy.algos.CQL method)
(d3rlpy.algos.DDPG method)
(d3rlpy.algos.DQN method)
(d3rlpy.algos.DiscreteBC method)
(d3rlpy.algos.DiscreteBCQ method)
(d3rlpy.algos.DiscreteCQL method)
(d3rlpy.algos.DoubleDQN method)
(d3rlpy.algos.SAC method)
(d3rlpy.algos.TD3 method)
(d3rlpy.dynamics.mopo.MOPO method)
predict_value() (d3rlpy.algos.BC method)
(d3rlpy.algos.BCQ method)
(d3rlpy.algos.BEAR method)
(d3rlpy.algos.CQL method)
(d3rlpy.algos.DDPG method)
(d3rlpy.algos.DQN method)
(d3rlpy.algos.DiscreteBC method)
(d3rlpy.algos.DiscreteBCQ method)
(d3rlpy.algos.DiscreteCQL method)
(d3rlpy.algos.DoubleDQN method)
(d3rlpy.algos.SAC method)
(d3rlpy.algos.TD3 method)
probability (d3rlpy.augmentation.image.Cutout attribute)
(d3rlpy.augmentation.image.HorizontalFlip attribute)
(d3rlpy.augmentation.image.VerticalFlip attribute)
Q
q_func_type (d3rlpy.algos.BCQ attribute)
(d3rlpy.algos.BEAR attribute)
(d3rlpy.algos.CQL attribute)
(d3rlpy.algos.DDPG attribute)
(d3rlpy.algos.DQN attribute)
(d3rlpy.algos.DiscreteBCQ attribute)
(d3rlpy.algos.DiscreteCQL attribute)
(d3rlpy.algos.DoubleDQN attribute)
(d3rlpy.algos.SAC attribute)
(d3rlpy.algos.TD3 attribute)
R
RandomRotation (class in d3rlpy.augmentation.image)
RandomShift (class in d3rlpy.augmentation.image)
reguralizing_rate (d3rlpy.algos.DDPG attribute)
(d3rlpy.algos.TD3 attribute)
ReplayBuffer (class in d3rlpy.online.buffers)
reverse_transform() (d3rlpy.preprocessing.MinMaxScaler method)
(d3rlpy.preprocessing.PixelScaler method)
(d3rlpy.preprocessing.StandardScaler method)
reward (d3rlpy.dataset.Transition attribute)
rewards (d3rlpy.dataset.Episode attribute)
(d3rlpy.dataset.MDPDataset attribute)
(d3rlpy.dataset.TransitionMiniBatch attribute)
(d3rlpy.online.buffers.ReplayBuffer attribute)
rl_start_epoch (d3rlpy.algos.BCQ attribute)
(d3rlpy.algos.BEAR attribute)
S
SAC (class in d3rlpy.algos)
sample() (d3rlpy.online.buffers.ReplayBuffer method)
(d3rlpy.online.explorers.LinearDecayEpsilonGreedy method)
(d3rlpy.online.explorers.NormalNoise method)
sample_action() (d3rlpy.algos.BC method)
(d3rlpy.algos.BCQ method)
(d3rlpy.algos.BEAR method)
(d3rlpy.algos.CQL method)
(d3rlpy.algos.DDPG method)
(d3rlpy.algos.DQN method)
(d3rlpy.algos.DiscreteBC method)
(d3rlpy.algos.DiscreteBCQ method)
(d3rlpy.algos.DiscreteCQL method)
(d3rlpy.algos.DoubleDQN method)
(d3rlpy.algos.SAC method)
(d3rlpy.algos.TD3 method)
saturation (d3rlpy.augmentation.image.ColorJitter attribute)
save_model() (d3rlpy.algos.BC method)
(d3rlpy.algos.BCQ method)
(d3rlpy.algos.BEAR method)
(d3rlpy.algos.CQL method)
(d3rlpy.algos.DDPG method)
(d3rlpy.algos.DQN method)
(d3rlpy.algos.DiscreteBC method)
(d3rlpy.algos.DiscreteBCQ method)
(d3rlpy.algos.DiscreteCQL method)
(d3rlpy.algos.DoubleDQN method)
(d3rlpy.algos.SAC method)
(d3rlpy.algos.TD3 method)
(d3rlpy.dynamics.mopo.MOPO method)
save_policy() (d3rlpy.algos.BC method)
(d3rlpy.algos.BCQ method)
(d3rlpy.algos.BEAR method)
(d3rlpy.algos.CQL method)
(d3rlpy.algos.DDPG method)
(d3rlpy.algos.DQN method)
(d3rlpy.algos.DiscreteBC method)
(d3rlpy.algos.DiscreteBCQ method)
(d3rlpy.algos.DiscreteCQL method)
(d3rlpy.algos.DoubleDQN method)
(d3rlpy.algos.SAC method)
(d3rlpy.algos.TD3 method)
scale (d3rlpy.augmentation.image.Intensity attribute)
scaler (d3rlpy.algos.BC attribute)
(d3rlpy.algos.BCQ attribute)
(d3rlpy.algos.BEAR attribute)
(d3rlpy.algos.CQL attribute)
(d3rlpy.algos.DDPG attribute)
(d3rlpy.algos.DQN attribute)
(d3rlpy.algos.DiscreteBC attribute)
(d3rlpy.algos.DiscreteBCQ attribute)
(d3rlpy.algos.DiscreteCQL attribute)
(d3rlpy.algos.DoubleDQN attribute)
(d3rlpy.algos.SAC attribute)
(d3rlpy.algos.TD3 attribute)
(d3rlpy.dynamics.mopo.MOPO attribute)
set_params() (d3rlpy.algos.BC method)
(d3rlpy.algos.BCQ method)
(d3rlpy.algos.BEAR method)
(d3rlpy.algos.CQL method)
(d3rlpy.algos.DDPG method)
(d3rlpy.algos.DQN method)
(d3rlpy.algos.DiscreteBC method)
(d3rlpy.algos.DiscreteBCQ method)
(d3rlpy.algos.DiscreteCQL method)
(d3rlpy.algos.DoubleDQN method)
(d3rlpy.algos.SAC method)
(d3rlpy.algos.TD3 method)
(d3rlpy.dynamics.mopo.MOPO method)
share_encoder (d3rlpy.algos.BCQ attribute)
(d3rlpy.algos.BEAR attribute)
(d3rlpy.algos.CQL attribute)
(d3rlpy.algos.DDPG attribute)
(d3rlpy.algos.DQN attribute)
(d3rlpy.algos.DiscreteBCQ attribute)
(d3rlpy.algos.DoubleDQN attribute)
(d3rlpy.algos.SAC attribute)
(d3rlpy.algos.TD3 attribute)
shift_size (d3rlpy.augmentation.image.RandomShift attribute)
SingleAmplitudeScaling (class in d3rlpy.augmentation.vector)
size() (d3rlpy.dataset.Episode method)
(d3rlpy.dataset.MDPDataset method)
(d3rlpy.dataset.TransitionMiniBatch method)
(d3rlpy.online.buffers.ReplayBuffer method)
StandardScaler (class in d3rlpy.preprocessing)
start_epsilon (d3rlpy.online.explorers.LinearDecayEpsilonGreedy attribute)
std (d3rlpy.online.explorers.NormalNoise attribute)
(d3rlpy.preprocessing.StandardScaler attribute)
T
target_smoothing_clip (d3rlpy.algos.TD3 attribute)
target_smoothing_sigma (d3rlpy.algos.TD3 attribute)
target_update_interval (d3rlpy.algos.DiscreteBCQ attribute)
(d3rlpy.algos.DQN attribute)
(d3rlpy.algos.DiscreteCQL attribute)
(d3rlpy.algos.DoubleDQN attribute)
tau (d3rlpy.algos.BCQ attribute)
(d3rlpy.algos.BEAR attribute)
(d3rlpy.algos.CQL attribute)
(d3rlpy.algos.DDPG attribute)
(d3rlpy.algos.SAC attribute)
(d3rlpy.algos.TD3 attribute)
TD3 (class in d3rlpy.algos)
td_error_scorer() (in module d3rlpy.metrics.scorer)
temp_learning_rate (d3rlpy.algos.BEAR attribute)
(d3rlpy.algos.CQL attribute)
(d3rlpy.algos.SAC attribute)
terminal (d3rlpy.dataset.Transition attribute)
terminals (d3rlpy.dataset.MDPDataset attribute)
(d3rlpy.dataset.TransitionMiniBatch attribute)
(d3rlpy.online.buffers.ReplayBuffer attribute)
train() (in module d3rlpy.online.iterators)
transform() (d3rlpy.augmentation.image.ColorJitter method)
(d3rlpy.augmentation.image.Cutout method)
(d3rlpy.augmentation.image.HorizontalFlip method)
(d3rlpy.augmentation.image.Intensity method)
(d3rlpy.augmentation.image.RandomRotation method)
(d3rlpy.augmentation.image.RandomShift method)
(d3rlpy.augmentation.image.VerticalFlip method)
(d3rlpy.augmentation.vector.MultipleAmplitudeScaling method)
(d3rlpy.augmentation.vector.SingleAmplitudeScaling method)
(d3rlpy.preprocessing.MinMaxScaler method)
(d3rlpy.preprocessing.PixelScaler method)
(d3rlpy.preprocessing.StandardScaler method)
Transition (class in d3rlpy.dataset)
TransitionMiniBatch (class in d3rlpy.dataset)
transitions (d3rlpy.dataset.Episode attribute)
(d3rlpy.dataset.TransitionMiniBatch attribute)
U
update() (d3rlpy.algos.BC method)
(d3rlpy.algos.BCQ method)
(d3rlpy.algos.BEAR method)
(d3rlpy.algos.CQL method)
(d3rlpy.algos.DDPG method)
(d3rlpy.algos.DQN method)
(d3rlpy.algos.DiscreteBC method)
(d3rlpy.algos.DiscreteBCQ method)
(d3rlpy.algos.DiscreteCQL method)
(d3rlpy.algos.DoubleDQN method)
(d3rlpy.algos.SAC method)
(d3rlpy.algos.TD3 method)
(d3rlpy.dynamics.mopo.MOPO method)
update_actor_interval (d3rlpy.algos.BCQ attribute)
(d3rlpy.algos.BEAR attribute)
(d3rlpy.algos.CQL attribute)
(d3rlpy.algos.SAC attribute)
(d3rlpy.algos.TD3 attribute)
use_batch_norm (d3rlpy.algos.BC attribute)
(d3rlpy.algos.BCQ attribute)
(d3rlpy.algos.BEAR attribute)
(d3rlpy.algos.CQL attribute)
(d3rlpy.algos.DDPG attribute)
(d3rlpy.algos.DQN attribute)
(d3rlpy.algos.DiscreteBC attribute)
(d3rlpy.algos.DiscreteBCQ attribute)
(d3rlpy.algos.DiscreteCQL attribute)
(d3rlpy.algos.DoubleDQN attribute)
(d3rlpy.algos.SAC attribute)
(d3rlpy.algos.TD3 attribute)
(d3rlpy.dynamics.mopo.MOPO attribute)
use_gpu (d3rlpy.algos.BC attribute)
(d3rlpy.algos.BCQ attribute)
(d3rlpy.algos.BEAR attribute)
(d3rlpy.algos.CQL attribute)
(d3rlpy.algos.DDPG attribute)
(d3rlpy.algos.DQN attribute)
(d3rlpy.algos.DiscreteBC attribute)
(d3rlpy.algos.DiscreteBCQ attribute)
(d3rlpy.algos.DiscreteCQL attribute)
(d3rlpy.algos.DoubleDQN attribute)
(d3rlpy.algos.SAC attribute)
(d3rlpy.algos.TD3 attribute)
(d3rlpy.dynamics.mopo.MOPO attribute)
V
value_estimation_std_scorer() (in module d3rlpy.metrics.scorer)
VerticalFlip (class in d3rlpy.augmentation.image)
W
weight_decay (d3rlpy.dynamics.mopo.MOPO attribute)
Read the Docs
v: v0.22
Versions
latest
stable
v0.22
v0.21
v0.2
v0.1
Downloads
pdf
html
epub
On Read the Docs
Project Home
Builds
Free document hosting provided by
Read the Docs
.