Index _ | A | B | C | D | E | F | G | H | I | K | L | M | N | O | P | Q | R | S | T | U | V | W _ __init() (objectrl.nets.layers.bayesian_layers.CLTLinearDet method) __init__() (objectrl.agents.base_agent.Agent method) (objectrl.loggers.logger.Logger method) (objectrl.models.basic.ac.ActorCritic method) (objectrl.models.basic.actor.Actor method) (objectrl.models.basic.critic.Critic method) (objectrl.models.basic.critic.CriticEnsemble method) (objectrl.models.basic.ensemble.Ensemble method) (objectrl.models.basic.loss.DSACLoss method) (objectrl.models.basic.loss.PACBayesLoss method) (objectrl.models.basic.loss.ProbabilisticLoss method) (objectrl.models.ddpg.DDPGActor method) (objectrl.models.ddpg.DDPGCritic method) (objectrl.models.ddpg.DeepDeterministicPolicyGradient method) (objectrl.models.ddpg.OrnsteinUhlenbeckNoise method) (objectrl.models.drnd.DRND method) (objectrl.models.drnd.DRNDActor method) (objectrl.models.drnd.DRNDBonus method) (objectrl.models.drnd.DRNDCritics method) (objectrl.models.dsac.DistributionalSoftActorCritic method) (objectrl.models.dsac.DSACActor method) (objectrl.models.dsac.DSACCritic method) (objectrl.models.oac.GaussianNoise method) (objectrl.models.oac.OACActor method) (objectrl.models.oac.OACCritic method) (objectrl.models.oac.OptimisticActorCritic method) (objectrl.models.oac.OptimisticNoise method) (objectrl.models.pbac.PACBayesianAC method) (objectrl.models.pbac.PBACActor method) (objectrl.models.pbac.PBACCritic method) (objectrl.models.ppo.PPOActor method) (objectrl.models.ppo.PPOActorNetProbabilistic method) (objectrl.models.ppo.PPOCritic method) (objectrl.models.ppo.ProximalPolicyOptimization method) (objectrl.models.redq.RandomizedEnsembledDoubleQLearning method) (objectrl.models.redq.REDQCritic method) (objectrl.models.sac.SACActor method) (objectrl.models.sac.SACCritic method) (objectrl.models.sac.SoftActorCritic method) (objectrl.models.td3.TD3Actor method) (objectrl.models.td3.TD3Critic method) (objectrl.models.td3.TwinDelayedDeepDeterministicPolicyGradient method) (objectrl.nets.actor_nets.ActorNet method) (objectrl.nets.actor_nets.ActorNetProbabilistic method) (objectrl.nets.critic_nets.BNNCriticNet method) (objectrl.nets.critic_nets.CriticNet method) (objectrl.nets.critic_nets.CriticNetProbabilistic method) (objectrl.nets.critic_nets.DQNNet method) (objectrl.nets.critic_nets.EMstyle method) (objectrl.nets.critic_nets.QuantileCriticNet method) (objectrl.nets.critic_nets.ValueNet method) (objectrl.nets.layers.bayesian_layers.BayesianLinear method) (objectrl.nets.layers.bayesian_layers.CLTLinear method) (objectrl.nets.layers.heads.CategoricalHead method) (objectrl.nets.layers.heads.DeterministicHead method) (objectrl.nets.layers.heads.GaussianHead method) (objectrl.nets.layers.heads.SquashedGaussianHead method) (objectrl.replay_buffers.experience_memory.ReplayBuffer method) (objectrl.utils.custom_act.CReLU method) (objectrl.utils.environment.dmc_wrappers.DMCEnv method) (objectrl.utils.environment.metaworld_wrappers.SparsifyRewardWrapper method) (objectrl.utils.environment.noisy_wrappers.NoisyActionWrapper method) (objectrl.utils.environment.noisy_wrappers.NoisyObservationWrapper method) (objectrl.utils.environment.reward_wrappers.PositionDelayWrapper method) (objectrl.utils.harvest_utils.Harvester method) (objectrl.utils.net_utils.BayesianMLP method) (objectrl.utils.net_utils.FeatureExtractor method) (objectrl.utils.net_utils.MLP method) _abc_impl (objectrl.agents.base_agent.Agent attribute) _agent_name (objectrl.models.basic.ac.ActorCritic attribute) (objectrl.models.ddpg.DeepDeterministicPolicyGradient attribute) (objectrl.models.drnd.DRND attribute) (objectrl.models.drnd.DRNDCritics attribute) (objectrl.models.dsac.DistributionalSoftActorCritic attribute) (objectrl.models.oac.OptimisticActorCritic attribute) (objectrl.models.pbac.PACBayesianAC attribute) (objectrl.models.ppo.ProximalPolicyOptimization attribute) (objectrl.models.redq.RandomizedEnsembledDoubleQLearning attribute) (objectrl.models.sac.SoftActorCritic attribute) (objectrl.models.td3.TwinDelayedDeepDeterministicPolicyGradient attribute) _apply_reduction() (objectrl.models.basic.loss.ProbabilisticLoss method) _gamma (objectrl.agents.base_agent.Agent attribute) (objectrl.models.basic.actor.Actor attribute) (objectrl.models.basic.critic.Critic attribute) (objectrl.models.basic.critic.CriticEnsemble attribute) (objectrl.models.drnd.DRNDCritics attribute) (objectrl.models.sac.SACCritic attribute) _get_all_members() (objectrl.models.basic.ensemble.Ensemble method) _get_single_critic() (objectrl.models.basic.critic.CriticEnsemble method) _get_single_member() (objectrl.models.basic.ensemble.Ensemble method) _get_storage() (objectrl.replay_buffers.experience_memory.ReplayBuffer method) _kappa (objectrl.models.basic.loss.DSACLoss attribute) _manual_reset (objectrl.nets.layers.bayesian_layers.BayesianLinear attribute) (objectrl.nets.layers.bayesian_layers.BBBLinear attribute) _map (objectrl.nets.layers.bayesian_layers.BayesianLinear attribute) _n (objectrl.nets.layers.heads.GaussianHead attribute) _plot_eval_curve() (objectrl.loggers.logger.Logger method) _plot_model_metrics() (objectrl.utils.harvest_utils.Harvester method) _prepare_input() (objectrl.models.basic.critic.Critic static method) _reset (objectrl.models.basic.actor.Actor attribute) (objectrl.models.basic.critic.CriticEnsemble attribute) _tau (objectrl.agents.base_agent.Agent attribute) (objectrl.models.basic.actor.Actor attribute) (objectrl.models.basic.critic.Critic attribute) (objectrl.models.basic.critic.CriticEnsemble attribute) A act (objectrl.nets.layers.bayesian_layers.CLTLinear attribute) act() (objectrl.models.basic.actor.Actor method) (objectrl.models.ddpg.DDPGActor method) (objectrl.models.pbac.PBACActor method) (objectrl.models.td3.TD3Actor method) act_target() (objectrl.models.basic.actor.Actor method) (objectrl.models.td3.TD3Actor method) action_limit_high (objectrl.models.td3.TD3Actor attribute) action_limit_low (objectrl.models.td3.TD3Actor attribute) action_space (objectrl.utils.environment.dmc_wrappers.DMCEnv attribute) Actor (class in objectrl.models.basic.actor) actor (objectrl.models.basic.ac.ActorCritic attribute) ActorCritic (class in objectrl.models.basic.ac) ActorNet (class in objectrl.nets.actor_nets) ActorNetProbabilistic (class in objectrl.nets.actor_nets) add() (objectrl.replay_buffers.experience_memory.ReplayBuffer method) add_batch() (objectrl.replay_buffers.experience_memory.ReplayBuffer method) add_noise() (objectrl.models.oac.GaussianNoise method) Agent (class in objectrl.agents.base_agent) B B2() (objectrl.models.drnd.DRNDBonus method) base_model (objectrl.models.basic.ensemble.Ensemble attribute) BayesianLinear (class in objectrl.nets.layers.bayesian_layers) BayesianMLP (class in objectrl.utils.net_utils) BBBLinear (class in objectrl.nets.layers.bayesian_layers) beta_ub (objectrl.models.oac.OptimisticNoise attribute) bias_mu (objectrl.nets.layers.bayesian_layers.BayesianLinear attribute) (objectrl.nets.layers.bayesian_layers.BBBLinear attribute) (objectrl.nets.layers.bayesian_layers.CLTLinearDet attribute) (objectrl.nets.layers.bayesian_layers.LRLinear attribute) bias_rho (objectrl.nets.layers.bayesian_layers.BayesianLinear attribute) (objectrl.nets.layers.bayesian_layers.BBBLinear attribute) (objectrl.nets.layers.bayesian_layers.CLTLinearDet attribute) (objectrl.nets.layers.bayesian_layers.LRLinear attribute) BNNCriticNet (class in objectrl.nets.critic_nets) bonus() (objectrl.models.drnd.DRNDBonus method) bonus_conf (objectrl.models.drnd.DRNDBonus attribute) buffers (objectrl.models.basic.ensemble.Ensemble attribute) C calculate_GAE_estimates() (objectrl.models.ppo.ProximalPolicyOptimization method) calculate_num_batches() (objectrl.replay_buffers.experience_memory.ReplayBuffer method) CategoricalHead (class in objectrl.nets.layers.heads) CLTLinear (class in objectrl.nets.layers.bayesian_layers) CLTLinearDet (class in objectrl.nets.layers.bayesian_layers) collect_results() (objectrl.utils.harvest_utils.Harvester method) compute() (objectrl.models.oac.OptimisticNoise method) config (objectrl.agents.base_agent.Agent attribute) (objectrl.models.basic.actor.Actor attribute) (objectrl.models.basic.critic.CriticEnsemble attribute) (objectrl.utils.harvest_utils.Harvester attribute) config_env (objectrl.agents.base_agent.Agent attribute) config_train (objectrl.agents.base_agent.Agent attribute) create_epoch_iterator() (objectrl.replay_buffers.experience_memory.ReplayBuffer method) create_logger() (objectrl.loggers.logger.Logger method) create_loss() (in module objectrl.utils.net_utils) create_optimizer() (in module objectrl.utils.net_utils) CReLU (class in objectrl.utils.custom_act) crelu_moments() (objectrl.nets.layers.bayesian_layers.CLTLinear static method) Critic (class in objectrl.models.basic.critic) critic (objectrl.models.basic.ac.ActorCritic attribute) critical() (objectrl.loggers.logger.Logger method) CriticEnsemble (class in objectrl.models.basic.critic) CriticNet (class in objectrl.nets.critic_nets) CriticNetProbabilistic (class in objectrl.nets.critic_nets) ctrl_w (objectrl.utils.environment.reward_wrappers.PositionDelayWrapper attribute) curves (objectrl.utils.harvest_utils.Harvester attribute) D DDPGActor (class in objectrl.models.ddpg) DDPGCritic (class in objectrl.models.ddpg) DeepDeterministicPolicyGradient (class in objectrl.models.ddpg) delta (objectrl.models.oac.OptimisticNoise attribute) DeterministicHead (class in objectrl.nets.layers.heads) device (objectrl.agents.base_agent.Agent attribute) (objectrl.models.basic.actor.Actor attribute) (objectrl.models.basic.critic.Critic attribute) (objectrl.models.basic.critic.CriticEnsemble attribute) (objectrl.models.basic.ensemble.Ensemble attribute) (objectrl.models.drnd.DRNDBonus attribute) dim_act (objectrl.agents.base_agent.Agent attribute) (objectrl.models.basic.actor.Actor attribute) (objectrl.models.basic.critic.CriticEnsemble attribute) dim_check() (in module objectrl.utils.utils) dim_state (objectrl.agents.base_agent.Agent attribute) (objectrl.models.basic.actor.Actor attribute) (objectrl.models.basic.critic.CriticEnsemble attribute) DistributionalSoftActorCritic (class in objectrl.models.dsac) dmc_spec2gym_space() (in module objectrl.utils.environment.dmc_wrappers) DMCEnv (class in objectrl.utils.environment.dmc_wrappers) domain_name (objectrl.utils.environment.dmc_wrappers.DMCEnv attribute) DQNNet (class in objectrl.nets.critic_nets) DRND (class in objectrl.models.drnd) DRNDActor (class in objectrl.models.drnd) DRNDBonus (class in objectrl.models.drnd) DRNDCritics (class in objectrl.models.drnd) DSACActor (class in objectrl.models.dsac) DSACCritic (class in objectrl.models.dsac) DSACLoss (class in objectrl.models.basic.loss) E EMstyle (class in objectrl.nets.critic_nets) Ensemble (class in objectrl.models.basic.ensemble) env (objectrl.utils.environment.noisy_wrappers.NoisyActionWrapper attribute) (objectrl.utils.environment.noisy_wrappers.NoisyObservationWrapper attribute) (objectrl.utils.environment.reward_wrappers.PositionDelayWrapper attribute) episode_summary() (objectrl.loggers.logger.Logger method) eval_results (objectrl.loggers.logger.Logger attribute) evolve_state() (objectrl.models.ddpg.OrnsteinUhlenbeckNoise method) expand() (objectrl.models.basic.ensemble.Ensemble method) experience_memory (objectrl.agents.base_agent.Agent attribute) F FeatureExtractor (class in objectrl.utils.net_utils) format_model_name() (objectrl.utils.harvest_utils.Harvester method) forward() (objectrl.models.basic.ensemble.Ensemble method) (objectrl.models.basic.loss.DSACLoss method) (objectrl.models.basic.loss.PACBayesLoss method) (objectrl.models.basic.loss.ProbabilisticLoss method) (objectrl.models.ppo.PPOActorNetProbabilistic method) (objectrl.nets.actor_nets.ActorNet method) (objectrl.nets.actor_nets.ActorNetProbabilistic method) (objectrl.nets.critic_nets.BNNCriticNet method) (objectrl.nets.critic_nets.CriticNet method) (objectrl.nets.critic_nets.CriticNetProbabilistic method) (objectrl.nets.critic_nets.DQNNet method) (objectrl.nets.critic_nets.EMstyle method) (objectrl.nets.critic_nets.QuantileCriticNet method) (objectrl.nets.layers.bayesian_layers.BayesianLinear method) (objectrl.nets.layers.bayesian_layers.BBBLinear method) (objectrl.nets.layers.bayesian_layers.CLTLinear method) (objectrl.nets.layers.bayesian_layers.CLTLinearDet method) (objectrl.nets.layers.bayesian_layers.LRLinear method) (objectrl.nets.layers.heads.CategoricalHead method) (objectrl.nets.layers.heads.DeterministicHead method) (objectrl.nets.layers.heads.GaussianHead method) (objectrl.nets.layers.heads.SquashedGaussianHead method) (objectrl.utils.custom_act.CReLU method) (objectrl.utils.net_utils.BayesianMLP method) (objectrl.utils.net_utils.FeatureExtractor method) (objectrl.utils.net_utils.MLP method) forward_model (objectrl.models.basic.ensemble.Ensemble attribute) G gamma (objectrl.models.ddpg.DDPGCritic attribute) GaussianHead (class in objectrl.nets.layers.heads) GaussianNoise (class in objectrl.models.oac) generate_transition() (objectrl.agents.base_agent.Agent method) (objectrl.models.ppo.ProximalPolicyOptimization method) get_bellman_target() (objectrl.models.basic.critic.CriticEnsemble method) (objectrl.models.ddpg.DDPGCritic method) (objectrl.models.drnd.DRNDCritics method) (objectrl.models.dsac.DSACCritic method) (objectrl.models.oac.OACCritic method) (objectrl.models.pbac.PBACCritic method) (objectrl.models.ppo.PPOCritic method) (objectrl.models.sac.SACCritic method) (objectrl.models.td3.TD3Critic method) get_kl() (objectrl.utils.net_utils.BayesianMLP method) get_manual_reset() (objectrl.nets.layers.bayesian_layers.BayesianLinear method) get_next_batch() (objectrl.replay_buffers.experience_memory.ReplayBuffer method) get_result_file_path() (objectrl.utils.harvest_utils.Harvester method) get_steps_and_iterator() (objectrl.replay_buffers.experience_memory.ReplayBuffer method) get_tau() (objectrl.models.dsac.DSACCritic method) H harvest() (objectrl.utils.harvest_utils.Harvester method) Harvester (class in objectrl.utils.harvest_utils) has_target (objectrl.models.basic.actor.Actor attribute) (objectrl.models.basic.critic.Critic attribute) (objectrl.models.basic.critic.CriticEnsemble attribute) I idx_active_critic (objectrl.models.ddpg.DDPGActor attribute) in_features (objectrl.nets.layers.bayesian_layers.BayesianLinear attribute) (objectrl.nets.layers.bayesian_layers.BBBLinear attribute) (objectrl.nets.layers.bayesian_layers.CLTLinearDet attribute) (objectrl.nets.layers.bayesian_layers.LRLinear attribute) init_target() (objectrl.models.basic.actor.Actor method) (objectrl.models.basic.critic.Critic method) initialize_data_stores() (objectrl.utils.harvest_utils.Harvester method) interaction_iter (objectrl.models.ddpg.DDPGActor attribute) inv_softplus() (objectrl.nets.layers.bayesian_layers.BayesianLinear static method) IQM_reward_calculator() (objectrl.loggers.logger.Logger static method) is_episode_end (objectrl.models.ddpg.DDPGActor attribute) is_input (objectrl.nets.layers.bayesian_layers.CLTLinear attribute) is_output (objectrl.nets.layers.bayesian_layers.CLTLinear attribute) iter (objectrl.models.basic.actor.Actor attribute) (objectrl.models.basic.critic.CriticEnsemble attribute) K KL() (objectrl.nets.layers.bayesian_layers.BayesianLinear method) (objectrl.nets.layers.bayesian_layers.CLTLinearDet method) L lambda_actor (objectrl.models.drnd.DRNDActor attribute) lambda_critic (objectrl.models.drnd.DRNDCritics attribute) learn() (objectrl.agents.base_agent.Agent method) (objectrl.models.basic.ac.ActorCritic method) (objectrl.models.drnd.DRND method) (objectrl.models.ppo.ProximalPolicyOptimization method) learnable_alpha (objectrl.models.dsac.DSACActor attribute) load() (objectrl.agents.base_agent.Agent method) (objectrl.replay_buffers.experience_memory.ReplayBuffer method) log() (objectrl.loggers.logger.Logger method) log_alpha (objectrl.models.sac.SACActor attribute) Logger (class in objectrl.loggers.logger) logger (objectrl.agents.base_agent.Agent attribute) (objectrl.loggers.logger.Logger attribute) loss (objectrl.models.basic.critic.CriticEnsemble attribute) (objectrl.models.ddpg.DDPGCritic attribute) loss() (objectrl.models.basic.actor.Actor method) (objectrl.models.ddpg.DDPGActor method) (objectrl.models.drnd.DRNDActor method) (objectrl.models.dsac.DSACActor method) (objectrl.models.oac.OACActor method) (objectrl.models.ppo.PPOActor method) (objectrl.models.sac.SACActor method) (objectrl.models.td3.TD3Actor method) LRLinear (class in objectrl.nets.layers.bayesian_layers) M make_env() (in module objectrl.utils.make_env) map() (objectrl.nets.critic_nets.BNNCriticNet method) (objectrl.nets.layers.bayesian_layers.BayesianLinear method) mean() (objectrl.nets.layers.bayesian_layers.BayesianLinear method) metrics (objectrl.utils.harvest_utils.Harvester attribute) MLP (class in objectrl.utils.net_utils) model (objectrl.models.basic.actor.Actor attribute) (objectrl.models.basic.critic.Critic attribute), [1] model_ensemble (objectrl.models.basic.critic.CriticEnsemble attribute) mu() (objectrl.models.drnd.DRNDBonus method) N n_iter (objectrl.models.basic.ac.ActorCritic attribute) n_members (objectrl.models.basic.critic.CriticEnsemble attribute) (objectrl.models.basic.ensemble.Ensemble attribute) (objectrl.models.drnd.DRNDBonus attribute) neg_relu_moments() (objectrl.nets.layers.bayesian_layers.CLTLinear static method) noise_act (objectrl.utils.environment.noisy_wrappers.NoisyActionWrapper attribute) noise_clamp (objectrl.models.oac.GaussianNoise attribute) noise_obs (objectrl.utils.environment.noisy_wrappers.NoisyObservationWrapper attribute) NoisyActionWrapper (class in objectrl.utils.environment.noisy_wrappers) NoisyObservationWrapper (class in objectrl.utils.environment.noisy_wrappers) normal_cdf() (objectrl.nets.layers.bayesian_layers.CLTLinear static method) normal_pdf() (objectrl.nets.layers.bayesian_layers.CLTLinear static method) num_quantiles (objectrl.models.dsac.DSACCritic attribute) O OACActor (class in objectrl.models.oac) OACCritic (class in objectrl.models.oac) observation() (objectrl.utils.environment.noisy_wrappers.NoisyObservationWrapper method) observation_space (objectrl.utils.environment.dmc_wrappers.DMCEnv attribute) optim (objectrl.models.basic.actor.Actor attribute) (objectrl.models.basic.critic.CriticEnsemble attribute) optim_alpha (objectrl.models.sac.SACActor attribute) optim_pred (objectrl.models.drnd.DRNDBonus attribute) optimist_noise (objectrl.models.oac.OACActor attribute) OptimisticActorCritic (class in objectrl.models.oac) OptimisticNoise (class in objectrl.models.oac) OrnsteinUhlenbeckNoise (class in objectrl.models.ddpg) out_features (objectrl.nets.layers.bayesian_layers.BayesianLinear attribute) (objectrl.nets.layers.bayesian_layers.BBBLinear attribute) (objectrl.nets.layers.bayesian_layers.CLTLinearDet attribute) (objectrl.nets.layers.bayesian_layers.LRLinear attribute) P PACBayesianAC (class in objectrl.models.pbac) PACBayesLoss (class in objectrl.models.basic.loss) params (objectrl.models.basic.ensemble.Ensemble attribute) path (objectrl.loggers.logger.Logger attribute) PBACActor (class in objectrl.models.pbac) PBACCritic (class in objectrl.models.pbac) plot_results() (objectrl.utils.harvest_utils.Harvester method) plot_rewards() (objectrl.loggers.logger.Logger method) policy_delay (objectrl.models.basic.ac.ActorCritic attribute) policy_noise (objectrl.models.td3.TD3Actor attribute) position_delay (objectrl.utils.environment.reward_wrappers.PositionDelayWrapper attribute) PositionDelayWrapper (class in objectrl.utils.environment.reward_wrappers) PPOActor (class in objectrl.models.ppo) PPOActorNetProbabilistic (class in objectrl.models.ppo) PPOCritic (class in objectrl.models.ppo) predictor (objectrl.models.drnd.DRNDBonus attribute) prior_mean (objectrl.nets.layers.bayesian_layers.BayesianLinear attribute) (objectrl.nets.layers.bayesian_layers.BBBLinear attribute) (objectrl.nets.layers.bayesian_layers.CLTLinearDet attribute) (objectrl.nets.layers.bayesian_layers.LRLinear attribute) prior_std (objectrl.nets.layers.bayesian_layers.BayesianLinear attribute) (objectrl.nets.layers.bayesian_layers.BBBLinear attribute) (objectrl.nets.layers.bayesian_layers.CLTLinearDet attribute) (objectrl.nets.layers.bayesian_layers.LRLinear attribute) ProbabilisticLoss (class in objectrl.models.basic.loss) prototype (objectrl.models.basic.ensemble.Ensemble attribute) ProximalPolicyOptimization (class in objectrl.models.ppo) Q Q() (objectrl.models.basic.critic.Critic method) (objectrl.models.basic.critic.CriticEnsemble method) (objectrl.models.dsac.DSACCritic method) Q_t() (objectrl.models.basic.critic.Critic method) (objectrl.models.basic.critic.CriticEnsemble method) (objectrl.models.dsac.DSACCritic method) (objectrl.models.pbac.PBACCritic method) QuantileCriticNet (class in objectrl.nets.critic_nets) R RandomizedEnsembledDoubleQLearning (class in objectrl.models.redq) REDQCritic (class in objectrl.models.redq) reduce() (objectrl.models.basic.critic.Critic method) (objectrl.models.basic.critic.CriticEnsemble method) (objectrl.models.redq.REDQCritic method) reduction (objectrl.models.basic.loss.ProbabilisticLoss attribute) relu_moments() (objectrl.nets.layers.bayesian_layers.CLTLinear static method) render() (objectrl.utils.environment.dmc_wrappers.DMCEnv method) ReplayBuffer (class in objectrl.replay_buffers.experience_memory) requires_discrete_actions() (objectrl.agents.base_agent.Agent method) reset() (objectrl.agents.base_agent.Agent method) (objectrl.models.basic.ac.ActorCritic method) (objectrl.models.basic.actor.Actor method) (objectrl.models.basic.critic.CriticEnsemble method) (objectrl.models.ddpg.OrnsteinUhlenbeckNoise method) (objectrl.models.drnd.DRNDBonus method) (objectrl.replay_buffers.experience_memory.ReplayBuffer method) (objectrl.utils.environment.dmc_wrappers.DMCEnv method) reset_parameters() (objectrl.nets.layers.bayesian_layers.BayesianLinear method) reset_randomness() (objectrl.nets.layers.bayesian_layers.BayesianLinear method) (objectrl.nets.layers.bayesian_layers.CLTLinear method) results (objectrl.utils.harvest_utils.Harvester attribute) reward() (objectrl.utils.environment.reward_wrappers.PositionDelayWrapper method) S SACActor (class in objectrl.models.sac) SACCritic (class in objectrl.models.sac) sample() (objectrl.models.ddpg.OrnsteinUhlenbeckNoise method) sample_all() (objectrl.replay_buffers.experience_memory.ReplayBuffer method) sample_batch() (objectrl.replay_buffers.experience_memory.ReplayBuffer method) sample_by_index() (objectrl.replay_buffers.experience_memory.ReplayBuffer method) sample_by_index_fields() (objectrl.replay_buffers.experience_memory.ReplayBuffer method) sample_random() (objectrl.replay_buffers.experience_memory.ReplayBuffer method) sampling_rate (objectrl.models.ddpg.DDPGActor attribute) save() (objectrl.agents.base_agent.Agent method) (objectrl.loggers.logger.Logger method) (objectrl.replay_buffers.experience_memory.ReplayBuffer method) save_eval_results() (objectrl.loggers.logger.Logger method) select_action() (objectrl.agents.base_agent.Agent method) (objectrl.models.basic.ac.ActorCritic method) (objectrl.models.oac.OptimisticActorCritic method) sequential (objectrl.models.basic.ensemble.Ensemble attribute) set_episode_status() (objectrl.models.pbac.PBACActor method) set_manual_reset() (objectrl.nets.layers.bayesian_layers.BayesianLinear method) sigma_target (objectrl.models.oac.GaussianNoise attribute) size (objectrl.replay_buffers.experience_memory.ReplayBuffer property) smooth_curve() (objectrl.utils.harvest_utils.Harvester method) SoftActorCritic (class in objectrl.models.sac) softplus() (objectrl.nets.layers.bayesian_layers.BayesianLinear static method) SparsifyRewardWrapper (class in objectrl.utils.environment.metaworld_wrappers) SquashedGaussianHead (class in objectrl.nets.layers.heads) std() (objectrl.nets.layers.bayesian_layers.BayesianLinear method) (objectrl.nets.layers.bayesian_layers.CLTLinearDet method) step() (objectrl.utils.environment.dmc_wrappers.DMCEnv method) (objectrl.utils.environment.metaworld_wrappers.SparsifyRewardWrapper method) (objectrl.utils.environment.noisy_wrappers.NoisyActionWrapper method) (objectrl.utils.environment.reward_wrappers.PositionDelayWrapper method) store_transition() (objectrl.agents.base_agent.Agent method) (objectrl.models.ddpg.DeepDeterministicPolicyGradient method) (objectrl.models.pbac.PACBayesianAC method) T target (objectrl.models.basic.actor.Actor attribute) (objectrl.models.basic.critic.Critic attribute), [1] target_ensemble (objectrl.models.basic.critic.CriticEnsemble attribute) (objectrl.models.drnd.DRNDBonus attribute) target_entropy (objectrl.models.sac.SACActor attribute) target_policy_noise (objectrl.models.td3.TD3Actor attribute) target_policy_noise_clip (objectrl.models.td3.TD3Actor attribute) task_name (objectrl.utils.environment.dmc_wrappers.DMCEnv attribute) tau_type (objectrl.models.dsac.DSACCritic attribute) TD3Actor (class in objectrl.models.td3) TD3Critic (class in objectrl.models.td3) toint() (in module objectrl.utils.utils) tonumpy() (in module objectrl.utils.utils) totorch() (in module objectrl.utils.utils) TwinDelayedDeepDeterministicPolicyGradient (class in objectrl.models.td3) U update() (objectrl.models.basic.actor.Actor method) (objectrl.models.basic.critic.CriticEnsemble method) (objectrl.models.drnd.DRNDActor method) (objectrl.models.dsac.DSACCritic method) (objectrl.models.pbac.PBACCritic method) (objectrl.models.ppo.PPOActor method) (objectrl.models.ppo.PPOCritic method) (objectrl.models.sac.SACActor method) update_alpha() (objectrl.models.dsac.DSACActor method) (objectrl.models.sac.SACActor method) update_predictor() (objectrl.models.drnd.DRNDBonus method) update_prior() (objectrl.nets.layers.bayesian_layers.BayesianLinear method) update_target() (objectrl.models.basic.actor.Actor method) (objectrl.models.basic.critic.Critic method) (objectrl.models.basic.critic.CriticEnsemble method) use_softplus (objectrl.nets.layers.bayesian_layers.BayesianLinear attribute) (objectrl.nets.layers.bayesian_layers.BBBLinear attribute) (objectrl.nets.layers.bayesian_layers.CLTLinearDet attribute) (objectrl.nets.layers.bayesian_layers.LRLinear attribute) V ValueNet (class in objectrl.nets.critic_nets) var() (objectrl.nets.layers.bayesian_layers.BayesianLinear method) vec_asymmetric_huber_loss_weighted() (objectrl.models.basic.loss.DSACLoss method) verbose (objectrl.models.basic.actor.Actor attribute) W weight_mu (objectrl.nets.layers.bayesian_layers.BayesianLinear attribute) (objectrl.nets.layers.bayesian_layers.BBBLinear attribute) (objectrl.nets.layers.bayesian_layers.CLTLinearDet attribute) (objectrl.nets.layers.bayesian_layers.LRLinear attribute) weight_rho (objectrl.nets.layers.bayesian_layers.BayesianLinear attribute) (objectrl.nets.layers.bayesian_layers.BBBLinear attribute) (objectrl.nets.layers.bayesian_layers.CLTLinearDet attribute) (objectrl.nets.layers.bayesian_layers.LRLinear attribute)