Index A | B | C | D | E | F | G | H | I | L | M | N | O | P | R | S | T | U | X | Z A action_space() (agilerl.wrappers.pettingzoo_wrappers.PettingZooVectorizationParallelWrapper method) activation_mutation() (agilerl.hpo.mutation.Mutations method) add_cnn_channel() (agilerl.networks.evolvable_cnn.EvolvableCNN method) (agilerl.wrappers.make_evolvable.MakeEvolvable method) add_cnn_layer() (agilerl.networks.evolvable_cnn.EvolvableCNN method) (agilerl.wrappers.make_evolvable.MakeEvolvable method) add_decoder_layer() (agilerl.networks.evolvable_bert.EvolvableBERT method) add_encoder_layer() (agilerl.networks.evolvable_bert.EvolvableBERT method) add_layer() (agilerl.networks.evolvable_gpt.EvolvableGPT method) add_mlp_layer() (agilerl.networks.evolvable_cnn.EvolvableCNN method) (agilerl.networks.evolvable_mlp.EvolvableMLP method) (agilerl.wrappers.make_evolvable.MakeEvolvable method) add_mlp_node() (agilerl.networks.evolvable_cnn.EvolvableCNN method) (agilerl.networks.evolvable_mlp.EvolvableMLP method) (agilerl.wrappers.make_evolvable.MakeEvolvable method) add_module() (agilerl.algorithms.ilql.ILQL method) add_node() (agilerl.networks.evolvable_bert.EvolvableBERT method) (agilerl.networks.evolvable_gpt.EvolvableGPT method) apply() (agilerl.algorithms.ilql.ILQL method) architecture_mutate() (agilerl.hpo.mutation.Mutations method) B bfloat16() (agilerl.algorithms.ilql.ILQL method) Block (class in agilerl.networks.evolvable_gpt) buffers() (agilerl.algorithms.ilql.ILQL method) C calc_max_kernel_sizes() (agilerl.networks.evolvable_cnn.EvolvableCNN method) (agilerl.wrappers.make_evolvable.MakeEvolvable method) calc_stride_size_ranges() (agilerl.networks.evolvable_cnn.EvolvableCNN method) (agilerl.wrappers.make_evolvable.MakeEvolvable method) CausalSelfAttention (class in agilerl.networks.evolvable_gpt) change_cnn_kernel() (agilerl.networks.evolvable_cnn.EvolvableCNN method) (agilerl.wrappers.make_evolvable.MakeEvolvable method) check_encoder_sparsity_fast_path() (agilerl.networks.evolvable_bert.EvolvableBERT method) check_policy_on_policy_with_probe_env() (in module agilerl.utils.probe_envs) check_policy_q_learning_with_probe_env() (in module agilerl.utils.probe_envs) (in module agilerl.utils.probe_envs_ma) check_q_learning_with_probe_env() (in module agilerl.utils.probe_envs) children() (agilerl.algorithms.ilql.ILQL method) classic_parameter_mutation() (agilerl.hpo.mutation.Mutations method) clone() (agilerl.algorithms.cqn.CQN method) (agilerl.algorithms.ddpg.DDPG method) (agilerl.algorithms.dqn.DQN method) (agilerl.algorithms.dqn_rainbow.RainbowDQN method) (agilerl.algorithms.ilql.ILQL method) (agilerl.algorithms.maddpg.MADDPG method) (agilerl.algorithms.matd3.MATD3 method) (agilerl.algorithms.neural_ts_bandit.NeuralTS method) (agilerl.algorithms.neural_ucb_bandit.NeuralUCB method) (agilerl.algorithms.ppo.PPO method) (agilerl.algorithms.td3.TD3 method) (agilerl.networks.evolvable_bert.EvolvableBERT method) (agilerl.networks.evolvable_cnn.EvolvableCNN method) (agilerl.networks.evolvable_gpt.EvolvableGPT method) (agilerl.networks.evolvable_mlp.EvolvableMLP method) (agilerl.wrappers.make_evolvable.MakeEvolvable method) close() (agilerl.wrappers.pettingzoo_wrappers.PettingZooVectorizationParallelWrapper method) configure_optimizers() (agilerl.networks.evolvable_gpt.EvolvableGPT method) ConstantRewardContActionsEnv (class in agilerl.utils.probe_envs) (class in agilerl.utils.probe_envs_ma) ConstantRewardContActionsImageEnv (class in agilerl.utils.probe_envs) (class in agilerl.utils.probe_envs_ma) ConstantRewardEnv (class in agilerl.utils.probe_envs) (class in agilerl.utils.probe_envs_ma) ConstantRewardImageEnv (class in agilerl.utils.probe_envs) (class in agilerl.utils.probe_envs_ma) count_parameters() (agilerl.networks.evolvable_bert.EvolvableBERT method) cpu() (agilerl.algorithms.ilql.ILQL method) CQN (class in agilerl.algorithms.cqn) create_cnn() (agilerl.networks.evolvable_cnn.EvolvableCNN method) (agilerl.wrappers.make_evolvable.MakeEvolvable method) create_mask() (agilerl.networks.evolvable_bert.EvolvableBERT method) create_mlp() (agilerl.networks.evolvable_cnn.EvolvableCNN method) (agilerl.networks.evolvable_mlp.EvolvableMLP method) (agilerl.wrappers.make_evolvable.MakeEvolvable method) create_net() (agilerl.networks.evolvable_gpt.EvolvableGPT method) (agilerl.networks.evolvable_mlp.EvolvableMLP method) create_nets() (agilerl.networks.evolvable_bert.EvolvableBERT method) (agilerl.networks.evolvable_cnn.EvolvableCNN method) (agilerl.wrappers.make_evolvable.MakeEvolvable method) cuda() (agilerl.algorithms.ilql.ILQL method) D DDPG (class in agilerl.algorithms.ddpg) decode() (agilerl.networks.evolvable_bert.EvolvableBERT method) detect_architecture() (agilerl.wrappers.make_evolvable.MakeEvolvable method) DiscountedRewardContActionsEnv (class in agilerl.utils.probe_envs) (class in agilerl.utils.probe_envs_ma) DiscountedRewardContActionsImageEnv (class in agilerl.utils.probe_envs) (class in agilerl.utils.probe_envs_ma) DiscountedRewardEnv (class in agilerl.utils.probe_envs) (class in agilerl.utils.probe_envs_ma) DiscountedRewardImageEnv (class in agilerl.utils.probe_envs) (class in agilerl.utils.probe_envs_ma) double() (agilerl.algorithms.ilql.ILQL method) DQN (class in agilerl.algorithms.dqn) E encode() (agilerl.networks.evolvable_bert.EvolvableBERT method) estimate_mfu() (agilerl.networks.evolvable_gpt.EvolvableGPT method) eval() (agilerl.algorithms.ilql.ILQL method) EvolvableBERT (class in agilerl.networks.evolvable_bert) EvolvableCNN (class in agilerl.networks.evolvable_cnn) EvolvableGPT (class in agilerl.networks.evolvable_gpt) EvolvableMLP (class in agilerl.networks.evolvable_mlp) extra_repr() (agilerl.algorithms.ilql.ILQL method) F FixedObsPolicyContActionsEnv (class in agilerl.utils.probe_envs) (class in agilerl.utils.probe_envs_ma) FixedObsPolicyContActionsImageEnv (class in agilerl.utils.probe_envs) (class in agilerl.utils.probe_envs_ma) FixedObsPolicyEnv (class in agilerl.utils.probe_envs) (class in agilerl.utils.probe_envs_ma) FixedObsPolicyImageEnv (class in agilerl.utils.probe_envs) (class in agilerl.utils.probe_envs_ma) float() (agilerl.algorithms.ilql.ILQL method) forward() (agilerl.algorithms.ilql.ILQL method) (agilerl.networks.custom_components.GumbelSoftmax method) (agilerl.networks.evolvable_bert.EvolvableBERT method) (agilerl.networks.evolvable_bert.PositionalEncoder method) (agilerl.networks.evolvable_bert.PositionalEncoding method) (agilerl.networks.evolvable_bert.TokenEmbedding method) (agilerl.networks.evolvable_cnn.EvolvableCNN method) (agilerl.networks.evolvable_cnn.NoisyLinear method) (agilerl.networks.evolvable_gpt.Block method) (agilerl.networks.evolvable_gpt.CausalSelfAttention method) (agilerl.networks.evolvable_gpt.EvolvableGPT method) (agilerl.networks.evolvable_gpt.LayerNorm method) (agilerl.networks.evolvable_gpt.MLP method) (agilerl.networks.evolvable_gpt.PositionalEncoding method) (agilerl.networks.evolvable_gpt.TokenEmbedding method) (agilerl.networks.evolvable_mlp.EvolvableMLP method) (agilerl.wrappers.make_evolvable.MakeEvolvable method) G generate() (agilerl.networks.evolvable_gpt.EvolvableGPT method) generate_square_subsequent_mask() (agilerl.networks.evolvable_bert.EvolvableBERT method) get_activation() (agilerl.networks.evolvable_bert.EvolvableBERT method) (agilerl.networks.evolvable_cnn.EvolvableCNN method) (agilerl.networks.evolvable_gpt.EvolvableGPT method) (agilerl.networks.evolvable_gpt.MLP method) (agilerl.networks.evolvable_mlp.EvolvableMLP method) (agilerl.wrappers.make_evolvable.MakeEvolvable method) get_algo_nets() (agilerl.hpo.mutation.Mutations method) get_buffer() (agilerl.algorithms.ilql.ILQL method) get_conv_layer() (agilerl.wrappers.make_evolvable.MakeEvolvable method) get_extra_state() (agilerl.algorithms.ilql.ILQL method) get_normalization() (agilerl.wrappers.make_evolvable.MakeEvolvable method) get_num_params() (agilerl.networks.evolvable_gpt.EvolvableGPT method) get_parameter() (agilerl.algorithms.ilql.ILQL method) get_pooling() (agilerl.wrappers.make_evolvable.MakeEvolvable method) get_submodule() (agilerl.algorithms.ilql.ILQL method) getAction() (agilerl.algorithms.cqn.CQN method) (agilerl.algorithms.ddpg.DDPG method) (agilerl.algorithms.dqn.DQN method) (agilerl.algorithms.dqn_rainbow.RainbowDQN method) (agilerl.algorithms.maddpg.MADDPG method) (agilerl.algorithms.matd3.MATD3 method) (agilerl.algorithms.neural_ts_bandit.NeuralTS method) (agilerl.algorithms.neural_ucb_bandit.NeuralUCB method) (agilerl.algorithms.ppo.PPO method) (agilerl.algorithms.td3.TD3 method) gumbel_softmax() (agilerl.networks.custom_components.GumbelSoftmax static method) GumbelSoftmax (class in agilerl.networks.custom_components) H half() (agilerl.algorithms.ilql.ILQL method) hardUpdate() (agilerl.algorithms.ilql.ILQL method) I ILQL (class in agilerl.algorithms.ilql) init_dict (agilerl.networks.evolvable_bert.EvolvableBERT property) (agilerl.networks.evolvable_cnn.EvolvableCNN property) (agilerl.networks.evolvable_gpt.EvolvableGPT property) (agilerl.networks.evolvable_mlp.EvolvableMLP property) (agilerl.wrappers.make_evolvable.MakeEvolvable property) initialPopulation() (in module agilerl.utils.utils) ipu() (agilerl.algorithms.ilql.ILQL method) L layer_init() (agilerl.wrappers.make_evolvable.MakeEvolvable method) LayerNorm (class in agilerl.networks.evolvable_gpt) learn() (agilerl.algorithms.cqn.CQN method) (agilerl.algorithms.ddpg.DDPG method) (agilerl.algorithms.dqn.DQN method) (agilerl.algorithms.dqn_rainbow.RainbowDQN method) (agilerl.algorithms.maddpg.MADDPG method) (agilerl.algorithms.matd3.MATD3 method) (agilerl.algorithms.neural_ts_bandit.NeuralTS method) (agilerl.algorithms.neural_ucb_bandit.NeuralUCB method) (agilerl.algorithms.ppo.PPO method) (agilerl.algorithms.td3.TD3 method) load() (agilerl.algorithms.cqn.CQN class method) (agilerl.algorithms.ddpg.DDPG class method) (agilerl.algorithms.dqn.DQN class method) (agilerl.algorithms.dqn_rainbow.RainbowDQN class method) (agilerl.algorithms.maddpg.MADDPG class method) (agilerl.algorithms.matd3.MATD3 class method) (agilerl.algorithms.neural_ts_bandit.NeuralTS class method) (agilerl.algorithms.neural_ucb_bandit.NeuralUCB class method) (agilerl.algorithms.ppo.PPO class method) (agilerl.algorithms.td3.TD3 class method) load_state_dict() (agilerl.algorithms.ilql.ILQL method) loadCheckpoint() (agilerl.algorithms.cqn.CQN method) (agilerl.algorithms.ddpg.DDPG method) (agilerl.algorithms.dqn.DQN method) (agilerl.algorithms.dqn_rainbow.RainbowDQN method) (agilerl.algorithms.ilql.ILQL method) (agilerl.algorithms.maddpg.MADDPG method) (agilerl.algorithms.matd3.MATD3 method) (agilerl.algorithms.neural_ts_bandit.NeuralTS method) (agilerl.algorithms.neural_ucb_bandit.NeuralUCB method) (agilerl.algorithms.ppo.PPO method) (agilerl.algorithms.td3.TD3 method) M MADDPG (class in agilerl.algorithms.maddpg) MakeEvolvable (class in agilerl.wrappers.make_evolvable) makeMultiAgentVectEnvs() (in module agilerl.utils.utils) makeSkillVectEnvs() (in module agilerl.utils.utils) makeVectEnvs() (in module agilerl.utils.utils) MATD3 (class in agilerl.algorithms.matd3) MLP (class in agilerl.networks.evolvable_gpt) modules() (agilerl.algorithms.ilql.ILQL method) MultiAgentReplayBuffer (class in agilerl.components.multi_agent_replay_buffer) MultiPolicyEnv (class in agilerl.utils.probe_envs_ma) MultiPolicyImageEnv (class in agilerl.utils.probe_envs_ma) MultiStepReplayBuffer (class in agilerl.components.replay_buffer) mutation() (agilerl.hpo.mutation.Mutations method) Mutations (class in agilerl.hpo.mutation) N named_buffers() (agilerl.algorithms.ilql.ILQL method) named_children() (agilerl.algorithms.ilql.ILQL method) named_modules() (agilerl.algorithms.ilql.ILQL method) named_parameters() (agilerl.algorithms.ilql.ILQL method) NeuralTS (class in agilerl.algorithms.neural_ts_bandit) NeuralUCB (class in agilerl.algorithms.neural_ucb_bandit) no_mutation() (agilerl.hpo.mutation.Mutations method) NoisyLinear (class in agilerl.networks.evolvable_cnn) O ObsDependentRewardContActionsEnv (class in agilerl.utils.probe_envs) (class in agilerl.utils.probe_envs_ma) ObsDependentRewardContActionsImageEnv (class in agilerl.utils.probe_envs) (class in agilerl.utils.probe_envs_ma) ObsDependentRewardEnv (class in agilerl.utils.probe_envs) (class in agilerl.utils.probe_envs_ma) ObsDependentRewardImageEnv (class in agilerl.utils.probe_envs) (class in agilerl.utils.probe_envs_ma) observation_space() (agilerl.wrappers.pettingzoo_wrappers.PettingZooVectorizationParallelWrapper method) P parameter_mutation() (agilerl.hpo.mutation.Mutations method) parameters() (agilerl.algorithms.ilql.ILQL method) PettingZooVectorizationParallelWrapper (class in agilerl.wrappers.pettingzoo_wrappers) plotPopulationScore() (in module agilerl.utils.utils) PolicyContActionsEnv (class in agilerl.utils.probe_envs) (class in agilerl.utils.probe_envs_ma) PolicyContActionsImageEnv (class in agilerl.utils.probe_envs) (class in agilerl.utils.probe_envs_ma) PolicyContActionsImageEnvSimple (class in agilerl.utils.probe_envs) PolicyEnv (class in agilerl.utils.probe_envs) (class in agilerl.utils.probe_envs_ma) PolicyImageEnv (class in agilerl.utils.probe_envs) (class in agilerl.utils.probe_envs_ma) PositionalEncoder (class in agilerl.networks.evolvable_bert) PositionalEncoding (class in agilerl.networks.evolvable_bert) (class in agilerl.networks.evolvable_gpt) PPO (class in agilerl.algorithms.ppo) prepare_state() (agilerl.algorithms.ppo.PPO method) preserve_parameters() (agilerl.networks.evolvable_bert.EvolvableBERT method) (agilerl.networks.evolvable_cnn.EvolvableCNN method) (agilerl.networks.evolvable_gpt.EvolvableGPT method) (agilerl.networks.evolvable_mlp.EvolvableMLP method) (agilerl.wrappers.make_evolvable.MakeEvolvable method) printHyperparams() (in module agilerl.utils.utils) PrioritizedReplayBuffer (class in agilerl.components.replay_buffer) R RainbowDQN (class in agilerl.algorithms.dqn_rainbow) recreate_nets() (agilerl.networks.evolvable_bert.EvolvableBERT method) (agilerl.networks.evolvable_cnn.EvolvableCNN method) (agilerl.networks.evolvable_gpt.EvolvableGPT method) (agilerl.networks.evolvable_mlp.EvolvableMLP method) (agilerl.wrappers.make_evolvable.MakeEvolvable method) recreate_shrunk_nets() (agilerl.networks.evolvable_bert.EvolvableBERT method) (agilerl.networks.evolvable_gpt.EvolvableGPT method) register_backward_hook() (agilerl.algorithms.ilql.ILQL method) register_buffer() (agilerl.algorithms.ilql.ILQL method) register_forward_hook() (agilerl.algorithms.ilql.ILQL method) register_forward_pre_hook() (agilerl.algorithms.ilql.ILQL method) register_full_backward_hook() (agilerl.algorithms.ilql.ILQL method) register_full_backward_pre_hook() (agilerl.algorithms.ilql.ILQL method) register_load_state_dict_post_hook() (agilerl.algorithms.ilql.ILQL method) register_module() (agilerl.algorithms.ilql.ILQL method) register_parameter() (agilerl.algorithms.ilql.ILQL method) register_state_dict_pre_hook() (agilerl.algorithms.ilql.ILQL method) remove_cnn_channel() (agilerl.networks.evolvable_cnn.EvolvableCNN method) (agilerl.wrappers.make_evolvable.MakeEvolvable method) remove_cnn_layer() (agilerl.networks.evolvable_cnn.EvolvableCNN method) (agilerl.wrappers.make_evolvable.MakeEvolvable method) remove_decoder_layer() (agilerl.networks.evolvable_bert.EvolvableBERT method) remove_encoder_layer() (agilerl.networks.evolvable_bert.EvolvableBERT method) remove_layer() (agilerl.networks.evolvable_gpt.EvolvableGPT method) remove_mlp_layer() (agilerl.networks.evolvable_cnn.EvolvableCNN method) (agilerl.networks.evolvable_mlp.EvolvableMLP method) (agilerl.wrappers.make_evolvable.MakeEvolvable method) remove_mlp_node() (agilerl.networks.evolvable_cnn.EvolvableCNN method) (agilerl.networks.evolvable_mlp.EvolvableMLP method) (agilerl.wrappers.make_evolvable.MakeEvolvable method) remove_node() (agilerl.networks.evolvable_bert.EvolvableBERT method) (agilerl.networks.evolvable_gpt.EvolvableGPT method) render() (agilerl.wrappers.pettingzoo_wrappers.PettingZooVectorizationParallelWrapper method) ReplayBuffer (class in agilerl.components.replay_buffer) requires_grad_() (agilerl.algorithms.ilql.ILQL method) reset() (agilerl.wrappers.pettingzoo_wrappers.PettingZooVectorizationParallelWrapper method) reset_noise() (agilerl.networks.evolvable_cnn.EvolvableCNN method) (agilerl.networks.evolvable_cnn.NoisyLinear method) (agilerl.networks.evolvable_mlp.EvolvableMLP method) (agilerl.wrappers.make_evolvable.MakeEvolvable method) reset_parameters() (agilerl.networks.evolvable_cnn.NoisyLinear method) rl_hyperparam_mutation() (agilerl.hpo.mutation.Mutations method) S sample() (agilerl.components.multi_agent_replay_buffer.MultiAgentReplayBuffer method) (agilerl.components.replay_buffer.MultiStepReplayBuffer method) (agilerl.components.replay_buffer.PrioritizedReplayBuffer method) (agilerl.components.replay_buffer.ReplayBuffer method) sample_from_indices() (agilerl.components.replay_buffer.MultiStepReplayBuffer method) (agilerl.components.replay_buffer.PrioritizedReplayBuffer method) save2memory() (agilerl.components.multi_agent_replay_buffer.MultiAgentReplayBuffer method) (agilerl.components.replay_buffer.MultiStepReplayBuffer method) (agilerl.components.replay_buffer.PrioritizedReplayBuffer method) (agilerl.components.replay_buffer.ReplayBuffer method) save2memorySingleEnv() (agilerl.components.multi_agent_replay_buffer.MultiAgentReplayBuffer method) (agilerl.components.replay_buffer.MultiStepReplayBuffer method) (agilerl.components.replay_buffer.PrioritizedReplayBuffer method) (agilerl.components.replay_buffer.ReplayBuffer method) save2memoryVectEnvs() (agilerl.components.multi_agent_replay_buffer.MultiAgentReplayBuffer method) (agilerl.components.replay_buffer.MultiStepReplayBuffer method) (agilerl.components.replay_buffer.PrioritizedReplayBuffer method) (agilerl.components.replay_buffer.ReplayBuffer method) saveCheckpoint() (agilerl.algorithms.cqn.CQN method) (agilerl.algorithms.ddpg.DDPG method) (agilerl.algorithms.dqn.DQN method) (agilerl.algorithms.dqn_rainbow.RainbowDQN method) (agilerl.algorithms.ilql.ILQL method) (agilerl.algorithms.maddpg.MADDPG method) (agilerl.algorithms.matd3.MATD3 method) (agilerl.algorithms.neural_ts_bandit.NeuralTS method) (agilerl.algorithms.neural_ucb_bandit.NeuralUCB method) (agilerl.algorithms.ppo.PPO method) (agilerl.algorithms.td3.TD3 method) scale_to_action_space() (agilerl.algorithms.ddpg.DDPG method) (agilerl.algorithms.maddpg.MADDPG method) (agilerl.algorithms.matd3.MATD3 method) (agilerl.algorithms.td3.TD3 method) select() (agilerl.hpo.tournament.TournamentSelection method) set_extra_state() (agilerl.algorithms.ilql.ILQL method) share_memory() (agilerl.algorithms.ilql.ILQL method) shrink_preserve_parameters() (agilerl.networks.evolvable_bert.EvolvableBERT method) (agilerl.networks.evolvable_cnn.EvolvableCNN method) (agilerl.networks.evolvable_gpt.EvolvableGPT method) (agilerl.networks.evolvable_mlp.EvolvableMLP method) (agilerl.wrappers.make_evolvable.MakeEvolvable method) Skill (class in agilerl.wrappers.learning) softUpdate() (agilerl.algorithms.cqn.CQN method) (agilerl.algorithms.ddpg.DDPG method) (agilerl.algorithms.dqn.DQN method) (agilerl.algorithms.dqn_rainbow.RainbowDQN method) (agilerl.algorithms.ilql.ILQL method) (agilerl.algorithms.maddpg.MADDPG method) (agilerl.algorithms.matd3.MATD3 method) (agilerl.algorithms.td3.TD3 method) state (agilerl.wrappers.pettingzoo_wrappers.PettingZooVectorizationParallelWrapper property) state_dict() (agilerl.algorithms.ilql.ILQL method) step() (agilerl.wrappers.learning.Skill method) (agilerl.wrappers.pettingzoo_wrappers.PettingZooVectorizationParallelWrapper method) T TD3 (class in agilerl.algorithms.td3) test() (agilerl.algorithms.cqn.CQN method) (agilerl.algorithms.ddpg.DDPG method) (agilerl.algorithms.dqn.DQN method) (agilerl.algorithms.dqn_rainbow.RainbowDQN method) (agilerl.algorithms.maddpg.MADDPG method) (agilerl.algorithms.matd3.MATD3 method) (agilerl.algorithms.neural_ts_bandit.NeuralTS method) (agilerl.algorithms.neural_ucb_bandit.NeuralUCB method) (agilerl.algorithms.ppo.PPO method) (agilerl.algorithms.td3.TD3 method) to() (agilerl.algorithms.ilql.ILQL method) to_empty() (agilerl.algorithms.ilql.ILQL method) TokenEmbedding (class in agilerl.networks.evolvable_bert) (class in agilerl.networks.evolvable_gpt) TournamentSelection (class in agilerl.hpo.tournament) train() (agilerl.algorithms.ilql.ILQL method) train_multi_agent() (in module agilerl.training.train_multi_agent) train_off_policy() (in module agilerl.training.train_off_policy) train_offline() (in module agilerl.training.train_offline) train_on_policy() (in module agilerl.training.train_on_policy) type() (agilerl.algorithms.ilql.ILQL method) U update_priorities() (agilerl.components.replay_buffer.PrioritizedReplayBuffer method) X xpu() (agilerl.algorithms.ilql.ILQL method) Z zero_grad() (agilerl.algorithms.ilql.ILQL method)