Index A | B | C | D | E | F | G | H | I | J | K | L | M | N | O | P | Q | R | S | T | U | V | W | Z A A2CAgent (class in evorl.algorithms.a2c) A2CNetworkParams (class in evorl.algorithms.a2c) A2CWorkflow (class in evorl.algorithms.a2c) (class in evorl.algorithms.contrib.a2c_v2) AbstractReplayBuffer (class in evorl.replay_buffers) (class in evorl.replay_buffers.replay_buffer) AbstractWorkflow (class in evorl.workflows.workflow) Action (in module evorl.types) action_fn (evorl.evaluators.episode_collector.EpisodeCollector attribute) (evorl.evaluators.EpisodeCollector attribute) (evorl.evaluators.Evaluator attribute) (evorl.evaluators.evaluator.Evaluator attribute) action_postprocessor_state (evorl.agent.AgentState attribute) action_size (evorl.algorithms.td7.TD7Actor attribute) action_space (evorl.envs.brax.BraxAdapter property) (evorl.envs.env.Env property) (evorl.envs.envpool.EnvPoolGymAdapter property) (evorl.envs.gymnasium.GymnasiumAdapter property) (evorl.envs.gymnax.GymnaxAdapter property) (evorl.envs.jaxmarl.JaxMARLAdapter property) (evorl.envs.jumanji.JumanjiAdapter property) (evorl.envs.mujoco_playground.MjxEnvAdapter property) (evorl.envs.wrappers.action_wrapper.ActionSquashWrapper property) (evorl.envs.wrappers.ActionSquashWrapper property) (evorl.envs.wrappers.Wrapper property) (evorl.envs.wrappers.wrapper.Wrapper property) ActionPostprocessorParams (in module evorl.types) ActionRepeatWrapper (class in evorl.envs.wrappers) (class in evorl.envs.wrappers.action_wrapper) actions (evorl.sample_batch.SampleBatch attribute) ActionSquashWrapper (class in evorl.envs.wrappers) (class in evorl.envs.wrappers.action_wrapper) activation (evorl.networks.linear.MLP attribute) (evorl.networks.linear.SNMLP attribute) (evorl.networks.MLP attribute) (evorl.networks.SNMLP attribute) activation_final (evorl.networks.linear.MLP attribute) (evorl.networks.linear.SNMLP attribute) (evorl.networks.MLP attribute) (evorl.networks.SNMLP attribute) ActivationFn (in module evorl.networks.linear) actor_loss (evorl.algorithms.contrib.td3_v3.TD3TrainMetric attribute) (evorl.algorithms.ddpg.DDPGTrainMetric attribute) (evorl.algorithms.sac.SACTrainMetric attribute) (evorl.algorithms.td3.TD3TrainMetric attribute) (evorl.algorithms.td7.TD7TrainMetric attribute) actor_loss() (evorl.algorithms.ddpg.DDPGAgent method) (evorl.algorithms.sac.SACAgent method) (evorl.algorithms.sac.SACDiscreteAgent method) (evorl.algorithms.td3.TD3Agent method) (evorl.algorithms.td7.TD7Agent method) actor_network (evorl.algorithms.contrib.td3_v3.TD3Agent attribute) (evorl.algorithms.ddpg.DDPGAgent attribute) (evorl.algorithms.sac.SACAgent attribute) (evorl.algorithms.sac.SACDiscreteAgent attribute) (evorl.algorithms.td3.TD3Agent attribute) (evorl.algorithms.td7.TD7Agent attribute) actor_params (evorl.algorithms.contrib.td3_v3.TD3NetworkParams attribute) (evorl.algorithms.ddpg.DDPGNetworkParams attribute) (evorl.algorithms.sac.SACNetworkParams attribute) (evorl.algorithms.td3.TD3NetworkParams attribute) (evorl.algorithms.td7.TD7NetworkParams attribute) add() (evorl.replay_buffers.AbstractReplayBuffer method) (evorl.replay_buffers.prioritized_replay_buffer.PrioritizedReplayBuffer method) (evorl.replay_buffers.PrioritizedReplayBuffer method) (evorl.replay_buffers.replay_buffer.AbstractReplayBuffer method) (evorl.replay_buffers.replay_buffer.ReplayBuffer method) (evorl.replay_buffers.ReplayBuffer method) add_prefix() (in module evorl.recorders) (in module evorl.recorders.wandb_recorder) add_recorder() (evorl.recorders.ChainRecorder method) (evorl.recorders.recorder.ChainRecorder method) add_recorders() (evorl.workflows.Workflow method) (evorl.workflows.workflow.Workflow method) adv_mode (evorl.algorithms.impala.IMPALAAgent attribute) Agent (class in evorl.agent) agent_gradient_update() (in module evorl.distributed) (in module evorl.distributed.gradients) AgentActionFn (class in evorl.agent) AgentID (in module evorl.types) agents (evorl.envs.jaxmarl.JaxMARLAdapter property) AgentState (class in evorl.agent) AgentStateAxis (in module evorl.agent) algo_state (evorl.ec.optimizers.evox_wrapper.EvoXAlgoState attribute) algorithm (evorl.ec.optimizers.evox_wrapper.EvoXAlgorithmAdapter attribute) all_gather() (in module evorl.distributed) (in module evorl.distributed.comm) all_reduce() (evorl.metrics.MetricBase method) all_steps() (evorl.utils.orbax_utils.DummyCheckpointManager method) alpha (evorl.replay_buffers.prioritized_replay_buffer.PrioritizedReplayBuffer attribute) (evorl.replay_buffers.PrioritizedReplayBuffer attribute) alpha_loss (evorl.algorithms.sac.SACTrainMetric attribute) alpha_loss() (evorl.algorithms.sac.SACAgent method) (evorl.algorithms.sac.SACDiscreteAgent method) apply_hyperparams_to_workflow_state() (evorl.algorithms.meta.pbt.PBTWorkflow method) (evorl.algorithms.meta.pbt_openes.pbt_param_openes.PBTParamOpenESWorkflow method) (evorl.algorithms.meta.pbt_ppo.pbt_param_ppo.PBTParamPPOWorkflow method) (evorl.algorithms.meta.pbt_sac.pbt_param_sac.PBTParamSACWorkflow method) (evorl.algorithms.meta.pbt_workflow.PBTWorkflowBase method) approximate_kl() (in module evorl.utils.rl_toolkits) Array (in module evorl.networks.spectral_norm) ARS (class in evorl.ec.optimizers) (class in evorl.ec.optimizers.ars) ARSState (class in evorl.ec.optimizers.ars) ARSWorkflow (class in evorl.algorithms.contrib.ars_linear) (class in evorl.algorithms.ec.so.ars) ask() (evorl.algorithms.meta.pbt_openes.param_openes.OpenES method) (evorl.ec.evox_algorithm.cmaes.CMAES method) (evorl.ec.evox_algorithm.cmaes.SepCMAES method) (evorl.ec.evox_algorithm.cso.CSO method) (evorl.ec.evox_algorithm.openes.OpenES method) (evorl.ec.optimizers.ARS method) (evorl.ec.optimizers.ars.ARS method) (evorl.ec.optimizers.cem.SepCEM method) (evorl.ec.optimizers.ec_optimizer.EvoOptimizer method) (evorl.ec.optimizers.erl_ga.ERLGA method) (evorl.ec.optimizers.ERLGA method) (evorl.ec.optimizers.EvoOptimizer method) (evorl.ec.optimizers.evox_wrapper.EvoXAlgorithmAdapter method) (evorl.ec.optimizers.OpenES method) (evorl.ec.optimizers.openes.OpenES method) (evorl.ec.optimizers.openes.OpenESNoiseTable method) (evorl.ec.optimizers.OpenESNoiseTable method) (evorl.ec.optimizers.SepCEM method) (evorl.ec.optimizers.vanilla_es.VanillaES method) (evorl.ec.optimizers.vanilla_ga.VanillaGA method) (evorl.ec.optimizers.VanillaES method) (evorl.ec.optimizers.VanillaGA method) AutoresetMode (class in evorl.envs.wrappers.training_wrapper) average_episode_discount_return() (in module evorl.utils.rl_toolkits) avg_l1_norm() (in module evorl.algorithms.td7) Axis (in module evorl.types) B batchify() (in module evorl.utils.ma_utils) best_objective (evorl.metrics.ECWorkflowMetric attribute) best_step() (evorl.utils.orbax_utils.DummyCheckpointManager method) bias_init (evorl.networks.spectral_norm.SNDense attribute) Box (class in evorl.envs.space) BraxAdapter (class in evorl.envs.brax) BraxEvaluator (class in evorl.evaluators) (class in evorl.evaluators.mo_brax_evaluator) buffer_size (evorl.replay_buffers.replay_buffer.ReplayBufferState attribute) (evorl.replay_buffers.ReplayBufferState attribute) build_cemrl_rl_update_fn() (in module evorl.algorithms.erl.cemrl_td3.cemrl_td3_workflow) build_erl_rl_update_fn() (in module evorl.algorithms.erl.erl_td3.erl_td3_workflow) build_from_config() (evorl.algorithms.contrib.pop_ppo.PopPPOWorkflow class method) (evorl.algorithms.contrib.pop_td3.PopTD3Workflow class method) (evorl.algorithms.erl.cemrl_workflow.CEMRLWorkflowBase class method) (evorl.algorithms.erl.erl_workflow.ERLWorkflowBase class method) (evorl.algorithms.meta.pbt_workflow.PBTWorkflowBase class method) (evorl.workflows.ec_workflow.ECWorkflow class method) (evorl.workflows.ECWorkflow class method) (evorl.workflows.rl_workflow.RLWorkflow class method) (evorl.workflows.RLWorkflow class method) (evorl.workflows.Workflow class method) (evorl.workflows.workflow.Workflow class method) build_rl_update_fn() (in module evorl.algorithms.contrib.pop_episodic_td3) (in module evorl.algorithms.contrib.td3_onpolicy) (in module evorl.algorithms.erl.erl_td3.erl_eda) C can_sample() (evorl.replay_buffers.AbstractReplayBuffer method) (evorl.replay_buffers.replay_buffer.AbstractReplayBuffer method) (evorl.replay_buffers.replay_buffer.ReplayBuffer method) (evorl.replay_buffers.ReplayBuffer method) capacity (evorl.replay_buffers.replay_buffer.ReplayBuffer attribute) (evorl.replay_buffers.ReplayBuffer attribute) cemrl_replace_td3_actor_params() (in module evorl.algorithms.erl.cemrl_td3.cemrl_td3_workflow) CEMRLOpenESWorkflow (class in evorl.algorithms.erl.cemrl_td3.cemrl_openes) CEMRLTD3WorkflowTemplate (class in evorl.algorithms.erl.cemrl_td3.cemrl_td3_workflow) CEMRLTrainMetric (class in evorl.algorithms.erl.cemrl_td3.cemrl_origin) (class in evorl.algorithms.erl.cemrl_workflow) CEMRLWorkflow (class in evorl.algorithms.erl.cemrl_td3.cemrl) (class in evorl.algorithms.erl.cemrl_td3.cemrl_origin) CEMRLWorkflowBase (class in evorl.algorithms.erl.cemrl_workflow) ChainRecorder (class in evorl.recorders) (class in evorl.recorders.recorder) check_for_errors() (evorl.utils.orbax_utils.DummyCheckpointManager method) checkpoint_actor_params (evorl.algorithms.td7.TD7NetworkParams attribute) checkpoint_encoder_params (evorl.algorithms.td7.TD7NetworkParams attribute) CheckpointManager (class in evorl.utils.orbax_utils) clean_trajectory() (in module evorl.algorithms.offpolicy_utils) clip_c_threshold (evorl.algorithms.impala.IMPALAAgent attribute) clip_epsilon (evorl.algorithms.ppo.PPOAgent attribute) clip_pg_rho_threshold (evorl.algorithms.impala.IMPALAAgent attribute) clip_policy_noise (evorl.algorithms.contrib.td3_v3.TD3Agent attribute) (evorl.algorithms.td3.TD3Agent attribute) (evorl.algorithms.td7.TD7Agent attribute) clip_rho_threshold (evorl.algorithms.impala.IMPALAAgent attribute) close() (evorl.recorders.ChainRecorder method) (evorl.recorders.log_recorder.LogRecorder method) (evorl.recorders.LogRecorder method) (evorl.recorders.Recorder method) (evorl.recorders.recorder.ChainRecorder method) (evorl.recorders.recorder.Recorder method) (evorl.recorders.wandb_recorder.WandbRecorder method) (evorl.recorders.WandbRecorder method) (evorl.utils.orbax_utils.DummyCheckpointManager method) (evorl.workflows.Workflow method) (evorl.workflows.workflow.Workflow method) CMAES (class in evorl.ec.evox_algorithm.cmaes) CMAESWorkflow (class in evorl.algorithms.ec.so.cmaes) compute_actions() (evorl.agent.Agent method) (evorl.agent.RandomAgent method) (evorl.algorithms.a2c.A2CAgent method) (evorl.algorithms.contrib.td3_v3.TD3Agent method) (evorl.algorithms.ddpg.DDPGAgent method) (evorl.algorithms.dqn.DQNAgent method) (evorl.algorithms.ec.ec_agent.DeterministicECAgent method) (evorl.algorithms.ec.ec_agent.StochasticECAgent method) (evorl.algorithms.impala.IMPALAAgent method) (evorl.algorithms.ppo.PPOAgent method) (evorl.algorithms.sac.SACAgent method) (evorl.algorithms.sac.SACDiscreteAgent method) (evorl.algorithms.td3.TD3Agent method) (evorl.algorithms.td7.TD7Agent method) compute_centered_ranks() (in module evorl.ec.evox_algorithm.openes) (in module evorl.ec.optimizers.openes) compute_discount_return() (in module evorl.utils.rl_toolkits) compute_episode_length() (in module evorl.utils.rl_toolkits) compute_gae() (in module evorl.utils.rl_toolkits) compute_gae_with_horizon() (in module evorl.utils.rl_toolkits) compute_pg_advantage() (in module evorl.algorithms.impala) compute_ranks() (in module evorl.ec.evox_algorithm.openes) (in module evorl.ec.optimizers.openes) compute_values() (evorl.algorithms.a2c.A2CAgent method) (evorl.algorithms.ppo.PPOAgent method) compute_vtrace() (in module evorl.algorithms.impala) concatenate() (evorl.types.PyTreeArrayMixin method) contains() (evorl.envs.space.Box method) (evorl.envs.space.Discrete method) (evorl.envs.space.Space method) (evorl.envs.space.SpaceContainer method) continuous_action (evorl.algorithms.a2c.A2CAgent attribute) (evorl.algorithms.ec.ec_agent.StochasticECAgent attribute) (evorl.algorithms.impala.IMPALAAgent attribute) (evorl.algorithms.ppo.PPOAgent attribute) convert_pop_to_df() (in module evorl.algorithms.meta.pbt_utils) copy() (evorl.types.PyTreeDict method) count (evorl.utils.running_statistics.RunningStatisticsState attribute) cov_eps (evorl.ec.optimizers.cem.SepCEMState attribute) cov_eps_schedule (evorl.ec.optimizers.cem.SepCEM attribute) (evorl.ec.optimizers.SepCEM attribute) create_brax_env() (in module evorl.envs.brax) create_dummy_td3_trainmetric() (in module evorl.algorithms.erl.cemrl_td3.cemrl_td3_workflow) (in module evorl.algorithms.erl.erl_td3.erl_td3_workflow) create_env() (in module evorl.envs) create_envpool_env() (in module evorl.envs.envpool) create_gymnasium_env() (in module evorl.envs.gymnasium) create_gymnax_env() (in module evorl.envs.gymnax) create_jumanji_env() (in module evorl.envs.jumanji) create_mabrax_env() (in module evorl.envs.jaxmarl) create_mujoco_playground_env() (in module evorl.envs.mujoco_playground) create_wrapped_brax_env() (in module evorl.envs.brax) create_wrapped_gymnax_env() (in module evorl.envs.gymnax) create_wrapped_mabrax_env() (in module evorl.envs.jaxmarl) create_wrapped_mujoco_playground_env() (in module evorl.envs.mujoco_playground) critic1_loss (evorl.algorithms.contrib.td3_v3.TD3TrainMetric attribute) critic1_params (evorl.algorithms.contrib.td3_v3.TD3NetworkParams attribute) critic2_loss (evorl.algorithms.contrib.td3_v3.TD3TrainMetric attribute) critic2_params (evorl.algorithms.contrib.td3_v3.TD3NetworkParams attribute) critic_loss (evorl.algorithms.ddpg.DDPGTrainMetric attribute) (evorl.algorithms.sac.SACTrainMetric attribute) (evorl.algorithms.td3.TD3TrainMetric attribute) (evorl.algorithms.td7.TD7TrainMetric attribute) critic_loss() (evorl.algorithms.ddpg.DDPGAgent method) (evorl.algorithms.meta.pbt_sac.param_sac.ParamSACAgent method) (evorl.algorithms.sac.SACAgent method) (evorl.algorithms.sac.SACDiscreteAgent method) (evorl.algorithms.td3.TD3Agent method) (evorl.algorithms.td7.TD7Agent method) critic_network (evorl.algorithms.contrib.td3_v3.TD3Agent attribute) (evorl.algorithms.ddpg.DDPGAgent attribute) (evorl.algorithms.sac.SACAgent attribute) (evorl.algorithms.sac.SACDiscreteAgent attribute) (evorl.algorithms.td3.TD3Agent attribute) (evorl.algorithms.td7.TD7Agent attribute) critic_params (evorl.algorithms.ddpg.DDPGNetworkParams attribute) (evorl.algorithms.sac.SACNetworkParams attribute) (evorl.algorithms.td3.TD3NetworkParams attribute) (evorl.algorithms.td7.TD7NetworkParams attribute) critics_in_actor_loss (evorl.algorithms.contrib.td3_v3.TD3Agent attribute) (evorl.algorithms.td3.TD3Agent attribute) CSO (class in evorl.ec.evox_algorithm.cso) CSOState (class in evorl.ec.evox_algorithm.cso) current_index (evorl.replay_buffers.replay_buffer.ReplayBufferState attribute) (evorl.replay_buffers.ReplayBufferState attribute) D data (evorl.replay_buffers.replay_buffer.ReplayBufferState attribute) (evorl.replay_buffers.ReplayBufferState attribute) dataclass() (in module evorl.types) DDPGAgent (class in evorl.algorithms.ddpg) DDPGNetworkParams (class in evorl.algorithms.ddpg) DDPGTrainMetric (class in evorl.algorithms.ddpg) DDPGWorkflow (class in evorl.algorithms.ddpg) decay (evorl.ec.optimizers.ExponentialScheduleSpec attribute) (evorl.ec.optimizers.utils.ExponentialScheduleSpec attribute) delete() (evorl.utils.orbax_utils.DummyCheckpointManager method) denormalize() (in module evorl.utils.running_statistics) DeterministicECAgent (class in evorl.algorithms.ec.ec_agent) dim (evorl.ec.evox_algorithm.cso.CSO attribute) directory() (evorl.utils.orbax_utils.DummyCheckpointManager method) disable_gpu_preallocation() (in module evorl.utils.jax_utils) DISABLED (evorl.envs.wrappers.training_wrapper.AutoresetMode attribute) discount (evorl.algorithms.contrib.td3_v3.TD3Agent attribute) (evorl.algorithms.ddpg.DDPGAgent attribute) (evorl.algorithms.dqn.DQNAgent attribute) (evorl.algorithms.impala.IMPALAAgent attribute) (evorl.algorithms.sac.SACAgent attribute) (evorl.algorithms.sac.SACDiscreteAgent attribute) (evorl.algorithms.td3.TD3Agent attribute) (evorl.algorithms.td7.TD7Agent attribute) (evorl.evaluators.episode_collector.EpisodeCollector attribute) (evorl.evaluators.EpisodeCollector attribute) (evorl.evaluators.Evaluator attribute) (evorl.evaluators.evaluator.Evaluator attribute) Discrete (class in evorl.envs.space) DistributedInfo (class in evorl.workflows.ec_workflow) done (evorl.envs.env.EnvState attribute) Done (in module evorl.types) dones (evorl.sample_batch.SampleBatch attribute) DP_AXIS_NAME (in module evorl.distributed) DQNAgent (class in evorl.algorithms.dqn) DQNNetworkParams (class in evorl.algorithms.dqn) DQNTrainMetric (class in evorl.algorithms.dqn) DQNWorkflow (class in evorl.algorithms.dqn) DQNWorkflowMetric (class in evorl.algorithms.dqn) dtype (evorl.networks.spectral_norm.SNDense attribute) Dtype (in module evorl.networks.spectral_norm) DUMMY_TD3_TRAINMETRIC (in module evorl.algorithms.erl.cemrl_td3.cemrl_td3_workflow) (in module evorl.algorithms.erl.erl_td3.erl_td3_workflow) DummyCheckpointManager (class in evorl.utils.orbax_utils) E ec_info (evorl.algorithms.erl.cemrl_workflow.CEMRLTrainMetric attribute) (evorl.algorithms.erl.erl_workflow.ERLTrainMetric attribute) ec_metrics (evorl.metrics.ECTrainMetric attribute) ECNetworkParams (class in evorl.algorithms.ec.ec_agent) ECState (in module evorl.ec.optimizers) (in module evorl.ec.optimizers.ec_optimizer) ECTrainMetric (class in evorl.metrics) ECWorkflow (class in evorl.workflows) (class in evorl.workflows.ec_workflow) ECWorkflowMetric (class in evorl.metrics) ECWorkflowTemplate (class in evorl.workflows) (class in evorl.workflows.ec_workflow) elite_weights (evorl.ec.optimizers.cem.SepCEM attribute) (evorl.ec.optimizers.SepCEM attribute) (evorl.ec.optimizers.vanilla_es.VanillaES attribute) (evorl.ec.optimizers.VanillaES attribute) enable_crossover (evorl.ec.optimizers.erl_ga.ERLGA attribute) (evorl.ec.optimizers.ERLGA attribute) (evorl.ec.optimizers.vanilla_ga.VanillaGA attribute) (evorl.ec.optimizers.VanillaGA attribute) enable_deterministic_mode() (in module evorl.utils.jax_utils) enable_jit() (evorl.algorithms.ec.so.es_workflow.ESWorkflowTemplate class method) (evorl.algorithms.erl.cemrl_td3.cemrl_origin.CEMRLWorkflow class method) (evorl.algorithms.erl.cemrl_workflow.CEMRLWorkflowBase class method) (evorl.algorithms.erl.erl_td3.erl_origin.ERLWorkflow class method) (evorl.algorithms.erl.erl_workflow.ERLWorkflowBase class method) (evorl.algorithms.meta.pbt_workflow.PBTOffpolicyWorkflowTemplate class method) (evorl.algorithms.meta.pbt_workflow.PBTWorkflowBase class method) (evorl.algorithms.offpolicy_utils.OffPolicyWorkflowTemplate class method) (evorl.workflows.ec_workflow.ECWorkflow class method) (evorl.workflows.ec_workflow.ECWorkflowTemplate class method) (evorl.workflows.ECWorkflow class method) (evorl.workflows.ECWorkflowTemplate class method) (evorl.workflows.rl_workflow.RLWorkflow class method) (evorl.workflows.RLWorkflow class method) enable_multi_devices (evorl.workflows.ec_workflow.ECWorkflow property) (evorl.workflows.ECWorkflow property) (evorl.workflows.rl_workflow.RLWorkflow property) (evorl.workflows.RLWorkflow property) enable_shmap() (evorl.algorithms.ec.so.es_workflow.ESWorkflowTemplate class method) (evorl.workflows.ec_workflow.ECWorkflow class method) (evorl.workflows.ec_workflow.ECWorkflowTemplate class method) (evorl.workflows.ECWorkflow class method) (evorl.workflows.ECWorkflowTemplate class method) (evorl.workflows.rl_workflow.RLWorkflow class method) (evorl.workflows.RLWorkflow class method) encoder_loss (evorl.algorithms.td7.TD7TrainMetric attribute) encoder_loss() (evorl.algorithms.td7.TD7Agent method) encoder_network (evorl.algorithms.td7.TD7Agent attribute) encoder_params (evorl.algorithms.td7.TD7NetworkParams attribute) entropy() (evorl.distribution.TanhTransformedDistribution method) Env (class in evorl.envs.env) env (evorl.evaluators.episode_collector.EpisodeCollector attribute) (evorl.evaluators.EpisodeCollector attribute) (evorl.evaluators.Evaluator attribute) (evorl.evaluators.evaluator.Evaluator attribute) env_extra_fields (evorl.evaluators.episode_collector.EpisodeCollector attribute) (evorl.evaluators.EpisodeCollector attribute) env_state (evorl.envs.env.EnvState attribute) env_step() (in module evorl.evaluators.ec_evaluator) (in module evorl.rollout) EnvAdapter (class in evorl.envs.env) EnvInternalState (in module evorl.types) ENVPOOL (evorl.envs.wrappers.training_wrapper.AutoresetMode attribute) EnvPoolGymAdapter (class in evorl.envs.envpool) EnvResetFn (in module evorl.envs.env) EnvState (class in evorl.envs.env) EnvStepFn (in module evorl.envs.env) Episode (class in evorl.sample_batch) episode_lengths (evorl.metrics.EvaluateMetric attribute) episode_returns (evorl.metrics.EvaluateMetric attribute) EpisodeCollector (class in evorl.evaluators) (class in evorl.evaluators.episode_collector) EpisodeObsCollector (class in evorl.evaluators) (class in evorl.evaluators.ec_evaluator) EpisodeWrapper (class in evorl.envs.wrappers) (class in evorl.envs.wrappers.ma_training_wrapper) (class in evorl.envs.wrappers.training_wrapper) eps (evorl.networks.spectral_norm.SNDense attribute) erl_replace_td3_actor_params() (in module evorl.algorithms.erl.erl_td3.erl_td3_workflow) ERLEDAWorkflow (class in evorl.algorithms.erl.erl_td3.erl_eda) ERLESWorkflow (class in evorl.algorithms.erl.erl_td3.erl_es) ERLGA (class in evorl.ec.optimizers) (class in evorl.ec.optimizers.erl_ga) ERLGAMod (class in evorl.ec.optimizers) (class in evorl.ec.optimizers.erl_ga) ERLGAModState (class in evorl.ec.optimizers.erl_ga) ERLGAState (class in evorl.ec.optimizers.erl_ga) ERLGAWorkflow (class in evorl.algorithms.erl.erl_td3.erl_ga) ERLMutation (class in evorl.ec.operators) ERLTD3WorkflowTemplate (class in evorl.algorithms.erl.erl_td3.erl_td3_workflow) ERLTrainMetric (class in evorl.algorithms.erl.erl_td3.erl_origin) (class in evorl.algorithms.erl.erl_workflow) ERLWorkflow (class in evorl.algorithms.erl.erl_td3.erl_origin) ERLWorkflowBase (class in evorl.algorithms.erl.erl_workflow) ESWorkflowTemplate (class in evorl.algorithms.ec.so.es_workflow) eval_env_step() (in module evorl.evaluators.mo_brax_evaluator) (in module evorl.rollout) eval_metrics() (in module evorl.evaluators.mo_brax_evaluator) eval_rollout_episode() (in module evorl.evaluators.mo_brax_evaluator) (in module evorl.rollout) evaluate() (evorl.algorithms.contrib.pop_episodic_td3.PopEpisodicTD3Workflow method) (evorl.algorithms.contrib.pop_ppo.PopPPOWorkflow method) (evorl.algorithms.contrib.pop_td3.PopTD3Workflow method) (evorl.algorithms.ec.so.es_workflow.ESWorkflowTemplate method) (evorl.algorithms.erl.cemrl_td3.cemrl.CEMRLWorkflow method) (evorl.algorithms.erl.cemrl_workflow.CEMRLWorkflowBase method) (evorl.algorithms.erl.erl_td3.erl_eda.ERLEDAWorkflow method) (evorl.algorithms.erl.erl_td3.erl_es.ERLESWorkflow method) (evorl.algorithms.erl.erl_td3.erl_ga.ERLGAWorkflow method) (evorl.algorithms.erl.erl_workflow.ERLWorkflowBase method) (evorl.algorithms.meta.pbt_openes.pbt_param_openes.PBTParamOpenESWorkflow method) (evorl.algorithms.meta.pbt_workflow.PBTWorkflowBase method) (evorl.algorithms.random_agent.RandomAgentWorkflow method) (evorl.evaluators.BraxEvaluator method) (evorl.evaluators.Evaluator method) (evorl.evaluators.evaluator.Evaluator method) (evorl.evaluators.mo_brax_evaluator.BraxEvaluator method) (evorl.workflows.OffPolicyWorkflow method) (evorl.workflows.OnPolicyWorkflow method) (evorl.workflows.rl_workflow.OffPolicyWorkflow method) (evorl.workflows.rl_workflow.OnPolicyWorkflow method) (evorl.workflows.rl_workflow.RLWorkflow method) (evorl.workflows.RLWorkflow method) evaluate_actions() (evorl.agent.Agent method) (evorl.agent.RandomAgent method) (evorl.algorithms.a2c.A2CAgent method) (evorl.algorithms.contrib.td3_v3.TD3Agent method) (evorl.algorithms.ddpg.DDPGAgent method) (evorl.algorithms.dqn.DQNAgent method) (evorl.algorithms.ec.ec_agent.DeterministicECAgent method) (evorl.algorithms.ec.ec_agent.StochasticECAgent method) (evorl.algorithms.impala.IMPALAAgent method) (evorl.algorithms.ppo.PPOAgent method) (evorl.algorithms.sac.SACAgent method) (evorl.algorithms.sac.SACDiscreteAgent method) (evorl.algorithms.td3.TD3Agent method) (evorl.algorithms.td7.TD7Agent method) EvaluateMetric (class in evorl.algorithms.erl.cemrl_td3.cemrl) (class in evorl.algorithms.erl.erl_td3.erl_eda) (class in evorl.algorithms.erl.erl_td3.erl_es) (class in evorl.algorithms.erl.erl_td3.erl_ga) (class in evorl.metrics) Evaluator (class in evorl.evaluators) (class in evorl.evaluators.evaluator) EvoOptimizer (class in evorl.ec.optimizers) (class in evorl.ec.optimizers.ec_optimizer) evorl module evorl.agent module evorl.algorithms module evorl.algorithms.a2c module evorl.algorithms.contrib module evorl.algorithms.contrib.a2c_v2 module evorl.algorithms.contrib.ars_linear module evorl.algorithms.contrib.openes_noise_table module evorl.algorithms.contrib.pop_episodic_td3 module evorl.algorithms.contrib.pop_ppo module evorl.algorithms.contrib.pop_td3 module evorl.algorithms.contrib.td3_ep module evorl.algorithms.contrib.td3_onpolicy module evorl.algorithms.contrib.td3_v2 module evorl.algorithms.contrib.td3_v3 module evorl.algorithms.ddpg module evorl.algorithms.dqn module evorl.algorithms.ec module evorl.algorithms.ec.ec_agent module evorl.algorithms.ec.mo module evorl.algorithms.ec.mo.nsga2_brax module evorl.algorithms.ec.obs_utils module evorl.algorithms.ec.so module evorl.algorithms.ec.so.ars module evorl.algorithms.ec.so.cmaes module evorl.algorithms.ec.so.es_workflow module evorl.algorithms.ec.so.openes module evorl.algorithms.ec.so.sepcem module evorl.algorithms.ec.so.vanilla_es module evorl.algorithms.erl module evorl.algorithms.erl.cemrl_td3 module evorl.algorithms.erl.cemrl_td3.cemrl module evorl.algorithms.erl.cemrl_td3.cemrl_openes module evorl.algorithms.erl.cemrl_td3.cemrl_origin module evorl.algorithms.erl.cemrl_td3.cemrl_td3_workflow module evorl.algorithms.erl.cemrl_workflow module evorl.algorithms.erl.erl_td3 module evorl.algorithms.erl.erl_td3.erl_eda module evorl.algorithms.erl.erl_td3.erl_es module evorl.algorithms.erl.erl_td3.erl_ga module evorl.algorithms.erl.erl_td3.erl_origin module evorl.algorithms.erl.erl_td3.erl_td3_workflow module evorl.algorithms.erl.erl_workflow module evorl.algorithms.impala module evorl.algorithms.meta module evorl.algorithms.meta.pbt module evorl.algorithms.meta.pbt_openes module evorl.algorithms.meta.pbt_openes.param_openes module evorl.algorithms.meta.pbt_openes.pbt_param_openes module evorl.algorithms.meta.pbt_operations module evorl.algorithms.meta.pbt_ppo module evorl.algorithms.meta.pbt_ppo.param_ppo module evorl.algorithms.meta.pbt_ppo.pbt_cso_param_ppo module evorl.algorithms.meta.pbt_ppo.pbt_param_ppo module evorl.algorithms.meta.pbt_sac module evorl.algorithms.meta.pbt_sac.param_sac module evorl.algorithms.meta.pbt_sac.pbt_param_sac module evorl.algorithms.meta.pbt_utils module evorl.algorithms.meta.pbt_workflow module evorl.algorithms.multi_agents module evorl.algorithms.multi_agents.ippo_mabrax module evorl.algorithms.multi_agents.maddpg_mabrax module evorl.algorithms.multi_agents.mappo_mabrax module evorl.algorithms.multi_agents.matd3_mabrax module evorl.algorithms.offpolicy_utils module evorl.algorithms.ppo module evorl.algorithms.random_agent module evorl.algorithms.sac module evorl.algorithms.td3 module evorl.algorithms.td7 module evorl.distributed module evorl.distributed.comm module evorl.distributed.gradients module evorl.distributed.sharding module evorl.distribution module evorl.ec module evorl.ec.evox_algorithm module evorl.ec.evox_algorithm.cmaes module evorl.ec.evox_algorithm.cso module evorl.ec.evox_algorithm.openes module evorl.ec.evox_algorithm.sort_utils module evorl.ec.operators module evorl.ec.operators.utils module evorl.ec.optimizers module evorl.ec.optimizers.ars module evorl.ec.optimizers.cem module evorl.ec.optimizers.ec_optimizer module evorl.ec.optimizers.erl_ga module evorl.ec.optimizers.evox_wrapper module evorl.ec.optimizers.openes module evorl.ec.optimizers.utils module evorl.ec.optimizers.vanilla_es module evorl.ec.optimizers.vanilla_ga module evorl.envs module evorl.envs.brax module evorl.envs.env module evorl.envs.envpool module evorl.envs.gymnasium module evorl.envs.gymnax module evorl.envs.jaxmarl module evorl.envs.jumanji module evorl.envs.mujoco_playground module evorl.envs.space module evorl.envs.utils module evorl.envs.wrappers module evorl.envs.wrappers.action_wrapper module evorl.envs.wrappers.ma_training_wrapper module evorl.envs.wrappers.obs_wrapper module evorl.envs.wrappers.reward_wrapper module evorl.envs.wrappers.training_wrapper module evorl.envs.wrappers.wrapper module evorl.evaluators module evorl.evaluators.ec_evaluator module evorl.evaluators.episode_collector module evorl.evaluators.evaluator module evorl.evaluators.mo_brax_evaluator module evorl.metrics module evorl.networks module evorl.networks.layer_norm module evorl.networks.linear module evorl.networks.spectral_norm module evorl.recorders module evorl.recorders.log_recorder module evorl.recorders.recorder module evorl.recorders.wandb_recorder module evorl.replay_buffers module evorl.replay_buffers.lap_replay_buffer module evorl.replay_buffers.prioritized_replay_buffer module evorl.replay_buffers.replay_buffer module evorl.rollout module evorl.sample_batch module evorl.types module evorl.utils module evorl.utils.ec_utils module evorl.utils.jax_utils module evorl.utils.ma_utils module evorl.utils.orbax_utils module evorl.utils.rl_toolkits module evorl.utils.running_statistics module evorl.workflows module evorl.workflows.ec_workflow module evorl.workflows.rl_workflow module evorl.workflows.workflow module EvoXAlgorithmAdapter (class in evorl.ec.optimizers.evox_wrapper) EvoXAlgoState (class in evorl.ec.optimizers.evox_wrapper) exp_uniform_init() (in module evorl.algorithms.meta.pbt_utils) exploit_and_explore() (evorl.algorithms.meta.pbt_ppo.pbt_cso_param_ppo.PBTCSOParamPPOWorkflow method) (evorl.algorithms.meta.pbt_workflow.PBTWorkflowBase method) (evorl.algorithms.meta.pbt_workflow.PBTWorkflowTemplate method) exploration_epsilon (evorl.algorithms.contrib.td3_v3.TD3Agent attribute) (evorl.algorithms.ddpg.DDPGAgent attribute) (evorl.algorithms.dqn.DQNNetworkParams attribute) (evorl.algorithms.td3.TD3Agent attribute) (evorl.algorithms.td7.TD7Agent attribute) explore() (in module evorl.algorithms.meta.pbt_operations) ExponentialScheduleSpec (class in evorl.ec.optimizers) (class in evorl.ec.optimizers.utils) external_pop (evorl.ec.optimizers.erl_ga.ERLGAModState attribute) external_size (evorl.ec.optimizers.erl_ga.ERLGAMod attribute) (evorl.ec.optimizers.ERLGAMod attribute) (evorl.ec.optimizers.vanilla_es.VanillaESMod attribute) (evorl.ec.optimizers.VanillaESMod attribute) extra_state (evorl.agent.AgentState attribute) ExtraInfo (in module evorl.types) extras (evorl.sample_batch.SampleBatch attribute) F f_layer_sizes (evorl.algorithms.td7.TD7Encoder attribute) FAST (evorl.envs.wrappers.training_wrapper.AutoresetMode attribute) fast_eval_metrics() (in module evorl.evaluators.mo_brax_evaluator) fast_eval_rollout_episode() (in module evorl.rollout) FastVmapAutoResetWrapper (class in evorl.envs.wrappers) (class in evorl.envs.wrappers.ma_training_wrapper) (class in evorl.envs.wrappers.training_wrapper) features (evorl.networks.spectral_norm.SNDense attribute) filter_zero_size_arrays_on_restore() (in module evorl.utils.orbax_utils) filter_zero_size_arrays_on_save() (in module evorl.utils.orbax_utils) final (evorl.ec.optimizers.ExponentialScheduleSpec attribute) (evorl.ec.optimizers.utils.ExponentialScheduleSpec attribute) fitness (evorl.ec.evox_algorithm.cso.CSOState attribute) fitness_shaping_fn (evorl.algorithms.meta.pbt_openes.param_openes.OpenES attribute) (evorl.ec.optimizers.OpenES attribute) (evorl.ec.optimizers.openes.OpenES attribute) (evorl.ec.optimizers.openes.OpenESNoiseTable attribute) (evorl.ec.optimizers.OpenESNoiseTable attribute) fitness_std_eps (evorl.ec.optimizers.ARS attribute) (evorl.ec.optimizers.ars.ARS attribute) fixed_bias (evorl.networks.layer_norm.StaticLayerNorm attribute) (evorl.networks.StaticLayerNorm attribute) fixed_encoder_params (evorl.algorithms.td7.TD7NetworkParams attribute) fixed_encoder_target_params (evorl.algorithms.td7.TD7NetworkParams attribute) fixed_scale (evorl.networks.layer_norm.StaticLayerNorm attribute) (evorl.networks.StaticLayerNorm attribute) flatten_pop_rollout_episode() (in module evorl.utils.rl_toolkits) flatten_pop_rollout_trajectory() (in module evorl.algorithms.contrib.pop_td3) flatten_rollout_trajectory() (in module evorl.utils.rl_toolkits) fold_multi_steps() (in module evorl.utils.rl_toolkits) G g_layer_sizes (evorl.algorithms.td7.TD7Encoder attribute) get_1d_array() (in module evorl.recorders) (in module evorl.recorders.wandb_recorder) get_1d_array_statistics() (in module evorl.recorders) (in module evorl.recorders.wandb_recorder) get_categorical_dist() (in module evorl.distribution) get_ec_pop_statistics() (in module evorl.algorithms.erl.erl_td3.erl_origin) get_global_ranks() (in module evorl.distributed) (in module evorl.distributed.comm) get_norm_layer() (in module evorl.networks.layer_norm) get_process_id() (in module evorl.distributed) (in module evorl.distributed.comm) get_random_actions() (in module evorl.envs.jaxmarl) get_std_statistics() (in module evorl.algorithms.erl.cemrl_td3.cemrl) get_tanh_norm_dist() (in module evorl.distribution) get_train_episode_return() (in module evorl.algorithms.contrib.a2c_v2) get_trancated_norm_dist() (in module evorl.distribution) get_wrapper() (in module evorl.envs.wrappers) (in module evorl.envs.wrappers.wrapper) gradient_update() (in module evorl.distributed) (in module evorl.distributed.gradients) gym_space_to_evorl_space() (in module evorl.envs.envpool) gymnasium_space_to_evorl_space() (in module evorl.envs.gymnasium) GymnasiumAdapter (class in evorl.envs.gymnasium) gymnax_space_to_evorl_space() (in module evorl.envs.gymnax) GymnaxAdapter (class in evorl.envs.gymnax) H has_nan() (in module evorl.utils.jax_utils) hidden_layer_sizes (evorl.algorithms.td7.TD7Actor attribute) (evorl.algorithms.td7.TD7Critic attribute) high (evorl.envs.space.Box attribute) I IMPALAAgent (class in evorl.algorithms.impala) IMPALANetworkParams (class in evorl.algorithms.impala) IMPALAWorkflow (class in evorl.algorithms.impala) index_set() (evorl.types.PyTreeArrayMixin method) index_sum() (evorl.types.PyTreeArrayMixin method) info (evorl.envs.env.EnvState attribute) init (evorl.ec.optimizers.ExponentialScheduleSpec attribute) (evorl.ec.optimizers.utils.ExponentialScheduleSpec attribute) init() (evorl.agent.Agent method) (evorl.agent.RandomAgent method) (evorl.algorithms.a2c.A2CAgent method) (evorl.algorithms.contrib.td3_v3.TD3Agent method) (evorl.algorithms.ddpg.DDPGAgent method) (evorl.algorithms.dqn.DQNAgent method) (evorl.algorithms.ec.ec_agent.DeterministicECAgent method) (evorl.algorithms.ec.ec_agent.StochasticECAgent method) (evorl.algorithms.impala.IMPALAAgent method) (evorl.algorithms.meta.pbt_openes.param_openes.OpenES method) (evorl.algorithms.meta.pbt_ppo.param_ppo.ParamPPOAgent method) (evorl.algorithms.meta.pbt_sac.param_sac.ParamSACAgent method) (evorl.algorithms.ppo.PPOAgent method) (evorl.algorithms.sac.SACAgent method) (evorl.algorithms.sac.SACDiscreteAgent method) (evorl.algorithms.td3.TD3Agent method) (evorl.algorithms.td7.TD7Agent method) (evorl.ec.optimizers.ARS method) (evorl.ec.optimizers.ars.ARS method) (evorl.ec.optimizers.cem.SepCEM method) (evorl.ec.optimizers.ec_optimizer.EvoOptimizer method) (evorl.ec.optimizers.erl_ga.ERLGA method) (evorl.ec.optimizers.erl_ga.ERLGAMod method) (evorl.ec.optimizers.ERLGA method) (evorl.ec.optimizers.ERLGAMod method) (evorl.ec.optimizers.EvoOptimizer method) (evorl.ec.optimizers.evox_wrapper.EvoXAlgorithmAdapter method) (evorl.ec.optimizers.OpenES method) (evorl.ec.optimizers.openes.OpenES method) (evorl.ec.optimizers.openes.OpenESNoiseTable method) (evorl.ec.optimizers.OpenESNoiseTable method) (evorl.ec.optimizers.SepCEM method) (evorl.ec.optimizers.vanilla_es.VanillaES method) (evorl.ec.optimizers.vanilla_ga.VanillaGA method) (evorl.ec.optimizers.VanillaES method) (evorl.ec.optimizers.VanillaGA method) (evorl.recorders.ChainRecorder method) (evorl.recorders.log_recorder.LogRecorder method) (evorl.recorders.LogRecorder method) (evorl.recorders.Recorder method) (evorl.recorders.recorder.ChainRecorder method) (evorl.recorders.recorder.Recorder method) (evorl.recorders.wandb_recorder.WandbRecorder method) (evorl.recorders.WandbRecorder method) (evorl.replay_buffers.AbstractReplayBuffer method) (evorl.replay_buffers.prioritized_replay_buffer.PrioritizedReplayBuffer method) (evorl.replay_buffers.PrioritizedReplayBuffer method) (evorl.replay_buffers.replay_buffer.AbstractReplayBuffer method) (evorl.replay_buffers.replay_buffer.ReplayBuffer method) (evorl.replay_buffers.ReplayBuffer method) (evorl.workflows.Workflow method) (evorl.workflows.workflow.AbstractWorkflow method) (evorl.workflows.workflow.Workflow method) init_alpha (evorl.algorithms.sac.SACAgent attribute) (evorl.algorithms.sac.SACDiscreteAgent attribute) init_ask() (evorl.ec.evox_algorithm.cso.CSO method) init_obs_preprocessor() (in module evorl.algorithms.ec.obs_utils) init_obs_preprocessor_with_random_timesteps() (in module evorl.algorithms.ec.obs_utils) init_state() (in module evorl.utils.running_statistics) init_std (evorl.ec.evox_algorithm.cso.CSO attribute) init_step (evorl.ec.optimizers.evox_wrapper.EvoXAlgoState attribute) init_tell() (evorl.ec.evox_algorithm.cso.CSO method) Initializer (in module evorl.networks.linear) invert_permutation() (in module evorl.utils.jax_utils) is_dist_initialized() (in module evorl.distributed) (in module evorl.distributed.comm) is_full() (evorl.replay_buffers.AbstractReplayBuffer method) (evorl.replay_buffers.replay_buffer.AbstractReplayBuffer method) (evorl.replay_buffers.replay_buffer.ReplayBuffer method) (evorl.replay_buffers.ReplayBuffer method) is_jitted() (in module evorl.utils.jax_utils) is_layer_norm_layer() (in module evorl.ec.operators.utils) is_leaf_space() (in module evorl.envs.space) item_metadata() (evorl.utils.orbax_utils.DummyCheckpointManager method) iterations (evorl.algorithms.contrib.pop_td3.WorkflowMetric attribute) (evorl.algorithms.erl.cemrl_td3.cemrl_origin.WorkflowMetric attribute) (evorl.algorithms.erl.erl_workflow.WorkflowMetric attribute) (evorl.algorithms.meta.pbt_workflow.PBTWorkflowMetric attribute) (evorl.metrics.ECWorkflowMetric attribute) (evorl.metrics.MultiObjectiveECWorkflowMetric attribute) (evorl.metrics.WorkflowMetric attribute) J jaxmarl_space_to_evorl_space() (in module evorl.envs.jaxmarl) JaxMARLAdapter (class in evorl.envs.jaxmarl) jit_method() (in module evorl.utils.jax_utils) jumanji_specs_to_evorl_space() (in module evorl.envs.jumanji) JumanjiAdapter (class in evorl.envs.jumanji) K kernel_init (evorl.networks.linear.MLP attribute) (evorl.networks.linear.SNMLP attribute) (evorl.networks.MLP attribute) (evorl.networks.SNMLP attribute) (evorl.networks.spectral_norm.SNDense attribute) key (evorl.ec.evox_algorithm.cso.CSOState attribute) (evorl.ec.optimizers.ars.ARSState attribute) (evorl.ec.optimizers.cem.SepCEMState attribute) (evorl.ec.optimizers.erl_ga.ERLGAState attribute) (evorl.ec.optimizers.openes.OpenESNoiseTableState attribute) (evorl.ec.optimizers.openes.OpenESState attribute) (evorl.ec.optimizers.vanilla_es.VanillaESState attribute) (evorl.ec.optimizers.vanilla_ga.VanillaGAState attribute) L LAPReplayBuffer (class in evorl.replay_buffers) (class in evorl.replay_buffers.lap_replay_buffer) latest_step() (evorl.utils.orbax_utils.DummyCheckpointManager method) layer_sizes (evorl.networks.linear.MLP attribute) (evorl.networks.linear.SNMLP attribute) (evorl.networks.MLP attribute) (evorl.networks.SNMLP attribute) lb (evorl.ec.evox_algorithm.cso.CSO attribute) learn() (evorl.algorithms.a2c.A2CWorkflow method) (evorl.algorithms.contrib.a2c_v2.A2CWorkflow method) (evorl.algorithms.contrib.pop_episodic_td3.PopEpisodicTD3Workflow method) (evorl.algorithms.contrib.pop_ppo.PopPPOWorkflow method) (evorl.algorithms.contrib.pop_td3.PopTD3Workflow method) (evorl.algorithms.contrib.td3_ep.TD3WorkflowMod method) (evorl.algorithms.contrib.td3_onpolicy.TD3OnPolicyWorkflow method) (evorl.algorithms.contrib.td3_v2.TD3V2Workflow method) (evorl.algorithms.contrib.td3_v3.TD3V3Workflow method) (evorl.algorithms.ec.mo.nsga2_brax.NSGA2Workflow method) (evorl.algorithms.ec.so.es_workflow.ESWorkflowTemplate method) (evorl.algorithms.erl.cemrl_td3.cemrl.CEMRLWorkflow method) (evorl.algorithms.erl.cemrl_td3.cemrl_openes.CEMRLOpenESWorkflow method) (evorl.algorithms.erl.erl_td3.erl_eda.ERLEDAWorkflow method) (evorl.algorithms.erl.erl_td3.erl_es.ERLESWorkflow method) (evorl.algorithms.erl.erl_td3.erl_ga.ERLGAWorkflow method) (evorl.algorithms.impala.IMPALAWorkflow method) (evorl.algorithms.meta.pbt_workflow.PBTOffpolicyWorkflowTemplate method) (evorl.algorithms.meta.pbt_workflow.PBTWorkflowTemplate method) (evorl.algorithms.offpolicy_utils.OffPolicyWorkflowTemplate method) (evorl.algorithms.ppo.PPOWorkflow method) (evorl.algorithms.random_agent.RandomAgentWorkflow method) (evorl.algorithms.td7.TD7Workflow method) (evorl.workflows.Workflow method) (evorl.workflows.workflow.Workflow method) load() (in module evorl.utils.orbax_utils) log_alpha (evorl.algorithms.sac.SACNetworkParams attribute) log_prob() (evorl.distribution.TanhTransformedDistribution method) log_uniform_init() (in module evorl.algorithms.meta.pbt_utils) LOGGING_WARMUP_FLAG (evorl.algorithms.erl.erl_td3.erl_td3_workflow.ERLTD3WorkflowTemplate attribute) LogRecorder (class in evorl.recorders) (class in evorl.recorders.log_recorder) loss (evorl.algorithms.dqn.DQNTrainMetric attribute) (evorl.metrics.TrainMetric attribute) loss() (evorl.algorithms.a2c.A2CAgent method) (evorl.algorithms.dqn.DQNAgent method) (evorl.algorithms.impala.IMPALAAgent method) (evorl.algorithms.meta.pbt_ppo.param_ppo.ParamPPOAgent method) (evorl.algorithms.ppo.PPOAgent method) loss_and_pgrad() (in module evorl.distributed.gradients) LossDict (in module evorl.types) LossFn (class in evorl.agent) low (evorl.envs.space.Box attribute) lr (evorl.algorithms.meta.pbt_openes.param_openes.OpenES attribute) (evorl.ec.optimizers.ARS attribute) (evorl.ec.optimizers.ars.ARS attribute) lr_schedule (evorl.ec.optimizers.OpenES attribute) (evorl.ec.optimizers.openes.OpenES attribute) (evorl.ec.optimizers.openes.OpenESNoiseTable attribute) (evorl.ec.optimizers.OpenESNoiseTable attribute) M ma_brax_env_list (in module evorl.envs.jaxmarl) MABraxAdapter (class in evorl.envs.jaxmarl) make_deterministic_ec_agent() (in module evorl.algorithms.contrib.ars_linear) (in module evorl.algorithms.ec.ec_agent) make_discrete_q_network() (in module evorl.networks) (in module evorl.networks.linear) make_mlp() (in module evorl.networks) (in module evorl.networks.linear) make_mlp_a2c_agent() (in module evorl.algorithms.a2c) make_mlp_ddpg_agent() (in module evorl.algorithms.ddpg) make_mlp_discrete_dqn_agent() (in module evorl.algorithms.dqn) make_mlp_impala_agent() (in module evorl.algorithms.impala) make_mlp_ppo_agent() (in module evorl.algorithms.meta.pbt_ppo.param_ppo) (in module evorl.algorithms.ppo) make_mlp_sac_agent() (in module evorl.algorithms.meta.pbt_sac.param_sac) (in module evorl.algorithms.sac) make_mlp_td3_agent() (in module evorl.algorithms.contrib.td3_v3) (in module evorl.algorithms.td3) make_policy_network() (in module evorl.algorithms.contrib.ars_linear) (in module evorl.networks) (in module evorl.networks.linear) make_q_network() (in module evorl.networks) (in module evorl.networks.linear) make_stochastic_ec_agent() (in module evorl.algorithms.ec.ec_agent) make_td7_agent() (in module evorl.algorithms.td7) make_v_network() (in module evorl.networks) (in module evorl.networks.linear) make_vmap_mlp() (in module evorl.networks) (in module evorl.networks.linear) matrix_num_mutation_frac (evorl.ec.operators.MLPMutation attribute) (evorl.ec.optimizers.vanilla_ga.VanillaGA attribute) (evorl.ec.optimizers.VanillaGA attribute) max_episode_steps (evorl.evaluators.episode_collector.EpisodeCollector attribute) (evorl.evaluators.EpisodeCollector attribute) (evorl.evaluators.Evaluator attribute) (evorl.evaluators.evaluator.Evaluator attribute) max_priority (evorl.replay_buffers.prioritized_replay_buffer.PrioritizedReplayBufferState attribute) (evorl.replay_buffers.PrioritizedReplayBufferState attribute) mean (evorl.ec.optimizers.ars.ARSState attribute) (evorl.ec.optimizers.cem.SepCEMState attribute) (evorl.ec.optimizers.openes.OpenESNoiseTableState attribute) (evorl.ec.optimizers.openes.OpenESState attribute) (evorl.ec.optimizers.vanilla_es.VanillaESState attribute) (evorl.utils.running_statistics.NestedMeanStd attribute) metadata() (evorl.utils.orbax_utils.DummyCheckpointManager method) metric_field() (in module evorl.metrics) metric_names (evorl.evaluators.BraxEvaluator attribute) (evorl.evaluators.mo_brax_evaluator.BraxEvaluator attribute) MetricBase (class in evorl.metrics) Metrics (in module evorl.types) metrics() (evorl.utils.orbax_utils.DummyCheckpointManager method) min_priority (evorl.algorithms.td7.TD7Agent attribute) min_sample_timesteps (evorl.replay_buffers.replay_buffer.ReplayBuffer attribute) (evorl.replay_buffers.ReplayBuffer attribute) mirror_sampling (evorl.algorithms.meta.pbt_openes.param_openes.OpenES attribute) (evorl.ec.optimizers.cem.SepCEM attribute) (evorl.ec.optimizers.OpenES attribute) (evorl.ec.optimizers.openes.OpenES attribute) (evorl.ec.optimizers.openes.OpenESNoiseTable attribute) (evorl.ec.optimizers.OpenESNoiseTable attribute) (evorl.ec.optimizers.SepCEM attribute) MISSING_LOSS (in module evorl.algorithms.contrib.td3_onpolicy) (in module evorl.algorithms.contrib.td3_v2) (in module evorl.algorithms.contrib.td3_v3) MISSING_REWARD (in module evorl.types) mix_strategy (evorl.ec.optimizers.vanilla_es.VanillaESMod attribute) (evorl.ec.optimizers.VanillaESMod attribute) MjxEnvAdapter (class in evorl.envs.mujoco_playground) MLP (class in evorl.networks) (class in evorl.networks.linear) MLPCrossover (class in evorl.ec.operators) MLPMutation (class in evorl.ec.operators) mode() (evorl.distribution.TanhTransformedDistribution method) module evorl evorl.agent evorl.algorithms evorl.algorithms.a2c evorl.algorithms.contrib evorl.algorithms.contrib.a2c_v2 evorl.algorithms.contrib.ars_linear evorl.algorithms.contrib.openes_noise_table evorl.algorithms.contrib.pop_episodic_td3 evorl.algorithms.contrib.pop_ppo evorl.algorithms.contrib.pop_td3 evorl.algorithms.contrib.td3_ep evorl.algorithms.contrib.td3_onpolicy evorl.algorithms.contrib.td3_v2 evorl.algorithms.contrib.td3_v3 evorl.algorithms.ddpg evorl.algorithms.dqn evorl.algorithms.ec evorl.algorithms.ec.ec_agent evorl.algorithms.ec.mo evorl.algorithms.ec.mo.nsga2_brax evorl.algorithms.ec.obs_utils evorl.algorithms.ec.so evorl.algorithms.ec.so.ars evorl.algorithms.ec.so.cmaes evorl.algorithms.ec.so.es_workflow evorl.algorithms.ec.so.openes evorl.algorithms.ec.so.sepcem evorl.algorithms.ec.so.vanilla_es evorl.algorithms.erl evorl.algorithms.erl.cemrl_td3 evorl.algorithms.erl.cemrl_td3.cemrl evorl.algorithms.erl.cemrl_td3.cemrl_openes evorl.algorithms.erl.cemrl_td3.cemrl_origin evorl.algorithms.erl.cemrl_td3.cemrl_td3_workflow evorl.algorithms.erl.cemrl_workflow evorl.algorithms.erl.erl_td3 evorl.algorithms.erl.erl_td3.erl_eda evorl.algorithms.erl.erl_td3.erl_es evorl.algorithms.erl.erl_td3.erl_ga evorl.algorithms.erl.erl_td3.erl_origin evorl.algorithms.erl.erl_td3.erl_td3_workflow evorl.algorithms.erl.erl_workflow evorl.algorithms.impala evorl.algorithms.meta evorl.algorithms.meta.pbt evorl.algorithms.meta.pbt_openes evorl.algorithms.meta.pbt_openes.param_openes evorl.algorithms.meta.pbt_openes.pbt_param_openes evorl.algorithms.meta.pbt_operations evorl.algorithms.meta.pbt_ppo evorl.algorithms.meta.pbt_ppo.param_ppo evorl.algorithms.meta.pbt_ppo.pbt_cso_param_ppo evorl.algorithms.meta.pbt_ppo.pbt_param_ppo evorl.algorithms.meta.pbt_sac evorl.algorithms.meta.pbt_sac.param_sac evorl.algorithms.meta.pbt_sac.pbt_param_sac evorl.algorithms.meta.pbt_utils evorl.algorithms.meta.pbt_workflow evorl.algorithms.multi_agents evorl.algorithms.multi_agents.ippo_mabrax evorl.algorithms.multi_agents.maddpg_mabrax evorl.algorithms.multi_agents.mappo_mabrax evorl.algorithms.multi_agents.matd3_mabrax evorl.algorithms.offpolicy_utils evorl.algorithms.ppo evorl.algorithms.random_agent evorl.algorithms.sac evorl.algorithms.td3 evorl.algorithms.td7 evorl.distributed evorl.distributed.comm evorl.distributed.gradients evorl.distributed.sharding evorl.distribution evorl.ec evorl.ec.evox_algorithm evorl.ec.evox_algorithm.cmaes evorl.ec.evox_algorithm.cso evorl.ec.evox_algorithm.openes evorl.ec.evox_algorithm.sort_utils evorl.ec.operators evorl.ec.operators.utils evorl.ec.optimizers evorl.ec.optimizers.ars evorl.ec.optimizers.cem evorl.ec.optimizers.ec_optimizer evorl.ec.optimizers.erl_ga evorl.ec.optimizers.evox_wrapper evorl.ec.optimizers.openes evorl.ec.optimizers.utils evorl.ec.optimizers.vanilla_es evorl.ec.optimizers.vanilla_ga evorl.envs evorl.envs.brax evorl.envs.env evorl.envs.envpool evorl.envs.gymnasium evorl.envs.gymnax evorl.envs.jaxmarl evorl.envs.jumanji evorl.envs.mujoco_playground evorl.envs.space evorl.envs.utils evorl.envs.wrappers evorl.envs.wrappers.action_wrapper evorl.envs.wrappers.ma_training_wrapper evorl.envs.wrappers.obs_wrapper evorl.envs.wrappers.reward_wrapper evorl.envs.wrappers.training_wrapper evorl.envs.wrappers.wrapper evorl.evaluators evorl.evaluators.ec_evaluator evorl.evaluators.episode_collector evorl.evaluators.evaluator evorl.evaluators.mo_brax_evaluator evorl.metrics evorl.networks evorl.networks.layer_norm evorl.networks.linear evorl.networks.spectral_norm evorl.recorders evorl.recorders.log_recorder evorl.recorders.recorder evorl.recorders.wandb_recorder evorl.replay_buffers evorl.replay_buffers.lap_replay_buffer evorl.replay_buffers.prioritized_replay_buffer evorl.replay_buffers.replay_buffer evorl.rollout evorl.sample_batch evorl.types evorl.utils evorl.utils.ec_utils evorl.utils.jax_utils evorl.utils.ma_utils evorl.utils.orbax_utils evorl.utils.rl_toolkits evorl.utils.running_statistics evorl.workflows evorl.workflows.ec_workflow evorl.workflows.rl_workflow evorl.workflows.workflow multi_agent_episode_done() (in module evorl.utils.ma_utils) MultiObjectiveECWorkflowMetric (class in evorl.metrics) MultiObjectiveECWorkflowTemplate (class in evorl.workflows) (class in evorl.workflows.ec_workflow) mut_strength (evorl.ec.operators.ERLMutation attribute) (evorl.ec.operators.MLPMutation attribute) (evorl.ec.optimizers.erl_ga.ERLGA attribute) (evorl.ec.optimizers.ERLGA attribute) (evorl.ec.optimizers.vanilla_ga.VanillaGA attribute) (evorl.ec.optimizers.VanillaGA attribute) N n (evorl.envs.space.Discrete attribute) n_steps (evorl.networks.spectral_norm.SNDense attribute) name() (evorl.algorithms.a2c.A2CWorkflow class method) (evorl.algorithms.contrib.a2c_v2.A2CWorkflow class method) (evorl.algorithms.contrib.ars_linear.ARSWorkflow class method) (evorl.algorithms.contrib.openes_noise_table.OpenESWorkflow class method) (evorl.algorithms.contrib.pop_episodic_td3.PopEpisodicTD3Workflow class method) (evorl.algorithms.contrib.pop_ppo.PopPPOWorkflow class method) (evorl.algorithms.contrib.pop_td3.PopTD3Workflow class method) (evorl.algorithms.contrib.td3_onpolicy.TD3OnPolicyWorkflow class method) (evorl.algorithms.contrib.td3_v2.TD3V2Workflow class method) (evorl.algorithms.contrib.td3_v3.TD3V3Workflow class method) (evorl.algorithms.ddpg.DDPGWorkflow class method) (evorl.algorithms.dqn.DQNWorkflow class method) (evorl.algorithms.ec.mo.nsga2_brax.NSGA2Workflow class method) (evorl.algorithms.ec.so.ars.ARSWorkflow class method) (evorl.algorithms.ec.so.cmaes.CMAESWorkflow class method) (evorl.algorithms.ec.so.cmaes.SepCMAESWorkflow class method) (evorl.algorithms.ec.so.openes.OpenESWorkflow class method) (evorl.algorithms.ec.so.sepcem.SepCEMWorkflow class method) (evorl.algorithms.ec.so.vanilla_es.VanillaESWorkflow class method) (evorl.algorithms.erl.cemrl_td3.cemrl.CEMRLWorkflow class method) (evorl.algorithms.erl.cemrl_td3.cemrl_openes.CEMRLOpenESWorkflow class method) (evorl.algorithms.erl.cemrl_td3.cemrl_origin.CEMRLWorkflow class method) (evorl.algorithms.erl.erl_td3.erl_eda.ERLEDAWorkflow class method) (evorl.algorithms.erl.erl_td3.erl_es.ERLESWorkflow class method) (evorl.algorithms.erl.erl_td3.erl_ga.ERLGAWorkflow class method) (evorl.algorithms.erl.erl_td3.erl_origin.ERLWorkflow class method) (evorl.algorithms.impala.IMPALAWorkflow class method) (evorl.algorithms.meta.pbt.PBTWorkflow class method) (evorl.algorithms.meta.pbt_openes.param_openes.ParamOpenESWorkflow class method) (evorl.algorithms.meta.pbt_openes.pbt_param_openes.PBTParamOpenESWorkflow class method) (evorl.algorithms.meta.pbt_ppo.param_ppo.ParamPPOWorkflow class method) (evorl.algorithms.meta.pbt_ppo.pbt_cso_param_ppo.PBTCSOParamPPOWorkflow class method) (evorl.algorithms.meta.pbt_ppo.pbt_param_ppo.PBTParamPPOWorkflow class method) (evorl.algorithms.meta.pbt_sac.param_sac.ParamSACWorkflow class method) (evorl.algorithms.meta.pbt_sac.pbt_param_sac.PBTParamSACWorkflow class method) (evorl.algorithms.ppo.PPOWorkflow class method) (evorl.algorithms.random_agent.RandomAgentWorkflow class method) (evorl.algorithms.sac.SACWorkflow class method) (evorl.algorithms.td3.TD3Workflow class method) (evorl.algorithms.td7.TD7Workflow class method) (evorl.workflows.workflow.AbstractWorkflow class method) NestedMeanStd (class in evorl.utils.running_statistics) next_obs (evorl.sample_batch.SampleBatch attribute) noise (evorl.ec.optimizers.ars.ARSState attribute) (evorl.ec.optimizers.openes.OpenESNoiseTableState attribute) (evorl.ec.optimizers.openes.OpenESState attribute) (evorl.ec.optimizers.vanilla_es.VanillaESState attribute) noise_std (evorl.algorithms.meta.pbt_openes.param_openes.OpenES attribute) (evorl.ec.optimizers.ARS attribute) (evorl.ec.optimizers.ars.ARS attribute) (evorl.ec.optimizers.openes.OpenESNoiseTableState attribute) (evorl.ec.optimizers.openes.OpenESState attribute) (evorl.ec.optimizers.vanilla_es.VanillaESState attribute) noise_std_schedule (evorl.ec.optimizers.OpenES attribute) (evorl.ec.optimizers.openes.OpenES attribute) (evorl.ec.optimizers.openes.OpenESNoiseTable attribute) (evorl.ec.optimizers.OpenESNoiseTable attribute) (evorl.ec.optimizers.vanilla_es.VanillaES attribute) (evorl.ec.optimizers.VanillaES attribute) noise_table (evorl.ec.optimizers.openes.OpenESNoiseTableState attribute) noise_table_size (evorl.ec.optimizers.openes.OpenESNoiseTable attribute) (evorl.ec.optimizers.OpenESNoiseTable attribute) norm_layer (evorl.networks.linear.MLP attribute) (evorl.networks.MLP attribute) NORMAL (evorl.envs.wrappers.training_wrapper.AutoresetMode attribute) normalize() (in module evorl.utils.running_statistics) normalize_gae (evorl.algorithms.ppo.PPOAgent attribute) normalize_obs (evorl.algorithms.a2c.A2CAgent property) (evorl.algorithms.contrib.td3_v3.TD3Agent property) (evorl.algorithms.ddpg.DDPGAgent property) (evorl.algorithms.dqn.DQNAgent property) (evorl.algorithms.ec.ec_agent.DeterministicECAgent property) (evorl.algorithms.ec.ec_agent.StochasticECAgent property) (evorl.algorithms.impala.IMPALAAgent property) (evorl.algorithms.ppo.PPOAgent property) (evorl.algorithms.sac.SACAgent property) (evorl.algorithms.sac.SACDiscreteAgent property) (evorl.algorithms.td3.TD3Agent property) (evorl.algorithms.td7.TD7Agent property) NSGA2Workflow (class in evorl.algorithms.ec.mo.nsga2_brax) num_crossover_frac (evorl.ec.operators.MLPCrossover attribute) (evorl.ec.optimizers.erl_ga.ERLGA attribute) (evorl.ec.optimizers.ERLGA attribute) (evorl.ec.optimizers.vanilla_ga.VanillaGA attribute) (evorl.ec.optimizers.VanillaGA attribute) num_elites (evorl.ec.optimizers.ARS attribute) (evorl.ec.optimizers.ars.ARS attribute) (evorl.ec.optimizers.cem.SepCEM attribute) (evorl.ec.optimizers.erl_ga.ERLGA attribute) (evorl.ec.optimizers.ERLGA attribute) (evorl.ec.optimizers.SepCEM attribute) (evorl.ec.optimizers.vanilla_es.VanillaES attribute) (evorl.ec.optimizers.vanilla_ga.VanillaGA attribute) (evorl.ec.optimizers.VanillaES attribute) (evorl.ec.optimizers.VanillaGA attribute) num_mutation_frac (evorl.ec.operators.ERLMutation attribute) (evorl.ec.optimizers.erl_ga.ERLGA attribute) (evorl.ec.optimizers.ERLGA attribute) num_updates_per_iter (evorl.algorithms.erl.cemrl_td3.cemrl_origin.CEMRLTrainMetric attribute) (evorl.algorithms.erl.erl_td3.erl_origin.ERLTrainMetric attribute) O objectives (evorl.metrics.ECTrainMetric attribute) obs (evorl.envs.env.EnvState attribute) (evorl.sample_batch.SampleBatch attribute) obs_preprocessor (evorl.algorithms.a2c.A2CAgent attribute) (evorl.algorithms.contrib.td3_v3.TD3Agent attribute) (evorl.algorithms.ddpg.DDPGAgent attribute) (evorl.algorithms.dqn.DQNAgent attribute) (evorl.algorithms.ec.ec_agent.DeterministicECAgent attribute) (evorl.algorithms.ec.ec_agent.StochasticECAgent attribute) (evorl.algorithms.impala.IMPALAAgent attribute) (evorl.algorithms.ppo.PPOAgent attribute) (evorl.algorithms.sac.SACAgent attribute) (evorl.algorithms.sac.SACDiscreteAgent attribute) (evorl.algorithms.td3.TD3Agent attribute) (evorl.algorithms.td7.TD7Agent attribute) obs_preprocessor_state (evorl.agent.AgentState attribute) obs_space (evorl.envs.brax.BraxAdapter property) (evorl.envs.env.Env property) (evorl.envs.envpool.EnvPoolGymAdapter property) (evorl.envs.gymnasium.GymnasiumAdapter property) (evorl.envs.gymnax.GymnaxAdapter property) (evorl.envs.jaxmarl.JaxMARLAdapter property) (evorl.envs.jumanji.JumanjiAdapter property) (evorl.envs.mujoco_playground.MjxEnvAdapter property) (evorl.envs.wrappers.obs_wrapper.ObsFlattenWrapper property) (evorl.envs.wrappers.ObsFlattenWrapper property) (evorl.envs.wrappers.Wrapper property) (evorl.envs.wrappers.wrapper.Wrapper property) Observation (in module evorl.types) ObsFlattenWrapper (class in evorl.envs.wrappers) (class in evorl.envs.wrappers.obs_wrapper) ObsPreprocessor (class in evorl.algorithms.ec.obs_utils) ObsPreprocessorFn (class in evorl.agent) ObsPreprocessorParams (in module evorl.types) OffPolicyWorkflow (class in evorl.workflows) (class in evorl.workflows.rl_workflow) OffPolicyWorkflowTemplate (class in evorl.algorithms.offpolicy_utils) OneEpisodeWrapper (class in evorl.envs.envpool) (class in evorl.envs.gymnasium) (class in evorl.envs.wrappers) (class in evorl.envs.wrappers.ma_training_wrapper) (class in evorl.envs.wrappers.training_wrapper) OnPolicyWorkflow (class in evorl.workflows) (class in evorl.workflows.rl_workflow) OpenES (class in evorl.algorithms.meta.pbt_openes.param_openes) (class in evorl.ec.evox_algorithm.openes) (class in evorl.ec.optimizers) (class in evorl.ec.optimizers.openes) OpenESNoiseTable (class in evorl.ec.optimizers) (class in evorl.ec.optimizers.openes) OpenESNoiseTableState (class in evorl.ec.optimizers.openes) OpenESState (class in evorl.ec.optimizers.openes) OpenESWorkflow (class in evorl.algorithms.contrib.openes_noise_table) (class in evorl.algorithms.ec.so.openes) opt_state (evorl.ec.optimizers.ars.ARSState attribute) (evorl.ec.optimizers.openes.OpenESNoiseTableState attribute) (evorl.ec.optimizers.openes.OpenESState attribute) optimize_gpu_utilization() (in module evorl.utils.jax_utils) optimizer (evorl.algorithms.meta.pbt_openes.param_openes.OpenES attribute) (evorl.ec.optimizers.ARS attribute) (evorl.ec.optimizers.ars.ARS attribute) (evorl.ec.optimizers.OpenES attribute) (evorl.ec.optimizers.openes.OpenES attribute) (evorl.ec.optimizers.openes.OpenESNoiseTable attribute) (evorl.ec.optimizers.OpenESNoiseTable attribute) optimizer_map (in module evorl.ec.optimizers.utils) optimizer_name (evorl.ec.optimizers.ARS attribute) (evorl.ec.optimizers.ars.ARS attribute) (evorl.ec.optimizers.OpenES attribute) (evorl.ec.optimizers.openes.OpenES attribute) (evorl.ec.optimizers.openes.OpenESNoiseTable attribute) (evorl.ec.optimizers.OpenESNoiseTable attribute) P param_vec_spec (evorl.ec.optimizers.evox_wrapper.EvoXAlgorithmAdapter attribute) ParamOpenESWorkflow (class in evorl.algorithms.meta.pbt_openes.param_openes) ParamPPOAgent (class in evorl.algorithms.meta.pbt_ppo.param_ppo) ParamPPOWorkflow (class in evorl.algorithms.meta.pbt_ppo.param_ppo) params (evorl.agent.AgentState attribute) Params (in module evorl.types) ParamSACAgent (class in evorl.algorithms.meta.pbt_sac.param_sac) ParamSACTrainMetric (class in evorl.algorithms.meta.pbt_sac.param_sac) ParamSACWorkflow (class in evorl.algorithms.meta.pbt_sac.param_sac) ParamVectorSpec (class in evorl.utils.ec_utils) PBTCSOOptState (class in evorl.algorithms.meta.pbt_ppo.pbt_cso_param_ppo) PBTCSOParamPPOWorkflow (class in evorl.algorithms.meta.pbt_ppo.pbt_cso_param_ppo) PBTEvalMetric (class in evorl.algorithms.meta.pbt_workflow) PBTOffpolicyTrainMetric (class in evorl.algorithms.meta.pbt_workflow) PBTOffpolicyWorkflowTemplate (class in evorl.algorithms.meta.pbt_workflow) PBTOptState (class in evorl.algorithms.meta.pbt_workflow) PBTParamOpenESWorkflow (class in evorl.algorithms.meta.pbt_openes.pbt_param_openes) PBTParamPPOWorkflow (class in evorl.algorithms.meta.pbt_ppo.pbt_param_ppo) PBTParamSACWorkflow (class in evorl.algorithms.meta.pbt_sac.pbt_param_sac) PBTTrainMetric (class in evorl.algorithms.meta.pbt_workflow) PBTWorkflow (class in evorl.algorithms.meta.pbt) PBTWorkflowBase (class in evorl.algorithms.meta.pbt_workflow) PBTWorkflowMetric (class in evorl.algorithms.meta.pbt_workflow) PBTWorkflowTemplate (class in evorl.algorithms.meta.pbt_workflow) phi (evorl.ec.evox_algorithm.cso.CSO attribute) pmap_method() (in module evorl.utils.jax_utils) pmax() (in module evorl.distributed) (in module evorl.distributed.comm) pmean() (in module evorl.distributed) (in module evorl.distributed.comm) pmin() (in module evorl.distributed) (in module evorl.distributed.comm) policy_network (evorl.algorithms.a2c.A2CAgent attribute) (evorl.algorithms.ec.ec_agent.DeterministicECAgent attribute) (evorl.algorithms.ec.ec_agent.StochasticECAgent attribute) (evorl.algorithms.impala.IMPALAAgent attribute) (evorl.algorithms.ppo.PPOAgent attribute) policy_noise (evorl.algorithms.contrib.td3_v3.TD3Agent attribute) (evorl.algorithms.td3.TD3Agent attribute) (evorl.algorithms.td7.TD7Agent attribute) policy_obs_key (evorl.algorithms.ppo.PPOAgent attribute) policy_params (evorl.algorithms.a2c.A2CNetworkParams attribute) (evorl.algorithms.ec.ec_agent.ECNetworkParams attribute) (evorl.algorithms.impala.IMPALANetworkParams attribute) (evorl.algorithms.ppo.PPONetworkParams attribute) PolicyExtraInfo (in module evorl.types) pop (evorl.algorithms.meta.pbt_workflow.PBTTrainMetric attribute) (evorl.ec.optimizers.cem.SepCEMState attribute) (evorl.ec.optimizers.erl_ga.ERLGAState attribute) (evorl.ec.optimizers.vanilla_ga.VanillaGAState attribute) pop() (evorl.types.PyTreeDict method) POP_AXIS_NAME (in module evorl.distributed) pop_center_episode_lengths (evorl.algorithms.erl.cemrl_td3.cemrl.EvaluateMetric attribute) (evorl.algorithms.erl.erl_td3.erl_eda.EvaluateMetric attribute) (evorl.algorithms.erl.erl_td3.erl_es.EvaluateMetric attribute) pop_center_episode_returns (evorl.algorithms.erl.cemrl_td3.cemrl.EvaluateMetric attribute) (evorl.algorithms.erl.erl_td3.erl_eda.EvaluateMetric attribute) (evorl.algorithms.erl.erl_td3.erl_es.EvaluateMetric attribute) pop_episode_lengths (evorl.algorithms.erl.cemrl_workflow.CEMRLTrainMetric attribute) (evorl.algorithms.erl.erl_workflow.ERLTrainMetric attribute) (evorl.algorithms.meta.pbt_workflow.PBTEvalMetric attribute) (evorl.algorithms.meta.pbt_workflow.PBTTrainMetric attribute) pop_episode_returns (evorl.algorithms.erl.cemrl_workflow.CEMRLTrainMetric attribute) (evorl.algorithms.erl.erl_workflow.ERLTrainMetric attribute) (evorl.algorithms.meta.pbt_workflow.PBTEvalMetric attribute) (evorl.algorithms.meta.pbt_workflow.PBTTrainMetric attribute) pop_size (evorl.algorithms.meta.pbt_openes.param_openes.OpenES attribute) (evorl.ec.evox_algorithm.cso.CSO attribute) (evorl.ec.optimizers.ARS attribute) (evorl.ec.optimizers.ars.ARS attribute) (evorl.ec.optimizers.cem.SepCEM attribute) (evorl.ec.optimizers.erl_ga.ERLGA attribute) (evorl.ec.optimizers.ERLGA attribute) (evorl.ec.optimizers.OpenES attribute) (evorl.ec.optimizers.openes.OpenES attribute) (evorl.ec.optimizers.openes.OpenESNoiseTable attribute) (evorl.ec.optimizers.OpenESNoiseTable attribute) (evorl.ec.optimizers.SepCEM attribute) (evorl.ec.optimizers.vanilla_es.VanillaES attribute) (evorl.ec.optimizers.vanilla_ga.VanillaGA attribute) (evorl.ec.optimizers.VanillaES attribute) (evorl.ec.optimizers.VanillaGA attribute) pop_train_metrics (evorl.algorithms.meta.pbt_workflow.PBTTrainMetric attribute) PopEpisodicTD3Workflow (class in evorl.algorithms.contrib.pop_episodic_td3) PopPPOWorkflow (class in evorl.algorithms.contrib.pop_ppo) PopTD3Workflow (class in evorl.algorithms.contrib.pop_td3) population (evorl.ec.evox_algorithm.cso.CSOState attribute) PPOAgent (class in evorl.algorithms.ppo) PPONetworkParams (class in evorl.algorithms.ppo) PPOWorkflow (class in evorl.algorithms.ppo) precision (evorl.networks.spectral_norm.SNDense attribute) PrioritizedReplayBuffer (class in evorl.replay_buffers) (class in evorl.replay_buffers.prioritized_replay_buffer) PrioritizedReplayBufferState (class in evorl.replay_buffers) (class in evorl.replay_buffers.prioritized_replay_buffer) priority (evorl.replay_buffers.prioritized_replay_buffer.PrioritizedReplayBufferState attribute) (evorl.replay_buffers.PrioritizedReplayBufferState attribute) psum() (in module evorl.distributed) (in module evorl.distributed.comm) pytree_field() (in module evorl.types) PyTreeArrayMixin (class in evorl.types) PyTreeData (class in evorl.types) PyTreeDict (class in evorl.types) PyTreeNode (class in evorl.types) Q q1 (evorl.algorithms.contrib.td3_v3.TD3TrainMetric attribute) q2 (evorl.algorithms.contrib.td3_v3.TD3TrainMetric attribute) q_network (evorl.algorithms.dqn.DQNAgent attribute) q_params (evorl.algorithms.dqn.DQNNetworkParams attribute) R random_timesteps (evorl.algorithms.ec.obs_utils.ObsPreprocessor attribute) RandomAgent (class in evorl.agent) RandomAgentWorkflow (class in evorl.algorithms.random_agent) RandomTrainMetric (class in evorl.algorithms.random_agent) rank (evorl.workflows.ec_workflow.DistributedInfo attribute) rank_weight_shift (evorl.ec.optimizers.cem.SepCEM attribute) (evorl.ec.optimizers.SepCEM attribute) raw_loss_dict (evorl.algorithms.ddpg.DDPGTrainMetric attribute) (evorl.algorithms.dqn.DQNTrainMetric attribute) (evorl.algorithms.sac.SACTrainMetric attribute) (evorl.algorithms.td3.TD3TrainMetric attribute) (evorl.algorithms.td7.TD7TrainMetric attribute) (evorl.metrics.TrainMetric attribute) rb_size (evorl.algorithms.erl.cemrl_workflow.CEMRLTrainMetric attribute) (evorl.algorithms.erl.erl_workflow.ERLTrainMetric attribute) (evorl.algorithms.meta.pbt_workflow.PBTOffpolicyTrainMetric attribute) reached_preemption() (evorl.utils.orbax_utils.DummyCheckpointManager method) Recorder (class in evorl.recorders) (class in evorl.recorders.recorder) reload() (evorl.utils.orbax_utils.DummyCheckpointManager method) replace() (evorl.types.PyTreeDict method) ReplayBuffer (class in evorl.replay_buffers) (class in evorl.replay_buffers.replay_buffer) ReplayBufferState (class in evorl.replay_buffers) (class in evorl.replay_buffers.replay_buffer) (in module evorl.types) reset() (evorl.envs.brax.BraxAdapter method) (evorl.envs.env.Env method) (evorl.envs.envpool.EnvPoolGymAdapter method) (evorl.envs.gymnasium.GymnasiumAdapter method) (evorl.envs.gymnax.GymnaxAdapter method) (evorl.envs.jaxmarl.JaxMARLAdapter method) (evorl.envs.jaxmarl.MABraxAdapter method) (evorl.envs.jumanji.JumanjiAdapter method) (evorl.envs.mujoco_playground.MjxEnvAdapter method) (evorl.envs.wrappers.EpisodeWrapper method) (evorl.envs.wrappers.FastVmapAutoResetWrapper method) (evorl.envs.wrappers.ma_training_wrapper.EpisodeWrapper method) (evorl.envs.wrappers.ma_training_wrapper.FastVmapAutoResetWrapper method) (evorl.envs.wrappers.ma_training_wrapper.VmapAutoResetWrapper method) (evorl.envs.wrappers.ma_training_wrapper.VmapWrapper method) (evorl.envs.wrappers.obs_wrapper.ObsFlattenWrapper method) (evorl.envs.wrappers.ObsFlattenWrapper method) (evorl.envs.wrappers.reward_wrapper.RewardScaleWrapper method) (evorl.envs.wrappers.reward_wrapper.SparseRewardWrapper method) (evorl.envs.wrappers.RewardScaleWrapper method) (evorl.envs.wrappers.SparseRewardWrapper method) (evorl.envs.wrappers.training_wrapper.EpisodeWrapper method) (evorl.envs.wrappers.training_wrapper.FastVmapAutoResetWrapper method) (evorl.envs.wrappers.training_wrapper.VmapAutoResetWrapper method) (evorl.envs.wrappers.training_wrapper.VmapEnvPoolAutoResetWrapper method) (evorl.envs.wrappers.training_wrapper.VmapWrapper method) (evorl.envs.wrappers.VmapAutoResetWrapper method) (evorl.envs.wrappers.VmapEnvPoolAutoResetWrapper method) (evorl.envs.wrappers.VmapWrapper method) (evorl.envs.wrappers.Wrapper method) (evorl.envs.wrappers.wrapper.Wrapper method) reset_max_priority() (evorl.replay_buffers.prioritized_replay_buffer.PrioritizedReplayBuffer method) (evorl.replay_buffers.PrioritizedReplayBuffer method) reset_prob (evorl.ec.operators.ERLMutation attribute) (evorl.ec.optimizers.erl_ga.ERLGA attribute) (evorl.ec.optimizers.ERLGA attribute) reshape() (evorl.types.PyTreeArrayMixin method) restore() (evorl.utils.orbax_utils.CheckpointManager method) (evorl.utils.orbax_utils.DummyCheckpointManager method) reward (evorl.envs.env.EnvState attribute) Reward (in module evorl.types) RewardDict (in module evorl.types) rewards (evorl.sample_batch.SampleBatch attribute) RewardScaleWrapper (class in evorl.envs.wrappers) (class in evorl.envs.wrappers.reward_wrapper) right_shift_with_padding() (in module evorl.utils.jax_utils) rl_episode_lengths (evorl.algorithms.erl.erl_td3.erl_eda.EvaluateMetric attribute) (evorl.algorithms.erl.erl_td3.erl_es.EvaluateMetric attribute) (evorl.algorithms.erl.erl_td3.erl_ga.EvaluateMetric attribute) (evorl.algorithms.erl.erl_workflow.ERLTrainMetric attribute) rl_episode_returns (evorl.algorithms.erl.erl_td3.erl_eda.EvaluateMetric attribute) (evorl.algorithms.erl.erl_td3.erl_es.EvaluateMetric attribute) (evorl.algorithms.erl.erl_td3.erl_ga.EvaluateMetric attribute) (evorl.algorithms.erl.erl_workflow.ERLTrainMetric attribute) rl_metrics (evorl.algorithms.erl.cemrl_workflow.CEMRLTrainMetric attribute) (evorl.algorithms.erl.erl_workflow.ERLTrainMetric attribute) rl_sampled_timesteps (evorl.algorithms.erl.erl_workflow.WorkflowMetric attribute) RLWorkflow (class in evorl.workflows) (class in evorl.workflows.rl_workflow) rng_split() (in module evorl.utils.jax_utils) rng_split_by_shape() (in module evorl.utils.jax_utils) rng_split_like_tree() (in module evorl.utils.jax_utils) rollout() (evorl.evaluators.episode_collector.EpisodeCollector method) (evorl.evaluators.EpisodeCollector method) (in module evorl.evaluators.ec_evaluator) (in module evorl.rollout) rollout_episode() (in module evorl.algorithms.erl.cemrl_td3.cemrl_td3_workflow) (in module evorl.algorithms.erl.erl_td3.erl_td3_workflow) rollout_fn (evorl.evaluators.ec_evaluator.EpisodeObsCollector attribute) (evorl.evaluators.episode_collector.EpisodeCollector attribute) (evorl.evaluators.EpisodeCollector attribute) (evorl.evaluators.EpisodeObsCollector attribute) rollout_obs() (in module evorl.algorithms.ec.obs_utils) RolloutFn (class in evorl.rollout) RunningStatisticsState (class in evorl.utils.running_statistics) S SACAgent (class in evorl.algorithms.sac) SACDiscreteAgent (class in evorl.algorithms.sac) SACNetworkParams (class in evorl.algorithms.sac) SACTrainMetric (class in evorl.algorithms.sac) SACWorkflow (class in evorl.algorithms.sac) sample() (evorl.envs.space.Box method) (evorl.envs.space.Discrete method) (evorl.envs.space.Space method) (evorl.envs.space.SpaceContainer method) (evorl.replay_buffers.AbstractReplayBuffer method) (evorl.replay_buffers.lap_replay_buffer.LAPReplayBuffer method) (evorl.replay_buffers.LAPReplayBuffer method) (evorl.replay_buffers.prioritized_replay_buffer.PrioritizedReplayBuffer method) (evorl.replay_buffers.PrioritizedReplayBuffer method) (evorl.replay_buffers.replay_buffer.AbstractReplayBuffer method) (evorl.replay_buffers.replay_buffer.ReplayBuffer method) (evorl.replay_buffers.ReplayBuffer method) sample_batch_size (evorl.replay_buffers.replay_buffer.ReplayBuffer attribute) (evorl.replay_buffers.ReplayBuffer attribute) sample_indices (evorl.replay_buffers.prioritized_replay_buffer.PrioritizedReplayBufferState attribute) (evorl.replay_buffers.PrioritizedReplayBufferState attribute) SampleBatch (class in evorl.sample_batch) sampled_episodes (evorl.algorithms.contrib.pop_td3.WorkflowMetric attribute) (evorl.algorithms.erl.cemrl_td3.cemrl_origin.WorkflowMetric attribute) (evorl.algorithms.erl.erl_workflow.WorkflowMetric attribute) (evorl.metrics.ECWorkflowMetric attribute) (evorl.metrics.MultiObjectiveECWorkflowMetric attribute) (evorl.metrics.WorkflowMetric attribute) sampled_timesteps (evorl.algorithms.contrib.pop_td3.WorkflowMetric attribute) (evorl.algorithms.erl.cemrl_td3.cemrl_origin.WorkflowMetric attribute) (evorl.algorithms.erl.erl_workflow.WorkflowMetric attribute) (evorl.metrics.WorkflowMetric attribute) sampled_timesteps_m (evorl.algorithms.meta.pbt_workflow.PBTWorkflowMetric attribute) (evorl.metrics.ECWorkflowMetric attribute) (evorl.metrics.MultiObjectiveECWorkflowMetric attribute) sampled_timesteps_per_agent (evorl.algorithms.contrib.pop_td3.WorkflowMetric attribute) sampled_timesteps_per_iter (evorl.algorithms.erl.cemrl_td3.cemrl_origin.WorkflowMetric attribute) save() (evorl.utils.orbax_utils.CheckpointManager method) (evorl.utils.orbax_utils.DummyCheckpointManager method) (in module evorl.utils.orbax_utils) scan_and_last() (in module evorl.utils.jax_utils) scan_and_mean() (in module evorl.utils.jax_utils) select() (in module evorl.algorithms.meta.pbt_operations) SepCEM (class in evorl.ec.optimizers) (class in evorl.ec.optimizers.cem) SepCEMState (class in evorl.ec.optimizers.cem) SepCEMWorkflow (class in evorl.algorithms.ec.so.sepcem) SepCMAES (class in evorl.ec.evox_algorithm.cmaes) SepCMAESWorkflow (class in evorl.algorithms.ec.so.cmaes) set_frozen_attr() (evorl.types.PyTreeNode method) setup() (evorl.algorithms.contrib.pop_ppo.PopPPOWorkflow method) (evorl.algorithms.contrib.pop_td3.PopTD3Workflow method) (evorl.algorithms.erl.cemrl_workflow.CEMRLWorkflowBase method) (evorl.algorithms.erl.erl_td3.erl_td3_workflow.ERLTD3WorkflowTemplate method) (evorl.algorithms.erl.erl_workflow.ERLWorkflowBase method) (evorl.algorithms.meta.pbt_ppo.param_ppo.ParamPPOWorkflow method) (evorl.algorithms.meta.pbt_sac.param_sac.ParamSACWorkflow method) (evorl.algorithms.meta.pbt_workflow.PBTOffpolicyWorkflowTemplate method) (evorl.algorithms.meta.pbt_workflow.PBTWorkflowBase method) (evorl.algorithms.random_agent.RandomAgentWorkflow method) (evorl.algorithms.td7.TD7Encoder method) (evorl.ec.evox_algorithm.cmaes.CMAES method) (evorl.ec.evox_algorithm.cmaes.SepCMAES method) (evorl.ec.evox_algorithm.cso.CSO method) (evorl.ec.evox_algorithm.openes.OpenES method) (evorl.workflows.ec_workflow.ECWorkflowTemplate method) (evorl.workflows.ECWorkflowTemplate method) (evorl.workflows.OffPolicyWorkflow method) (evorl.workflows.OnPolicyWorkflow method) (evorl.workflows.rl_workflow.OffPolicyWorkflow method) (evorl.workflows.rl_workflow.OnPolicyWorkflow method) (evorl.workflows.Workflow method) (evorl.workflows.workflow.Workflow method) setup_checkpoint_manager() (in module evorl.utils.orbax_utils) setup_env_callback() (evorl.envs.envpool.EnvPoolGymAdapter method) (evorl.envs.gymnasium.GymnasiumAdapter method) shape (evorl.envs.space.Box property) (evorl.envs.space.Discrete property) (evorl.envs.space.Space property) (evorl.envs.space.SpaceContainer property) Shape (in module evorl.networks.spectral_norm) shmap_map() (in module evorl.distributed) (in module evorl.distributed.sharding) shmap_vmap() (in module evorl.distributed) (in module evorl.distributed.sharding) should_save() (evorl.utils.orbax_utils.DummyCheckpointManager method) shuffle_sample_batch() (in module evorl.utils.rl_toolkits) skip_replay_buffer_state() (in module evorl.algorithms.offpolicy_utils) slice() (evorl.types.PyTreeArrayMixin method) sliding_window() (in module evorl.utils.jax_utils) SNDense (class in evorl.networks.spectral_norm) SNMLP (class in evorl.networks) (class in evorl.networks.linear) soft_target_update() (in module evorl.utils.rl_toolkits) sort_by_key() (in module evorl.ec.evox_algorithm.sort_utils) sort_dict() (in module evorl.envs.utils) Space (class in evorl.envs.space) SpaceContainer (class in evorl.envs.space) spaces (evorl.envs.space.SpaceContainer attribute) SparseRewardWrapper (class in evorl.envs.wrappers) (class in evorl.envs.wrappers.reward_wrapper) split_key_to_devices() (in module evorl.distributed) (in module evorl.distributed.comm) State (class in evorl.types) state_action_emb_dim (evorl.algorithms.td7.TD7Critic attribute) state_emb_dim (evorl.algorithms.td7.TD7Actor attribute) static (evorl.algorithms.ec.obs_utils.ObsPreprocessor attribute) StaticLayerNorm (class in evorl.networks) (class in evorl.networks.layer_norm) std (evorl.utils.running_statistics.NestedMeanStd attribute) step() (evorl.algorithms.a2c.A2CWorkflow method) (evorl.algorithms.contrib.pop_episodic_td3.PopEpisodicTD3Workflow method) (evorl.algorithms.contrib.pop_ppo.PopPPOWorkflow method) (evorl.algorithms.contrib.pop_td3.PopTD3Workflow method) (evorl.algorithms.contrib.td3_onpolicy.TD3OnPolicyWorkflow method) (evorl.algorithms.contrib.td3_v2.TD3V2Workflow method) (evorl.algorithms.contrib.td3_v3.TD3V3Workflow method) (evorl.algorithms.ddpg.DDPGWorkflow method) (evorl.algorithms.dqn.DQNWorkflow method) (evorl.algorithms.erl.cemrl_td3.cemrl.CEMRLWorkflow method) (evorl.algorithms.erl.cemrl_td3.cemrl_openes.CEMRLOpenESWorkflow method) (evorl.algorithms.erl.cemrl_td3.cemrl_origin.CEMRLWorkflow method) (evorl.algorithms.erl.erl_td3.erl_eda.ERLEDAWorkflow method) (evorl.algorithms.erl.erl_td3.erl_es.ERLESWorkflow method) (evorl.algorithms.erl.erl_td3.erl_ga.ERLGAWorkflow method) (evorl.algorithms.erl.erl_td3.erl_origin.ERLWorkflow method) (evorl.algorithms.impala.IMPALAWorkflow method) (evorl.algorithms.meta.pbt_ppo.param_ppo.ParamPPOWorkflow method) (evorl.algorithms.meta.pbt_sac.param_sac.ParamSACWorkflow method) (evorl.algorithms.meta.pbt_workflow.PBTOffpolicyWorkflowTemplate method) (evorl.algorithms.meta.pbt_workflow.PBTWorkflowBase method) (evorl.algorithms.ppo.PPOWorkflow method) (evorl.algorithms.random_agent.RandomAgentWorkflow method) (evorl.algorithms.sac.SACWorkflow method) (evorl.algorithms.td3.TD3Workflow method) (evorl.algorithms.td7.TD7Workflow method) (evorl.envs.brax.BraxAdapter method) (evorl.envs.env.Env method) (evorl.envs.envpool.EnvPoolGymAdapter method) (evorl.envs.envpool.OneEpisodeWrapper method) (evorl.envs.gymnasium.GymnasiumAdapter method) (evorl.envs.gymnasium.OneEpisodeWrapper method) (evorl.envs.gymnax.GymnaxAdapter method) (evorl.envs.jaxmarl.JaxMARLAdapter method) (evorl.envs.jaxmarl.MABraxAdapter method) (evorl.envs.jumanji.JumanjiAdapter method) (evorl.envs.mujoco_playground.MjxEnvAdapter method) (evorl.envs.wrappers.action_wrapper.ActionRepeatWrapper method) (evorl.envs.wrappers.action_wrapper.ActionSquashWrapper method) (evorl.envs.wrappers.ActionRepeatWrapper method) (evorl.envs.wrappers.ActionSquashWrapper method) (evorl.envs.wrappers.EpisodeWrapper method) (evorl.envs.wrappers.FastVmapAutoResetWrapper method) (evorl.envs.wrappers.ma_training_wrapper.EpisodeWrapper method) (evorl.envs.wrappers.ma_training_wrapper.FastVmapAutoResetWrapper method) (evorl.envs.wrappers.ma_training_wrapper.OneEpisodeWrapper method) (evorl.envs.wrappers.ma_training_wrapper.VmapAutoResetWrapper method) (evorl.envs.wrappers.ma_training_wrapper.VmapWrapper method) (evorl.envs.wrappers.obs_wrapper.ObsFlattenWrapper method) (evorl.envs.wrappers.ObsFlattenWrapper method) (evorl.envs.wrappers.OneEpisodeWrapper method) (evorl.envs.wrappers.reward_wrapper.RewardScaleWrapper method) (evorl.envs.wrappers.reward_wrapper.SparseRewardWrapper method) (evorl.envs.wrappers.RewardScaleWrapper method) (evorl.envs.wrappers.SparseRewardWrapper method) (evorl.envs.wrappers.training_wrapper.EpisodeWrapper method) (evorl.envs.wrappers.training_wrapper.FastVmapAutoResetWrapper method) (evorl.envs.wrappers.training_wrapper.OneEpisodeWrapper method) (evorl.envs.wrappers.training_wrapper.VmapAutoResetWrapper method) (evorl.envs.wrappers.training_wrapper.VmapEnvPoolAutoResetWrapper method) (evorl.envs.wrappers.training_wrapper.VmapWrapper method) (evorl.envs.wrappers.VmapAutoResetWrapper method) (evorl.envs.wrappers.VmapEnvPoolAutoResetWrapper method) (evorl.envs.wrappers.VmapWrapper method) (evorl.envs.wrappers.Wrapper method) (evorl.envs.wrappers.wrapper.Wrapper method) (evorl.workflows.ec_workflow.ECWorkflowTemplate method) (evorl.workflows.ec_workflow.MultiObjectiveECWorkflowTemplate method) (evorl.workflows.ECWorkflowTemplate method) (evorl.workflows.MultiObjectiveECWorkflowTemplate method) (evorl.workflows.rl_workflow.RLWorkflow method) (evorl.workflows.RLWorkflow method) (evorl.workflows.workflow.AbstractWorkflow method) StochasticECAgent (class in evorl.algorithms.ec.ec_agent) students (evorl.ec.evox_algorithm.cso.CSOState attribute) summed_variance (evorl.utils.running_statistics.RunningStatisticsState attribute) super_mut_prob (evorl.ec.operators.ERLMutation attribute) (evorl.ec.optimizers.erl_ga.ERLGA attribute) (evorl.ec.optimizers.ERLGA attribute) super_mut_strength (evorl.ec.operators.ERLMutation attribute) (evorl.ec.optimizers.erl_ga.ERLGA attribute) (evorl.ec.optimizers.ERLGA attribute) supported_jaxmarl_env_list (in module evorl.envs.jaxmarl) T T (evorl.types.PyTreeArrayMixin property) take() (evorl.types.PyTreeArrayMixin method) TanhTransformedDistribution (class in evorl.distribution) target_actor_params (evorl.algorithms.contrib.td3_v3.TD3NetworkParams attribute) (evorl.algorithms.ddpg.DDPGNetworkParams attribute) (evorl.algorithms.td3.TD3NetworkParams attribute) (evorl.algorithms.td7.TD7NetworkParams attribute) target_critic1_params (evorl.algorithms.contrib.td3_v3.TD3NetworkParams attribute) target_critic2_params (evorl.algorithms.contrib.td3_v3.TD3NetworkParams attribute) target_critic_params (evorl.algorithms.ddpg.DDPGNetworkParams attribute) (evorl.algorithms.sac.SACNetworkParams attribute) (evorl.algorithms.td3.TD3NetworkParams attribute) (evorl.algorithms.td7.TD7NetworkParams attribute) target_entropy_ratio (evorl.algorithms.sac.SACDiscreteAgent attribute) target_q_params (evorl.algorithms.dqn.DQNNetworkParams attribute) target_type (evorl.algorithms.dqn.DQNAgent attribute) TD3Agent (class in evorl.algorithms.contrib.td3_v3) (class in evorl.algorithms.td3) TD3NetworkParams (class in evorl.algorithms.contrib.td3_v3) (class in evorl.algorithms.td3) TD3OnPolicyWorkflow (class in evorl.algorithms.contrib.td3_onpolicy) TD3TrainMetric (class in evorl.algorithms.contrib.td3_v3) (class in evorl.algorithms.td3) TD3V2Workflow (class in evorl.algorithms.contrib.td3_v2) TD3V3Workflow (class in evorl.algorithms.contrib.td3_v3) TD3Workflow (class in evorl.algorithms.td3) TD3WorkflowMod (class in evorl.algorithms.contrib.td3_ep) TD7Actor (class in evorl.algorithms.td7) TD7Agent (class in evorl.algorithms.td7) TD7Critic (class in evorl.algorithms.td7) TD7Encoder (class in evorl.algorithms.td7) TD7NetworkParams (class in evorl.algorithms.td7) TD7TrainMetric (class in evorl.algorithms.td7) TD7Workflow (class in evorl.algorithms.td7) tell() (evorl.algorithms.meta.pbt_openes.param_openes.OpenES method) (evorl.ec.evox_algorithm.cmaes.CMAES method) (evorl.ec.evox_algorithm.cmaes.SepCMAES method) (evorl.ec.evox_algorithm.cso.CSO method) (evorl.ec.evox_algorithm.openes.OpenES method) (evorl.ec.optimizers.ARS method) (evorl.ec.optimizers.ars.ARS method) (evorl.ec.optimizers.cem.SepCEM method) (evorl.ec.optimizers.ec_optimizer.EvoOptimizer method) (evorl.ec.optimizers.erl_ga.ERLGA method) (evorl.ec.optimizers.ERLGA method) (evorl.ec.optimizers.EvoOptimizer method) (evorl.ec.optimizers.evox_wrapper.EvoXAlgorithmAdapter method) (evorl.ec.optimizers.OpenES method) (evorl.ec.optimizers.openes.OpenES method) (evorl.ec.optimizers.openes.OpenESNoiseTable method) (evorl.ec.optimizers.OpenESNoiseTable method) (evorl.ec.optimizers.SepCEM method) (evorl.ec.optimizers.vanilla_es.VanillaES method) (evorl.ec.optimizers.vanilla_ga.VanillaGA method) (evorl.ec.optimizers.VanillaES method) (evorl.ec.optimizers.VanillaGA method) tell_external() (evorl.ec.optimizers.erl_ga.ERLGAMod method) (evorl.ec.optimizers.ERLGAMod method) (evorl.ec.optimizers.vanilla_es.VanillaESMod method) (evorl.ec.optimizers.VanillaESMod method) tfd (in module evorl.distribution) time_cost_per_iter (evorl.algorithms.erl.cemrl_td3.cemrl_origin.CEMRLTrainMetric attribute) (evorl.algorithms.erl.erl_td3.erl_origin.ERLTrainMetric attribute) to_local_dict() (evorl.metrics.MetricBase method) (in module evorl.metrics) to_tree() (evorl.utils.ec_utils.ParamVectorSpec method) to_vector() (evorl.utils.ec_utils.ParamVectorSpec method) tournament_size (evorl.ec.operators.TournamentSelection attribute) (evorl.ec.optimizers.erl_ga.ERLGA attribute) (evorl.ec.optimizers.ERLGA attribute) (evorl.ec.optimizers.vanilla_ga.VanillaGA attribute) (evorl.ec.optimizers.VanillaGA attribute) TournamentSelection (class in evorl.ec.operators) train_episode_return (evorl.metrics.TrainMetric attribute) training_updates (evorl.algorithms.dqn.DQNWorkflowMetric attribute) TrainMetric (class in evorl.metrics) trajectory (evorl.algorithms.meta.pbt_sac.param_sac.ParamSACTrainMetric attribute) (evorl.sample_batch.Episode attribute) tree_astype() (in module evorl.utils.jax_utils) tree_concat() (in module evorl.utils.jax_utils) tree_deepcopy() (in module evorl.utils.jax_utils) tree_device_put() (in module evorl.distributed) (in module evorl.distributed.sharding) tree_flatten() (evorl.types.PyTreeDict method) tree_get() (in module evorl.utils.jax_utils) tree_has_nan() (in module evorl.utils.jax_utils) tree_last() (in module evorl.utils.jax_utils) tree_ones_like() (in module evorl.utils.jax_utils) tree_set() (in module evorl.utils.jax_utils) tree_stop_gradient() (in module evorl.utils.jax_utils) tree_unflatten() (evorl.types.PyTreeDict class method) tree_zeros_like() (in module evorl.utils.jax_utils) truncated_normal_init() (in module evorl.algorithms.meta.pbt_utils) U ub (evorl.ec.evox_algorithm.cso.CSO attribute) unbatchify() (in module evorl.utils.ma_utils) uniform_init() (in module evorl.algorithms.meta.pbt_utils) unwrapped (evorl.envs.env.EnvAdapter property) (evorl.envs.wrappers.Wrapper property) (evorl.envs.wrappers.wrapper.Wrapper property) update() (evorl.types.PyTreeDict method) (in module evorl.utils.running_statistics) update_priority() (evorl.replay_buffers.prioritized_replay_buffer.PrioritizedReplayBuffer method) (evorl.replay_buffers.PrioritizedReplayBuffer method) use_bias (evorl.networks.layer_norm.StaticLayerNorm attribute) (evorl.networks.linear.MLP attribute) (evorl.networks.linear.SNMLP attribute) (evorl.networks.MLP attribute) (evorl.networks.SNMLP attribute) (evorl.networks.spectral_norm.SNDense attribute) (evorl.networks.StaticLayerNorm attribute) use_scale (evorl.networks.layer_norm.StaticLayerNorm attribute) (evorl.networks.StaticLayerNorm attribute) V valid_mask (evorl.sample_batch.Episode property) value_network (evorl.algorithms.a2c.A2CAgent attribute) (evorl.algorithms.impala.IMPALAAgent attribute) (evorl.algorithms.ppo.PPOAgent attribute) value_obs_key (evorl.algorithms.ppo.PPOAgent attribute) value_params (evorl.algorithms.a2c.A2CNetworkParams attribute) (evorl.algorithms.impala.IMPALANetworkParams attribute) (evorl.algorithms.ppo.PPONetworkParams attribute) VanillaES (class in evorl.ec.optimizers) (class in evorl.ec.optimizers.vanilla_es) VanillaESMod (class in evorl.ec.optimizers) (class in evorl.ec.optimizers.vanilla_es) VanillaESState (class in evorl.ec.optimizers.vanilla_es) VanillaESWorkflow (class in evorl.algorithms.ec.so.vanilla_es) VanillaGA (class in evorl.ec.optimizers) (class in evorl.ec.optimizers.vanilla_ga) VanillaGAState (class in evorl.ec.optimizers.vanilla_ga) variance (evorl.ec.optimizers.cem.SepCEMState attribute) vec_relative_prob (evorl.ec.operators.ERLMutation attribute) (evorl.ec.optimizers.erl_ga.ERLGA attribute) (evorl.ec.optimizers.ERLGA attribute) vector_num_mutation_frac (evorl.ec.operators.MLPMutation attribute) (evorl.ec.optimizers.vanilla_ga.VanillaGA attribute) (evorl.ec.optimizers.VanillaGA attribute) velocity (evorl.algorithms.meta.pbt_ppo.pbt_cso_param_ppo.PBTCSOOptState attribute) (evorl.ec.evox_algorithm.cso.CSOState attribute) VmapAutoResetWrapper (class in evorl.envs.wrappers) (class in evorl.envs.wrappers.ma_training_wrapper) (class in evorl.envs.wrappers.training_wrapper) VmapEnvPoolAutoResetWrapper (class in evorl.envs.wrappers) (class in evorl.envs.wrappers.training_wrapper) VmapWrapper (class in evorl.envs.wrappers) (class in evorl.envs.wrappers.ma_training_wrapper) (class in evorl.envs.wrappers.training_wrapper) vtrace_lambda (evorl.algorithms.impala.IMPALAAgent attribute) W wait_until_finished() (evorl.utils.orbax_utils.DummyCheckpointManager method) WandbRecorder (class in evorl.recorders) (class in evorl.recorders.wandb_recorder) warmup_step() (evorl.algorithms.erl.erl_td3.erl_td3_workflow.ERLTD3WorkflowTemplate method) (evorl.algorithms.erl.erl_workflow.ERLWorkflowBase method) weight_decay (evorl.algorithms.meta.pbt_openes.param_openes.OpenES attribute) (evorl.ec.optimizers.OpenES attribute) (evorl.ec.optimizers.openes.OpenES attribute) (evorl.ec.optimizers.openes.OpenESNoiseTable attribute) (evorl.ec.optimizers.OpenESNoiseTable attribute) weight_max_magnitude (evorl.ec.operators.ERLMutation attribute) (evorl.ec.operators.MLPMutation attribute) (evorl.ec.optimizers.erl_ga.ERLGA attribute) (evorl.ec.optimizers.ERLGA attribute) (evorl.ec.optimizers.vanilla_ga.VanillaGA attribute) (evorl.ec.optimizers.VanillaGA attribute) weight_sum() (in module evorl.ec.optimizers.utils) weighted_update (evorl.ec.optimizers.cem.SepCEM attribute) (evorl.ec.optimizers.SepCEM attribute) Workflow (class in evorl.workflows) (class in evorl.workflows.workflow) WorkflowMetric (class in evorl.algorithms.contrib.pop_td3) (class in evorl.algorithms.erl.cemrl_td3.cemrl_origin) (class in evorl.algorithms.erl.erl_workflow) (class in evorl.metrics) world_size (evorl.workflows.ec_workflow.DistributedInfo attribute) Wrapper (class in evorl.envs.wrappers) (class in evorl.envs.wrappers.wrapper) write() (evorl.recorders.ChainRecorder method) (evorl.recorders.log_recorder.LogRecorder method) (evorl.recorders.LogRecorder method) (evorl.recorders.Recorder method) (evorl.recorders.recorder.ChainRecorder method) (evorl.recorders.recorder.Recorder method) (evorl.recorders.wandb_recorder.WandbRecorder method) (evorl.recorders.WandbRecorder method) Z z_s_dim (evorl.algorithms.td7.TD7Actor attribute) (evorl.algorithms.td7.TD7Critic attribute) (evorl.algorithms.td7.TD7Encoder attribute) z_sa_dim (evorl.algorithms.td7.TD7Critic attribute) (evorl.algorithms.td7.TD7Encoder attribute) zs() (evorl.algorithms.td7.TD7Encoder method) zsa() (evorl.algorithms.td7.TD7Encoder method)