evorl.algorithms.contrib.td3_onpolicy

Module Contents

Classes

Functions

Data

API

evorl.algorithms.contrib.td3_onpolicy.MISSING_LOSS

None

class evorl.algorithms.contrib.td3_onpolicy.TD3OnPolicyWorkflow(env: evorl.envs.Env, agent: evorl.agent.Agent, optimizer: optax.GradientTransformation, evaluator: evorl.evaluators.Evaluator, config: omegaconf.DictConfig)[source]

Bases: evorl.workflows.OnPolicyWorkflow

learn(state: evorl.types.State) -> evorl.types.State[source]
classmethod name()[source]
step(state: evorl.types.State) -> tuple[evorl.metrics.MetricBase, evorl.types.State][source]
evorl.algorithms.contrib.td3_onpolicy.build_rl_update_fn(agent: evorl.agent.Agent, optimizer: optax.GradientTransformation, config: omegaconf.DictConfig)[source]