policy_wrapper


class PolicyWrapperFactory
abstract create_wrapped_policy(policy: BasePolicy, envs: Environments, optim_factory: OptimizerFactory, device: str | device) → TPolicyOut
class PolicyWrapperFactoryIntrinsicCuriosity(*, feature_net_factory: IntermediateModuleFactory, hidden_sizes: Sequence[int], lr: float, lr_scale: float, reward_scale: float, forward_loss_weight: float)
create_wrapped_policy(policy: BasePolicy, envs: Environments, optim_factory: OptimizerFactory, device: str | device) → ICMPolicy