algorithm_wrapper#


class AlgorithmWrapperFactory[source]#

Bases: Generic[TAlgorithmOut], ToStringMixin, ABC

abstract create_wrapped_algorithm(policy: Algorithm, envs: Environments, optim_factory: OptimizerFactoryFactory, device: str | device) -> TAlgorithmOut[source]#
class AlgorithmWrapperFactoryIntrinsicCuriosity(*, feature_net_factory: IntermediateModuleFactory, hidden_sizes: Sequence[int], lr: float, lr_scale: float, reward_scale: float, forward_loss_weight: float, optim: OptimizerFactoryFactory | None = None)[source]#

Bases: AlgorithmWrapperFactory[ICMOffPolicyWrapper | ICMOnPolicyWrapper]

create_wrapped_algorithm(algorithm: Algorithm, envs: Environments, optim_factory_default: OptimizerFactoryFactory, device: str | device) -> ICMOffPolicyWrapper | ICMOnPolicyWrapper[source]#