Index A | B | C | D | E | F | G | H | I | J | K | L | M | N | O | P | Q | R | S | T | U | V | W A A2C (class in tianshou.algorithm.modelfree.a2c) A2CAlgorithmFactory (class in tianshou.highlevel.algorithm) A2CExperimentBuilder (class in tianshou.highlevel.experiment) A2CParams (class in tianshou.highlevel.params.algorithm_params) A2CTrainingStats (class in tianshou.algorithm.modelfree.a2c) AbstractContinuousActorDeterministic (class in tianshou.utils.net.continuous) AbstractContinuousActorProbabilistic (class in tianshou.utils.net.common) AbstractContinuousCritic (class in tianshou.utils.net.continuous) AbstractDiscreteActor (class in tianshou.utils.net.common) acc_exp (GailTrainingStats attribute) acc_pi (GailTrainingStats attribute) act (ActBatchProtocol attribute) (CollectActionBatchProtocol attribute) (RolloutBatchProtocol attribute) act_normalized (CollectActionBatchProtocol attribute) ActBatchProtocol (class in tianshou.data.types) action() (ContinuousToDiscrete method) (MultiDiscreteToDiscrete method) action_bound_method (ParamsMixinActionScalingAndBounding attribute) action_dim (ActionSpaceInfo property) ACTION_DIST_KEY (StepHookAddActionDistribution attribute) action_info (SpaceInfo attribute) action_scaling (ParamsMixinActionScaling attribute) action_shape (ActionSpaceInfo attribute) action_space (BaseCollector property) (RandomActor property) action_type (Policy property) ActionReprNet (class in tianshou.utils.net.common) ActionReprNetDataParallelWrapper (class in tianshou.utils.net.common) ActionReprNetWithVectorOutput (class in tianshou.utils.net.common) ActionSpaceInfo (class in tianshou.utils.space_info) actor (ActorFuture attribute) Actor (class in tianshou.utils.net.common) actor_delay (REDQParams attribute) actor_loss (A2CTrainingStats attribute) (BCQTrainingStats attribute) (DDPGTrainingStats attribute) (DiscreteCRRTrainingStats attribute) (NPGTrainingStats attribute) (SACTrainingStats attribute) (TD3TrainingStats attribute) actor_lr (ParamsMixinActorAndCritic attribute) (ParamsMixinActorAndDualCritics attribute) actor_lr_scheduler (ParamsMixinActorAndCritic attribute) (ParamsMixinActorAndDualCritics attribute) actor_optim (ParamsMixinActorAndCritic attribute) (ParamsMixinActorAndDualCritics attribute) ActorCritic (class in tianshou.utils.net.common) ActorCriticOffPolicyAlgorithm (class in tianshou.algorithm.modelfree.ddpg) ActorCriticOnPolicyAlgorithm (class in tianshou.algorithm.modelfree.a2c) ActorCriticOnPolicyAlgorithmFactory (class in tianshou.highlevel.algorithm) ActorCriticOnPolicyParams (class in tianshou.highlevel.params.algorithm_params) ActorDualCriticsOffPolicyAlgorithm (class in tianshou.algorithm.modelfree.td3) ActorDualCriticsOffPolicyAlgorithmFactory (class in tianshou.highlevel.algorithm) ActorFactory (class in tianshou.highlevel.module.actor) ActorFactoryAtariDQN (class in tianshou.env.atari.atari_network) ActorFactoryContinuous (class in tianshou.highlevel.module.actor) ActorFactoryContinuousDeterministicNet (class in tianshou.highlevel.module.actor) ActorFactoryContinuousGaussianNet (class in tianshou.highlevel.module.actor) ActorFactoryDefault (class in tianshou.highlevel.module.actor) ActorFactoryDiscreteNet (class in tianshou.highlevel.module.actor) ActorFactoryTransientStorageDecorator (class in tianshou.highlevel.module.actor) ActorFuture (class in tianshou.highlevel.module.actor) ActorFutureProviderProtocol (class in tianshou.highlevel.module.actor) ActStateBatchProtocol (class in tianshou.data.types) AdamOptimizerFactory (class in tianshou.algorithm.optim) add() (CachedReplayBuffer method) (HERReplayBuffer method) (HERReplayBufferManager method) (MovAvg method) (PrioritizedReplayBuffer method) (ReplayBuffer method) (ReplayBufferManager method) add_discounted_returns() (DiscountedReturnComputation method) add_exploration_noise() (BDQNPolicy method) (ContinuousPolicyWithExplorationNoise method) (DiscreteQLearningPolicy method) (MultiAgentPolicy method) (Policy method) add_lagged_network() (LaggedNetworkCollection method) adv (BatchWithAdvantagesProtocol attribute) advantage_normalization (NPGParams attribute) (PPOParams attribute) agent_idx (MARLDispatcher attribute) Algorithm (class in tianshou.algorithm.algorithm_base) algorithm (World attribute) Algorithm.Optimizer (class in tianshou.algorithm.algorithm_base) AlgorithmFactory (class in tianshou.highlevel.algorithm) algorithms (MARLDispatcher attribute) AlgorithmWrapperFactory (class in tianshou.highlevel.params.algorithm_wrapper) AlgorithmWrapperFactoryIntrinsicCuriosity (class in tianshou.highlevel.params.algorithm_wrapper) alloc_by_keys_diff() (in module tianshou.data.batch) Alpha (class in tianshou.algorithm.modelfree.sac) alpha (ParamsMixinAlpha attribute) (REDQTrainingStats attribute) (SACTrainingStats attribute) alpha_loss (REDQTrainingStats attribute) (SACTrainingStats attribute) apply_values_transform() (Batch method) (BatchProtocol method) assert_continuous() (EnvType method) assert_discrete() (EnvType method) AsyncCollector (class in tianshou.data.collector) AtariEnvFactory (class in tianshou.env.atari.atari_wrapper) AtariEnvFactory.EnvPoolFactoryAtari (class in tianshou.env.atari.atari_wrapper) AtariEpochStopCallback (class in tianshou.env.atari.atari_wrapper) AutoAlpha (class in tianshou.algorithm.modelfree.sac) AutoAlphaFactory (class in tianshou.highlevel.params.alpha) AutoAlphaFactoryDefault (class in tianshou.highlevel.params.alpha) B backend (JoblibConfig attribute) backtrack_coeff (TRPOParams attribute) BaseCollector (class in tianshou.data.collector) BaseLogger (class in tianshou.utils.logger.logger_base) BaseNoise (class in tianshou.exploration.random) BaseVectorEnv (class in tianshou.env.venvs) Batch (class in tianshou.data.batch) batch_size (OfflineTrainerParams attribute) (OffPolicyTrainerParams attribute) (OffPolicyTrainingConfig attribute) (OnPolicyTrainerParams attribute) (OnPolicyTrainingConfig attribute) BatchProtocol (class in tianshou.data.batch) BatchWithAdvantagesProtocol (class in tianshou.data.types) BatchWithReturnsProtocol (class in tianshou.data.types) BCQ (class in tianshou.algorithm.imitation.bcq) BCQPolicy (class in tianshou.algorithm.imitation.bcq) BCQTrainingStats (class in tianshou.algorithm.imitation.bcq) BDQN (class in tianshou.algorithm.modelfree.bdqn) BDQNPolicy (class in tianshou.algorithm.modelfree.bdqn) best_reward (InfoStats attribute) best_reward_std (InfoStats attribute) best_score (InfoStats attribute) BranchingNet (class in tianshou.utils.net.common) buffer (OfflineTrainerParams attribute) buffer_size (TrainingConfig attribute) build() (ExperimentBuilder method) build_and_run() (ExperimentBuilder method) build_seeded_collection() (ExperimentBuilder method) C C51 (class in tianshou.algorithm.modelfree.c51) C51Net (class in tianshou.env.atari.atari_network) C51Policy (class in tianshou.algorithm.modelfree.c51) CachedReplayBuffer (class in tianshou.data.buffer.cached) callback() (EpochTestCallback method) (EpochTestCallbackDQNSetEps method) (EpochTrainCallback method) (EpochTrainCallbackDQNEpsLinearDecay method) (EpochTrainCallbackDQNSetEps method) cat() (Batch static method) (BatchProtocol static method) cat_() (Batch method) (BatchProtocol method) cell (RecurrentStateBatch attribute) change_value() (ParamTransformerActionScaling method) (ParamTransformerChangeValue method) (ParamTransformerFloatEnvParamFactory method) (ParamTransformerNoiseFactory method) check() (TraceDeterminismTest method) ClipRewardEnv (class in tianshou.env.atari.atari_wrapper) close() (BaseCollector method) (BaseVectorEnv method) (Collector method) (EnvWorker method) (PettingZooEnv method) (VectorEnvWrapper method) close_env() (DummyEnvWorker method) (EnvWorker method) (RayEnvWorker method) (SubprocEnvWorker method) CloudpickleWrapper (class in tianshou.env.utils) collect() (BaseCollector method) collect_speed (CollectStats attribute) (LoggedCollectStats attribute) collect_time (CollectStats attribute) (LoggedCollectStats attribute) CollectActionBatchProtocol (class in tianshou.data.collector) collection_step_num_env_steps (OnlineTrainerParams attribute) (OnlineTrainingConfig attribute) (TrainingConfig attribute) collection_step_num_episodes (OnlineTrainerParams attribute) (OnlineTrainingConfig attribute) (TrainingConfig attribute) Collector (class in tianshou.data.collector) CollectorFactory (class in tianshou.highlevel.params.collector) CollectorFactoryDefault (class in tianshou.highlevel.params.collector) CollectStats (class in tianshou.data.collector) CollectStatsBase (class in tianshou.data.collector) CollectStepBatchProtocol (class in tianshou.data.collector) compute_action() (Policy method) compute_action_batch() (RandomActor method) compute_dim_to_summary_stats() (in module tianshou.data.stats) compute_episodic_return() (Algorithm static method) compute_nstep_return() (Algorithm static method) compute_q_value() (C51Policy method) (DiscreteQLearningPolicy method) (QRDQNPolicy method) compute_score_fn (TrainerParams attribute) CONTINUOUS (EnvType attribute) ContinuousActorDeterministic (class in tianshou.utils.net.continuous) ContinuousActorProbabilistic (class in tianshou.utils.net.continuous) ContinuousActorType (class in tianshou.highlevel.module.actor) ContinuousCritic (class in tianshou.utils.net.continuous) ContinuousDeterministicPolicy (class in tianshou.algorithm.modelfree.ddpg) ContinuousEnvironments (class in tianshou.highlevel.env) ContinuousPolicyWithExplorationNoise (class in tianshou.algorithm.modelfree.ddpg) ContinuousToDiscrete (class in tianshou.env.gym_wrappers) copy() (ExperimentBuilder method) correct_log_prob_gaussian_tanh() (in module tianshou.algorithm.modelfree.sac) CosineEmbeddingNetwork (class in tianshou.utils.net.discrete) CQL (class in tianshou.algorithm.imitation.cql) cql_alpha (CQLTrainingStats attribute) cql_alpha_loss (CQLTrainingStats attribute) cql_loss (DiscreteCQLTrainingStats attribute) (DiscreteCRRTrainingStats attribute) CQLTrainingStats (class in tianshou.algorithm.imitation.cql) create_algorithm() (AlgorithmFactory method) create_auto_alpha() (AutoAlphaFactory method) (AutoAlphaFactoryDefault method) create_collector() (CollectorFactory method) (CollectorFactoryDefault method) create_dist_fn() (ActorFactory method) (ActorFactoryAtariDQN method) (ActorFactoryContinuousDeterministicNet method) (ActorFactoryContinuousGaussianNet method) (ActorFactoryDefault method) (ActorFactoryDiscreteNet method) (ActorFactoryTransientStorageDecorator method) (DistributionFunctionFactory method) (DistributionFunctionFactoryCategorical method) (DistributionFunctionFactoryIndependentGaussians method) create_env() (EnvFactory method) create_envs() (EnvFactory method) create_experiment_world() (Experiment method) create_instances() (OptimizerFactory method) create_intermediate_module() (IntermediateModuleFactory method) (IntermediateModuleFactoryAtariDQN method) (IntermediateModuleFactoryFromActorFactory method) create_kwargs() (Params method) create_launcher() (RegisteredExpLauncher method) create_logger() (LoggerFactory method) (LoggerFactoryDefault method) create_lr_scheduler_factory() (LRSchedulerFactoryFactory method) (LRSchedulerFactoryFactoryLinear method) create_module() (ActorFactory method) (ActorFactoryAtariDQN method) (ActorFactoryContinuousDeterministicNet method) (ActorFactoryContinuousGaussianNet method) (ActorFactoryDefault method) (ActorFactoryDiscreteNet method) (ActorFactoryTransientStorageDecorator method) (CriticEnsembleFactory method) (CriticEnsembleFactoryContinuousNet method) (CriticEnsembleFactoryDefault method) (CriticFactory method) (CriticFactoryContinuousNet method) (CriticFactoryDefault method) (CriticFactoryDiscreteNet method) (CriticFactoryReuseActor method) (ImplicitQuantileNetworkFactory method) (IntermediateModuleFactory method) (ModuleFactory method) create_noise() (NoiseFactory method) (NoiseFactoryMaxActionScaledGaussian method) create_optimizer_factory() (OptimizerFactoryFactory method) (OptimizerFactoryFactoryAdam method) (OptimizerFactoryFactoryRMSprop method) (OptimizerFactoryFactoryTorch method) create_policy() (MARLDispatcher method) create_scheduler() (LRSchedulerFactory method) (LRSchedulerFactoryLinear method) create_train_test_collectors() (AlgorithmFactory method) create_trainer() (Algorithm method) (AlgorithmFactory method) (OfflineAlgorithm method) (OffPolicyAlgorithm method) (OffPolicyAlgorithmFactory method) (OnPolicyAlgorithm method) (OnPolicyAlgorithmFactory method) create_uniform_action_dist() (in module tianshou.utils.torch_utils) create_value() (EnvValueFactory method) (FloatEnvValueFactoryMaxActionScaled method) (in module tianshou.data.batch) create_venv() (EnvFactory method) (EnvFactoryRegistered method) (EnvPoolFactory method) (VectorEnvType method) create_wrapped_algorithm() (AlgorithmWrapperFactory method) (AlgorithmWrapperFactoryIntrinsicCuriosity method) critic1_loss (BCQTrainingStats attribute) (SACTrainingStats attribute) (TD3TrainingStats attribute) critic1_lr (ParamsMixinActorAndDualCritics attribute) critic1_lr_scheduler (ParamsMixinActorAndDualCritics attribute) critic1_optim (ParamsMixinActorAndDualCritics attribute) critic2_loss (BCQTrainingStats attribute) (SACTrainingStats attribute) (TD3TrainingStats attribute) critic2_lr (ParamsMixinActorAndDualCritics attribute) critic2_lr_scheduler (ParamsMixinActorAndDualCritics attribute) critic2_optim (ParamsMixinActorAndDualCritics attribute) critic_loss (DDPGTrainingStats attribute) (DiscreteCRRTrainingStats attribute) critic_lr (ParamsMixinActorAndCritic attribute) critic_lr_scheduler (ParamsMixinActorAndCritic attribute) critic_optim (ParamsMixinActorAndCritic attribute) CriticEnsembleFactory (class in tianshou.highlevel.module.critic) CriticEnsembleFactoryContinuousNet (class in tianshou.highlevel.module.critic) CriticEnsembleFactoryDefault (class in tianshou.highlevel.module.critic) CriticFactory (class in tianshou.highlevel.module.critic) CriticFactoryContinuousNet (class in tianshou.highlevel.module.critic) CriticFactoryDefault (class in tianshou.highlevel.module.critic) CriticFactoryDiscreteNet (class in tianshou.highlevel.module.critic) CriticFactoryReuseActor (class in tianshou.highlevel.module.critic) D DataclassPPrintMixin (class in tianshou.utils.print) DataParallelNet (class in tianshou.utils.net.common) DataScope (class in tianshou.utils.logger.logger_base) DDPG (class in tianshou.algorithm.modelfree.ddpg) DDPGAlgorithmFactory (class in tianshou.highlevel.algorithm) DDPGExperimentBuilder (class in tianshou.highlevel.experiment) DDPGParams (class in tianshou.highlevel.params.algorithm_params) DDPGTrainingStats (class in tianshou.algorithm.modelfree.ddpg) decode() (VAE method) default() (OptimizerFactoryFactory static method) default_experiment_execution() (in module tianshou.evaluation.launcher) DEFAULT_HIDDEN_SIZES (ActorFactoryDefault attribute) (CriticEnsembleFactoryDefault attribute) (CriticFactoryDefault attribute) deprecation() (in module tianshou.utils.warning) DETERMINISTIC (ContinuousActorType attribute) deterministic_eval (ParamsMixinDeterministicEval attribute) device (ExperimentConfig attribute) (ParamTransformerData attribute) disc() (GAIL method) disc_loss (GailTrainingStats attribute) DiscountedReturnComputation (class in tianshou.algorithm.modelfree.reinforce) DISCRETE (EnvType attribute) DiscreteActor (class in tianshou.utils.net.discrete) DiscreteActorPolicy (class in tianshou.algorithm.modelfree.reinforce) DiscreteBCQ (class in tianshou.algorithm.imitation.discrete_bcq) DiscreteBCQPolicy (class in tianshou.algorithm.imitation.discrete_bcq) DiscreteBCQTrainingStats (class in tianshou.algorithm.imitation.discrete_bcq) DiscreteCQL (class in tianshou.algorithm.imitation.discrete_cql) DiscreteCQLTrainingStats (class in tianshou.algorithm.imitation.discrete_cql) DiscreteCritic (class in tianshou.utils.net.discrete) DiscreteCriticOnlyOffPolicyAlgorithmFactory (class in tianshou.highlevel.algorithm) DiscreteCRR (class in tianshou.algorithm.imitation.discrete_crr) DiscreteCRRTrainingStats (class in tianshou.algorithm.imitation.discrete_crr) DiscreteEnvironments (class in tianshou.highlevel.env) DiscreteQLearningPolicy (class in tianshou.algorithm.modelfree.dqn) DiscreteSAC (class in tianshou.algorithm.modelfree.discrete_sac) DiscreteSACAlgorithmFactory (class in tianshou.highlevel.algorithm) DiscreteSACExperimentBuilder (class in tianshou.highlevel.experiment) DiscreteSACParams (class in tianshou.highlevel.params.algorithm_params) DiscreteSACPolicy (class in tianshou.algorithm.modelfree.discrete_sac) DiscreteSACTrainingStats (class in tianshou.algorithm.modelfree.discrete_sac) dispatch_process_fn() (MARLDispatcher method) dispatch_update_with_batch() (MARLDispatcher method) dist (CollectActionBatchProtocol attribute) (CollectStepBatchProtocol attribute) (DistBatchProtocol attribute) dist_fn_categorical_from_logits() (in module tianshou.utils.net.discrete) dist_to_atleast_2d() (in module tianshou.data.batch) DistBatchProtocol (class in tianshou.data.types) DistLogProbBatchProtocol (class in tianshou.data.types) DistributionFunctionFactory (class in tianshou.highlevel.params.dist_fn) DistributionFunctionFactoryCategorical (class in tianshou.highlevel.params.dist_fn) DistributionFunctionFactoryIndependentGaussians (class in tianshou.highlevel.params.dist_fn) DQN (class in tianshou.algorithm.modelfree.dqn) DQNAlgorithmFactory (class in tianshou.highlevel.algorithm) DQNet (class in tianshou.env.atari.atari_network) DQNExperimentBuilder (class in tianshou.highlevel.experiment) DQNParams (class in tianshou.highlevel.params.algorithm_params) dropnull() (Batch method) (BatchProtocol method) (ReplayBuffer method) dual_clip (PPOParams attribute) DUMMY (VectorEnvType attribute) DummyEnvWorker (class in tianshou.env.worker.dummy) DummyTqdm (class in tianshou.utils.progress_bar) DummyVectorEnv (class in tianshou.env.venvs) E empty() (Batch static method) (BatchProtocol static method) empty_() (Batch method) (BatchProtocol method) ENABLE_VALIDATION (in module tianshou.config) ensemble_size (REDQParams attribute) EnsembleLinear (class in tianshou.utils.net.common) ent_coef (A2CParams attribute) ent_loss (A2CTrainingStats attribute) entropy_loss (FQFTrainingStats attribute) env_num (BaseCollector property) env_step (EvaluationSequenceEntry attribute) (LoggedCollectStats attribute) EnvFactory (class in tianshou.highlevel.env) EnvFactoryRegistered (class in tianshou.highlevel.env) Environments (class in tianshou.highlevel.env) EnvMode (class in tianshou.highlevel.env) EnvPoolFactory (class in tianshou.highlevel.env) envs (ParamTransformerData attribute) (World attribute) EnvType (class in tianshou.highlevel.env) EnvValueFactory (class in tianshou.highlevel.params.env_param) EnvWorker (class in tianshou.env.worker.worker_base) episode_mc_return_to_go() (in module tianshou.algorithm.algorithm_base) EpisodeBatchProtocol (class in tianshou.data.collector) EpisodeRolloutHook (class in tianshou.data.collector) EpisodeRolloutHookMCReturn (class in tianshou.data.collector) EpisodeRolloutHookMCReturn.OutputDict (class in tianshou.data.collector) EpisodeRolloutHookMerged (class in tianshou.data.collector) EpisodeRolloutHookProtocol (class in tianshou.data.collector) EpisodicLifeEnv (class in tianshou.env.atari.atari_wrapper) epoch (EpochStats attribute) epoch_num_steps (TrainerParams attribute) (TrainingConfig attribute) epoch_stop_callback (TrainerCallbacks attribute) epoch_test_callback (TrainerCallbacks attribute) epoch_train_callback (TrainerCallbacks attribute) EpochStats (class in tianshou.data.stats) EpochStopCallback (class in tianshou.highlevel.trainer) EpochStopCallbackRewardThreshold (class in tianshou.highlevel.trainer) EpochTestCallback (class in tianshou.highlevel.trainer) EpochTestCallbackDQNSetEps (class in tianshou.highlevel.trainer) EpochTrainCallback (class in tianshou.highlevel.trainer) EpochTrainCallbackDQNEpsLinearDecay (class in tianshou.highlevel.trainer) EpochTrainCallbackDQNSetEps (class in tianshou.highlevel.trainer) eps_clip (PPOParams attribute) eps_inference (QLearningOffPolicyParams attribute) eps_training (QLearningOffPolicyParams attribute) eval_results() (MultiRunExperimentResult method) EvalModeModuleWrapper (class in tianshou.utils.lagged_network) EvaluationSequenceEntry (class in tianshou.evaluation.rliable_evaluation) execute_epoch() (Trainer method) exp_dir (MultiRunExperimentResult attribute) exp_name (MultiRunExperimentResult attribute) Experiment (class in tianshou.highlevel.experiment) experiment_config (ExperimentBuilder property) EXPERIMENT_PICKLE_FILENAME (Experiment attribute) ExperimentBuilder (class in tianshou.highlevel.experiment) ExperimentCollection (class in tianshou.highlevel.experiment) ExperimentConfig (class in tianshou.highlevel.experiment) ExperimentResult (class in tianshou.highlevel.experiment) ExpLauncher (class in tianshou.evaluation.launcher) exploration_noise (ParamsMixinExplorationNoise attribute) F f() (NoisyLinear method) filter_messages() (TraceLog method) finalize() (BaseLogger method) (LazyLogger method) (TensorboardLogger method) (WandbLogger method) FireResetEnv (class in tianshou.env.atari.atari_wrapper) FixedAlpha (class in tianshou.algorithm.modelfree.sac) FloatEnvValueFactory (class in tianshou.highlevel.params.env_param) FloatEnvValueFactoryMaxActionScaled (class in tianshou.highlevel.params.env_param) format_log_message() (in module tianshou.utils.determinism) forward() (AbstractContinuousCritic method) (ActionReprNet method) (ActionReprNetDataParallelWrapper method) (BCQPolicy method) (BDQNPolicy method) (BranchingNet method) (C51Net method) (ContinuousActorDeterministic method) (ContinuousActorProbabilistic method) (ContinuousCritic method) (ContinuousDeterministicPolicy method) (CosineEmbeddingNetwork method) (DataParallelNet method) (DiscreteActor method) (DiscreteBCQPolicy method) (DiscreteCritic method) (DiscreteQLearningPolicy method) (DiscreteSACPolicy method) (DQNet method) (EnsembleLinear method) (EvalModeModuleWrapper method) (FQFPolicy method) (FractionProposalNetwork method) (FullQuantileFunction method) (ImitationPolicy method) (ImplicitQuantileNetwork method) (IntrinsicCuriosityModule method) (IQNPolicy method) (MARLRandomDiscreteMaskedOffPolicyAlgorithm.Policy method) (MLP method) (ModuleWithVectorOutputAdapter method) (MultiAgentPolicy method) (Net method) (NoisyLinear method) (Perturbation method) (ProbabilisticActorPolicy method) (PSRLPolicy method) (QRDQNet method) (RainbowNet method) (RandomActionPolicy method) (RandomActor method) (Recurrent method) (RecurrentActorProb method) (RecurrentCritic method) (REDQPolicy method) (SACPolicy method) (ScaledObsInputActionReprNet method) (VAE method) FQF (class in tianshou.algorithm.modelfree.fqf) FQFBatchProtocol (class in tianshou.data.types) FQFPolicy (class in tianshou.algorithm.modelfree.fqf) FQFTrainingStats (class in tianshou.algorithm.modelfree.fqf) fraction_loss (FQFTrainingStats attribute) FractionProposalNetwork (class in tianshou.utils.net.discrete) fractions (FQFBatchProtocol attribute) FrameStack (class in tianshou.env.atari.atari_wrapper) from_data() (ReplayBuffer class method) from_data_dict() (LoggedCollectStats class method) from_directory() (Experiment class method) from_env() (EnvType static method) (SpaceInfo class method) from_factory() (ContinuousEnvironments static method) (DiscreteEnvironments static method) from_factory_and_type() (Environments static method) from_float_or_instance() (Alpha static method) from_hdf5() (in module tianshou.data.utils.converter) from_module() (ModuleWithVectorOutput static method) from_sequence() (SequenceSummaryStats class method) from_single_value() (SequenceSummaryStats class method) from_space() (ActionSpaceInfo class method) (ObservationSpaceInfo class method) from_spaces() (SpaceInfo class method) full_episode_mc_return (EpisodeRolloutHookMCReturn.OutputDict attribute) FULL_EPISODE_MC_RETURN_KEY (EpisodeRolloutHookMCReturn attribute) full_parameter_update() (LaggedNetworkCollection method) FullQuantileFunction (class in tianshou.utils.net.discrete) G gae_lambda (ParamsMixinGeneralAdvantageEstimation attribute) GAIL (class in tianshou.algorithm.imitation.gail) GailTrainingStats (class in tianshou.algorithm.imitation.gail) gamma (ParamsMixinGamma attribute) GAUSSIAN (ContinuousActorType attribute) GaussianNoise (class in tianshou.exploration.random) get() (Batch method) (BatchProtocol method) (MovAvg method) (ParamTransformer static method) (ReplayBuffer method) (ShArray method) get_action_shape() (ContinuousEnvironments method) (DiscreteEnvironments method) (Environments method) get_action_space() (Environments method) get_actor_future() (ActorFutureProviderProtocol method) get_algorithm() (MultiAgentOffPolicyAlgorithm method) (MultiAgentOnPolicyAlgorithm method) get_buffer_indices() (ReplayBuffer method) get_dict_state_decorator() (in module tianshou.utils.net.common) get_env_attr() (BaseVectorEnv method) (DummyEnvWorker method) (EnvWorker method) (RayEnvWorker method) (SubprocEnvWorker method) (VectorEnvWrapper method) get_filename() (PolicyPersistence.Mode method) get_full_log() (TraceLog method) get_keys() (Batch method) (BatchProtocol method) get_len_of_dist() (in module tianshou.data.batch) get_log() (TraceLoggerContext method) get_logger_class() (LoggerFactory method) (LoggerFactoryDefault method) get_loss_stats_dict() (MapTrainingStats method) (TrainingStats method) get_module_with_vector_output() (IntermediateModule method) get_name() (ExpLauncher method) get_obs_rms() (VectorEnvNormObs method) get_observation_shape() (ContinuousEnvironments method) (DiscreteEnvironments method) (Environments method) get_observation_space() (Environments method) get_on_episode_done_hook() (Collector method) get_on_step_hook() (Collector method) get_output_dim() (ContinuousActorDeterministic method) (ModuleWithVectorOutput method) (RandomActor method) get_prefix_sum_idx() (SegmentTree method) get_preprocess_net() (Actor method) (ContinuousActorDeterministic method) (ContinuousActorProbabilistic method) (DiscreteActor method) (RandomActor method) (Recurrent method) get_save_best_fn() (PolicyPersistence method) get_save_checkpoint_fn() (PolicyPersistence method) get_seeding_info_as_str() (Experiment method) get_sliced_dist() (in module tianshou.data.batch) get_space_dtype() (in module tianshou.env.atari.atari_wrapper) get_stddev_from_dist() (in module tianshou.data.collector) get_trainer_fn() (EpochStopCallback method) (EpochTestCallback method) (EpochTrainCallback method) get_type() (ContinuousEnvironments method) (DiscreteEnvironments method) (Environments method) get_weight() (PrioritizedReplayBuffer method) GetParamTransformersProtocol (class in tianshou.highlevel.params.algorithm_params) git_status (TraceDeterminismTest.Result attribute) gradient_steps (A2CTrainingStats attribute) H hasnull() (Batch method) (BatchProtocol method) (ReplayBuffer method) HERReplayBuffer (class in tianshou.data.buffer.her) HERReplayBufferManager (class in tianshou.data.buffer.manager) HERVectorReplayBuffer (class in tianshou.data.buffer.vecbuf) hidden (RecurrentStateBatch attribute) hidden_sizes (IQNParams attribute) hidden_state (CollectActionBatchProtocol attribute) huber_loss_delta (DQNParams attribute) I i_loss (DiscreteBCQTrainingStats attribute) ICMOffPolicyWrapper (class in tianshou.algorithm.modelbased.icm) ICMOnPolicyWrapper (class in tianshou.algorithm.modelbased.icm) ICMTrainingStats (class in tianshou.algorithm.modelbased.icm) imitation_logits (ImitationBatchProtocol attribute) ImitationBatchProtocol (class in tianshou.data.types) ImitationLearningAlgorithmMixin (class in tianshou.algorithm.imitation.imitation_base) ImitationPolicy (class in tianshou.algorithm.imitation.imitation_base) ImitationTrainingStats (class in tianshou.algorithm.imitation.imitation_base) ImplicitQuantileNetwork (class in tianshou.utils.net.discrete) ImplicitQuantileNetworkFactory (class in tianshou.highlevel.module.special) INFO (DataScope attribute) info (ObsBatchProtocol attribute) info() (ContinuousEnvironments method) (Environments method) info_stat (EpochStats attribute) InfoStats (class in tianshou.data.stats) init_linear_orthogonal() (in module tianshou.highlevel.module.core) init_weight() (PrioritizedReplayBuffer method) IntermediateModule (class in tianshou.highlevel.module.intermediate) IntermediateModuleFactory (class in tianshou.highlevel.module.intermediate) IntermediateModuleFactoryAtariDQN (class in tianshou.env.atari.atari_network) IntermediateModuleFactoryAtariDQNFeatures (class in tianshou.env.atari.atari_network) IntermediateModuleFactoryFromActorFactory (class in tianshou.highlevel.module.actor) IntrinsicCuriosityModule (class in tianshou.utils.net.discrete) iqm (EvaluationSequenceEntry attribute) iqm_confidence_interval (EvaluationSequenceEntry attribute) IQN (class in tianshou.algorithm.modelfree.iqn) IQNAlgorithmFactory (class in tianshou.highlevel.algorithm) IQNExperimentBuilder (class in tianshou.highlevel.experiment) IQNParams (class in tianshou.highlevel.params.algorithm_params) IQNPolicy (class in tianshou.algorithm.modelfree.iqn) is_continuous() (EnvType method) is_discrete (RandomActor property) is_discrete() (EnvType method) is_double (DQNParams attribute) is_enabled (TraceLogger attribute) is_within_training_step (Policy attribute) isnull() (Batch method) (BatchProtocol method) (ReplayBuffer method) J JOBLIB (RegisteredExpLauncher attribute) JoblibConfig (class in tianshou.evaluation.launcher) JoblibExpLauncher (class in tianshou.evaluation.launcher) K kl (NPGTrainingStats attribute) L LaggedNetworkAlgorithmMixin (class in tianshou.algorithm.algorithm_base) LaggedNetworkCollection (class in tianshou.utils.lagged_network) LaggedNetworkFullUpdateAlgorithmMixin (class in tianshou.algorithm.algorithm_base) LaggedNetworkPair (class in tianshou.utils.lagged_network) LaggedNetworkPolyakUpdateAlgorithmMixin (class in tianshou.algorithm.algorithm_base) launch() (ExpLauncher method) layer_init() (in module tianshou.env.atari.atari_network) LazyLogger (class in tianshou.utils.logger.logger_base) lens (CollectStats attribute) lens_stat (CollectStats attribute) (LoggedCollectStats attribute) load() (WandbLogger method) load_and_eval_experiment() (in module tianshou.evaluation.rliable_evaluation) load_from_disk() (MultiRunExperimentResult class method) load_hdf5() (ReplayBuffer class method) load_state_dict() (Algorithm method) (Algorithm.Optimizer method) log (TraceDeterminismTest.Result attribute) log() (TraceLogger class method) log_buffer (TraceLogger attribute) log_file_enabled (ExperimentConfig attribute) LOG_FILENAME (Experiment attribute) log_formatter (TraceLogger attribute) log_info_data() (BaseLogger method) LOG_LEVEL (TraceLogger attribute) log_lines (TraceLog attribute) log_prob (DistLogProbBatchProtocol attribute) log_test_data() (BaseLogger method) log_training_data() (BaseLogger method) log_update_data() (BaseLogger method) LoggedCollectStats (class in tianshou.evaluation.rliable_evaluation) LoggedSummaryData (class in tianshou.evaluation.rliable_evaluation) logger (TrainerParams attribute) (World attribute) LoggerFactory (class in tianshou.highlevel.logger) LoggerFactoryDefault (class in tianshou.highlevel.logger) logits (ModelOutputBatchProtocol attribute) logp_old (LogpOldProtocol attribute) LogpOldProtocol (class in tianshou.data.types) loss (A2CTrainingStats attribute) (ImitationTrainingStats attribute) (LossSequenceTrainingStats attribute) (RainbowTrainingStats attribute) (SimpleLossTrainingStats attribute) LossSequenceTrainingStats (class in tianshou.algorithm.modelfree.reinforce) lr (ParamsMixinSingleModel attribute) lr_scheduler (ParamsMixinSingleModel attribute) LRSchedulerFactory (class in tianshou.algorithm.optim) LRSchedulerFactoryFactory (class in tianshou.highlevel.params.lr_scheduler) LRSchedulerFactoryFactoryLinear (class in tianshou.highlevel.params.lr_scheduler) LRSchedulerFactoryLinear (class in tianshou.algorithm.optim) M make_atari_env() (in module tianshou.env.atari.atari_wrapper) MalformedBufferError map_action() (Policy method) map_action_inverse() (Policy method) MAPRolloutBatchProtocol (class in tianshou.algorithm.multiagent.marl) MapTrainingStats (class in tianshou.algorithm.multiagent.marl) MARLDispatcher (class in tianshou.algorithm.multiagent.marl) MARLRandomDiscreteMaskedOffPolicyAlgorithm (class in tianshou.algorithm.random) MARLRandomDiscreteMaskedOffPolicyAlgorithm.Policy (class in tianshou.algorithm.random) MARLRandomTrainingStats (class in tianshou.algorithm.random) max (LoggedSummaryData attribute) (SequenceSummaryStats attribute) max_action (ActionSpaceInfo attribute) max_backtracks (TRPOParams attribute) max_batchsize (ParamsMixinGeneralAdvantageEstimation attribute) max_epochs (TrainerParams attribute) (TrainingConfig attribute) max_grad_norm (A2CParams attribute) max_kl (TRPOParams attribute) MaxActionScaled (class in tianshou.highlevel.params.env_param) MaxActionScaledGaussian (class in tianshou.highlevel.params.noise) MaxAndSkipEnv (class in tianshou.env.atari.atari_wrapper) mc_return_to_go (EpisodeRolloutHookMCReturn.OutputDict attribute) MC_RETURN_TO_GO_KEY (EpisodeRolloutHookMCReturn attribute) mean (LoggedSummaryData attribute) (SequenceSummaryStats attribute) mean() (MovAvg method) MESSAGE_TAG (TraceLogger attribute) min (LoggedSummaryData attribute) (SequenceSummaryStats attribute) min_action (ActionSpaceInfo attribute) miniblock() (in module tianshou.utils.net.common) MLP (class in tianshou.utils.net.common) ModelOutputBatchProtocol (class in tianshou.data.types) module tianshou.algorithm.algorithm_base tianshou.algorithm.imitation.bcq tianshou.algorithm.imitation.cql tianshou.algorithm.imitation.discrete_bcq tianshou.algorithm.imitation.discrete_cql tianshou.algorithm.imitation.discrete_crr tianshou.algorithm.imitation.gail tianshou.algorithm.imitation.imitation_base tianshou.algorithm.imitation.td3_bc tianshou.algorithm.modelbased.icm tianshou.algorithm.modelbased.psrl tianshou.algorithm.modelfree.a2c tianshou.algorithm.modelfree.bdqn tianshou.algorithm.modelfree.c51 tianshou.algorithm.modelfree.ddpg tianshou.algorithm.modelfree.discrete_sac tianshou.algorithm.modelfree.dqn tianshou.algorithm.modelfree.fqf tianshou.algorithm.modelfree.iqn tianshou.algorithm.modelfree.npg tianshou.algorithm.modelfree.ppo tianshou.algorithm.modelfree.qrdqn tianshou.algorithm.modelfree.rainbow tianshou.algorithm.modelfree.redq tianshou.algorithm.modelfree.reinforce tianshou.algorithm.modelfree.sac tianshou.algorithm.modelfree.td3 tianshou.algorithm.modelfree.trpo tianshou.algorithm.multiagent.marl tianshou.algorithm.optim tianshou.algorithm.random tianshou.config tianshou.data.batch tianshou.data.buffer.buffer_base tianshou.data.buffer.cached tianshou.data.buffer.her tianshou.data.buffer.manager tianshou.data.buffer.prio tianshou.data.buffer.vecbuf tianshou.data.collector tianshou.data.stats tianshou.data.types tianshou.data.utils.converter tianshou.data.utils.segtree tianshou.env.atari.atari_network tianshou.env.atari.atari_wrapper tianshou.env.gym_wrappers tianshou.env.pettingzoo_env tianshou.env.utils tianshou.env.venv_wrappers tianshou.env.venvs tianshou.env.worker.dummy tianshou.env.worker.ray tianshou.env.worker.subproc tianshou.env.worker.worker_base tianshou.evaluation.launcher tianshou.evaluation.rliable_evaluation tianshou.exploration.random tianshou.highlevel.algorithm tianshou.highlevel.config tianshou.highlevel.env tianshou.highlevel.experiment tianshou.highlevel.logger tianshou.highlevel.module.actor tianshou.highlevel.module.core tianshou.highlevel.module.critic tianshou.highlevel.module.intermediate tianshou.highlevel.module.special tianshou.highlevel.params.algorithm_params tianshou.highlevel.params.algorithm_wrapper tianshou.highlevel.params.alpha tianshou.highlevel.params.collector tianshou.highlevel.params.dist_fn tianshou.highlevel.params.env_param tianshou.highlevel.params.lr_scheduler tianshou.highlevel.params.noise tianshou.highlevel.params.optim tianshou.highlevel.persistence tianshou.highlevel.trainer tianshou.highlevel.world tianshou.trainer tianshou.utils.conversion tianshou.utils.determinism tianshou.utils.lagged_network tianshou.utils.logger.logger_base tianshou.utils.logger.tensorboard tianshou.utils.logger.wandb tianshou.utils.logging tianshou.utils.net.common tianshou.utils.net.continuous tianshou.utils.net.discrete tianshou.utils.print tianshou.utils.progress_bar tianshou.utils.space_info tianshou.utils.statistics tianshou.utils.torch_utils tianshou.utils.warning module (IntermediateModule attribute) ModuleFactory (class in tianshou.highlevel.module.core) ModuleWithVectorOutput (class in tianshou.utils.net.common) ModuleWithVectorOutputAdapter (class in tianshou.utils.net.common) MovAvg (class in tianshou.utils.statistics) multi_agent_return_reduction (TrainerParams attribute) MultiAgentOffPolicyAlgorithm (class in tianshou.algorithm.multiagent.marl) MultiAgentOnPolicyAlgorithm (class in tianshou.algorithm.multiagent.marl) MultiAgentPolicy (class in tianshou.algorithm.multiagent.marl) MultiDiscreteToDiscrete (class in tianshou.env.gym_wrappers) MultiRunExperimentResult (class in tianshou.evaluation.rliable_evaluation) N n_collected_episodes (CollectStatsBase attribute) (LoggedCollectStats attribute) n_collected_steps (CollectStatsBase attribute) (LoggedCollectStats attribute) n_jobs (JoblibConfig attribute) n_step_return_horizon (ParamsMixinNStepReturnHorizon attribute) Net (class in tianshou.utils.net.common) next() (ReplayBuffer method) (ReplayBufferManager method) noise_clip (TD3Params attribute) NoiseFactory (class in tianshou.highlevel.params.noise) NoiseFactoryMaxActionScaledGaussian (class in tianshou.highlevel.params.noise) NoisyLinear (class in tianshou.utils.net.discrete) NoopResetEnv (class in tianshou.env.atari.atari_wrapper) norm() (RunningMeanStd method) NPG (class in tianshou.algorithm.modelfree.npg) NPGAlgorithmFactory (class in tianshou.highlevel.algorithm) NPGExperimentBuilder (class in tianshou.highlevel.experiment) NPGParams (class in tianshou.highlevel.params.algorithm_params) NPGTrainingStats (class in tianshou.algorithm.modelfree.npg) num_cosines (IQNParams attribute) num_quantiles (IQNParams attribute) num_test_envs (TrainingConfig attribute) num_training_envs (TrainingConfig attribute) O obs (ObsBatchProtocol attribute) obs_dim (ObservationSpaceInfo property) obs_next (RolloutBatchProtocol attribute) obs_shape (ObservationSpaceInfo attribute) ObsBatchProtocol (class in tianshou.data.types) observation() (ScaledFloatFrame method) (WarpFrame method) observation_info (SpaceInfo attribute) ObservationSpaceInfo (class in tianshou.utils.space_info) observe() (PSRLModel method) OfflineAlgorithm (class in tianshou.algorithm.algorithm_base) OfflineImitationLearning (class in tianshou.algorithm.imitation.imitation_base) OfflineTrainer (class in tianshou.trainer) OfflineTrainerParams (class in tianshou.trainer) OffPolicyAlgorithm (class in tianshou.algorithm.algorithm_base) OffPolicyAlgorithmFactory (class in tianshou.highlevel.algorithm) OffPolicyExperimentBuilder (class in tianshou.highlevel.experiment) OffPolicyImitationLearning (class in tianshou.algorithm.imitation.imitation_base) OffPolicyTrainer (class in tianshou.trainer) OffPolicyTrainerParams (class in tianshou.trainer) OffPolicyTrainingConfig (class in tianshou.highlevel.config) OffPolicyWrapperAlgorithm (class in tianshou.algorithm.algorithm_base) online_sample_size (IQNParams attribute) OnlineTrainer (class in tianshou.trainer) OnlineTrainerParams (class in tianshou.trainer) OnlineTrainingConfig (class in tianshou.highlevel.config) OnPolicyAlgorithm (class in tianshou.algorithm.algorithm_base) OnPolicyAlgorithmFactory (class in tianshou.highlevel.algorithm) OnPolicyAlgorithmParams (class in tianshou.highlevel.params.algorithm_params) OnPolicyExperimentBuilder (class in tianshou.highlevel.experiment) OnPolicyTrainer (class in tianshou.trainer) OnPolicyTrainerParams (class in tianshou.trainer) OnPolicyTrainingConfig (class in tianshou.highlevel.config) OnPolicyWrapperAlgorithm (class in tianshou.algorithm.algorithm_base) optim (ParamsMixinSingleModel attribute) optim_critic_iters (NPGParams attribute) optim_factory_default (ParamTransformerData attribute) OptimizerFactory (class in tianshou.algorithm.optim) OptimizerFactoryFactory (class in tianshou.highlevel.params.optim) OptimizerFactoryFactoryAdam (class in tianshou.highlevel.params.optim) OptimizerFactoryFactoryRMSprop (class in tianshou.highlevel.params.optim) OptimizerFactoryFactoryTorch (class in tianshou.highlevel.params.optim) OptimizerWithLearningRateProtocol (class in tianshou.highlevel.params.optim) OUNoise (class in tianshou.exploration.random) output_dim (IntermediateModule attribute) P Params (class in tianshou.highlevel.params.algorithm_params) ParamsMixinActionScaling (class in tianshou.highlevel.params.algorithm_params) ParamsMixinActionScalingAndBounding (class in tianshou.highlevel.params.algorithm_params) ParamsMixinActorAndCritic (class in tianshou.highlevel.params.algorithm_params) ParamsMixinActorAndDualCritics (class in tianshou.highlevel.params.algorithm_params) ParamsMixinAlpha (class in tianshou.highlevel.params.algorithm_params) ParamsMixinDeterministicEval (class in tianshou.highlevel.params.algorithm_params) ParamsMixinExplorationNoise (class in tianshou.highlevel.params.algorithm_params) ParamsMixinGamma (class in tianshou.highlevel.params.algorithm_params) ParamsMixinGeneralAdvantageEstimation (class in tianshou.highlevel.params.algorithm_params) ParamsMixinNStepReturnHorizon (class in tianshou.highlevel.params.algorithm_params) ParamsMixinSingleModel (class in tianshou.highlevel.params.algorithm_params) ParamsMixinTau (class in tianshou.highlevel.params.algorithm_params) ParamTransformer (class in tianshou.highlevel.params.algorithm_params) ParamTransformerActionScaling (class in tianshou.highlevel.params.algorithm_params) ParamTransformerAutoAlpha (class in tianshou.highlevel.params.algorithm_params) ParamTransformerChangeValue (class in tianshou.highlevel.params.algorithm_params) ParamTransformerData (class in tianshou.highlevel.params.algorithm_params) ParamTransformerDrop (class in tianshou.highlevel.params.algorithm_params) ParamTransformerFloatEnvParamFactory (class in tianshou.highlevel.params.algorithm_params) ParamTransformerNoiseFactory (class in tianshou.highlevel.params.algorithm_params) ParamTransformerOptimFactory (class in tianshou.highlevel.params.algorithm_params) ParamTransformerRename (class in tianshou.highlevel.params.algorithm_params) persist() (Persistence method) (PersistenceGroup method) (PolicyPersistence method) persist_directory (World attribute) persist_path() (World method) PERSIST_POLICY (PersistEvent attribute) Persistence (class in tianshou.highlevel.persistence) persistence_base_dir (ExperimentConfig attribute) persistence_dir_static() (Experiment static method) persistence_enabled (ExperimentConfig attribute) PersistenceGroup (class in tianshou.highlevel.persistence) PersistEvent (class in tianshou.highlevel.persistence) Perturbation (class in tianshou.utils.net.continuous) PettingZooEnv (class in tianshou.env.pettingzoo_env) Policy (class in tianshou.algorithm.algorithm_base) POLICY (PolicyPersistence.Mode attribute) policy_entry (CollectActionBatchProtocol attribute) policy_noise (TD3Params attribute) policy_persistence_mode (ExperimentConfig attribute) policy_restore_directory (ExperimentConfig attribute) POLICY_STATE_DICT (PolicyPersistence.Mode attribute) policy_within_training_step() (in module tianshou.utils.torch_utils) PolicyPersistence (class in tianshou.highlevel.persistence) PolicyPersistence.Mode (class in tianshou.highlevel.persistence) polyak_parameter_update() (in module tianshou.utils.lagged_network) (LaggedNetworkCollection method) pop() (Batch method) (BatchProtocol method) PPO (class in tianshou.algorithm.modelfree.ppo) PPOAlgorithmFactory (class in tianshou.highlevel.algorithm) PPOExperimentBuilder (class in tianshou.highlevel.experiment) PPOParams (class in tianshou.highlevel.params.algorithm_params) pprint_asdict() (DataclassPPrintMixin method) pprints_asdict() (DataclassPPrintMixin method) pred_dist_std_array (CollectStats attribute) pred_dist_std_array_stat (CollectStats attribute) prepare_dict_for_logging() (BaseLogger method) (LazyLogger method) (TensorboardLogger method) (WandbLogger method) prev() (ReplayBuffer method) (ReplayBufferManager method) print_log() (TraceLog method) PrioBatchProtocol (class in tianshou.data.types) PrioritizedReplayBuffer (class in tianshou.data.buffer.prio) PrioritizedReplayBufferManager (class in tianshou.data.buffer.manager) PrioritizedVectorReplayBuffer (class in tianshou.data.buffer.vecbuf) ProbabilisticActorPolicy (class in tianshou.algorithm.modelfree.reinforce) process_buffer() (CQL method) (OfflineAlgorithm method) ProtocolCalledException PSRL (class in tianshou.algorithm.modelbased.psrl) psrl_rew_mean (PSRLTrainingStats attribute) psrl_rew_std (PSRLTrainingStats attribute) PSRLModel (class in tianshou.algorithm.modelbased.psrl) PSRLPolicy (class in tianshou.algorithm.modelbased.psrl) PSRLTrainingStats (class in tianshou.algorithm.modelbased.psrl) Q q_loss (DiscreteBCQTrainingStats attribute) q_value (ImitationBatchProtocol attribute) QLearningOffPolicyAlgorithm (class in tianshou.algorithm.modelfree.dqn) QLearningOffPolicyParams (class in tianshou.highlevel.params.algorithm_params) qr_loss (DiscreteCQLTrainingStats attribute) QRDQN (class in tianshou.algorithm.modelfree.qrdqn) QRDQNet (class in tianshou.env.atari.atari_network) QRDQNPolicy (class in tianshou.algorithm.modelfree.qrdqn) quantile_loss (FQFTrainingStats attribute) QuantileRegressionBatchProtocol (class in tianshou.data.types) quantiles_tau (FQFBatchProtocol attribute) R RainbowDQN (class in tianshou.algorithm.modelfree.rainbow) RainbowNet (class in tianshou.env.atari.atari_network) RainbowTrainingStats (class in tianshou.algorithm.modelfree.rainbow) RandomActionPolicy (class in tianshou.algorithm.algorithm_base) RandomActor (class in tianshou.utils.net.common) RAY (VectorEnvType attribute) RayEnvWorker (class in tianshou.env.worker.ray) RayVectorEnv (class in tianshou.env.venvs) recompute_advantage (PPOParams attribute) Recurrent (class in tianshou.utils.net.common) RecurrentActorProb (class in tianshou.utils.net.continuous) RecurrentCritic (class in tianshou.utils.net.continuous) RecurrentStateBatch (class in tianshou.data.types) recv() (EnvWorker method) (RayEnvWorker method) (SubprocEnvWorker method) REDQ (class in tianshou.algorithm.modelfree.redq) REDQAlgorithmFactory (class in tianshou.highlevel.algorithm) REDQExperimentBuilder (class in tianshou.highlevel.experiment) REDQParams (class in tianshou.highlevel.params.algorithm_params) REDQPolicy (class in tianshou.algorithm.modelfree.redq) REDQTrainingStats (class in tianshou.algorithm.modelfree.redq) reduce() (SegmentTree method) reduce_log_to_messages() (TraceLog method) refresh_all_sequence_stats() (CollectStats method) refresh_len_stats() (CollectStats method) refresh_return_stats() (CollectStats method) refresh_std_array_stats() (CollectStats method) reg_loss (DiscreteBCQTrainingStats attribute) RegisteredExpLauncher (class in tianshou.evaluation.launcher) Reinforce (class in tianshou.algorithm.modelfree.reinforce) ReinforceAlgorithmFactory (class in tianshou.highlevel.algorithm) ReinforceExperimentBuilder (class in tianshou.highlevel.experiment) ReinforceParams (class in tianshou.highlevel.params.algorithm_params) render() (BaseVectorEnv method) (DummyEnvWorker method) (EnvWorker method) (PettingZooEnv method) (RayEnvWorker method) (SubprocEnvWorker method) (VectorEnvWrapper method) replace_empty_batches_by_none() (Batch method) replay_buffer_ignore_obs_next (TrainingConfig attribute) replay_buffer_save_only_last_obs (TrainingConfig attribute) replay_buffer_stack_num (TrainingConfig attribute) ReplayBuffer (class in tianshou.data.buffer.buffer_base) ReplayBufferManager (class in tianshou.data.buffer.manager) reset() (AsyncCollector method) (BaseCollector method) (BaseNoise method) (BaseVectorEnv method) (DummyEnvWorker method) (EnvWorker method) (EpisodicLifeEnv method) (FireResetEnv method) (FrameStack method) (GaussianNoise method) (HERReplayBuffer method) (NoisyLinear method) (NoopResetEnv method) (OnlineTrainer method) (OUNoise method) (PettingZooEnv method) (RayEnvWorker method) (ReplayBuffer method) (ReplayBufferManager method) (SubprocEnvWorker method) (Trainer method) (VectorEnvNormObs method) (VectorEnvWrapper method) reset_buffer() (BaseCollector method) reset_env() (AsyncCollector method) (BaseCollector method) (Collector method) reset_stat() (BaseCollector method) restore() (Persistence method) (PersistenceGroup method) (PolicyPersistence method) restore_data() (BaseLogger method) (LazyLogger method) (TensorboardLogger method) (WandbLogger method) restore_directory (World attribute) restore_logged_data() (BaseLogger static method) (LazyLogger static method) (TensorboardLogger static method) (WandbLogger static method) restore_path() (World method) RESTORE_POLICY (RestoreEvent attribute) RestoreEvent (class in tianshou.highlevel.persistence) resume_from_log (TrainerParams attribute) return_scaling (ActorCriticOnPolicyParams attribute) return_standardization (ReinforceParams attribute) returns (BatchWithReturnsProtocol attribute) (CollectStats attribute) returns_stat (CollectStats attribute) (LoggedCollectStats attribute) rew (EvaluationSequenceEntry attribute) (RolloutBatchProtocol attribute) rew_std (EvaluationSequenceEntry attribute) reward() (ClipRewardEnv method) rewrite_transitions() (HERReplayBuffer method) RMSpropOptimizerFactory (class in tianshou.algorithm.optim) RolloutBatchProtocol (class in tianshou.data.types) run() (Experiment method) (ExperimentCollection method) (Trainer method) run_on_episode_done() (Collector method) run_on_step_hook() (Collector method) run_training() (Algorithm method) (OfflineAlgorithm method) RunningMeanStd (class in tianshou.utils.statistics) S SAC (class in tianshou.algorithm.modelfree.sac) SACAlgorithmFactory (class in tianshou.highlevel.algorithm) SACExperimentBuilder (class in tianshou.highlevel.experiment) SACParams (class in tianshou.highlevel.params.algorithm_params) SACPolicy (class in tianshou.algorithm.modelfree.sac) SACTrainingStats (class in tianshou.algorithm.modelfree.sac) sample() (NoisyLinear method) (PrioritizedReplayBuffer method) (ReplayBuffer method) sample_indices() (HERReplayBuffer method) (PrioritizedReplayBuffer method) (ReplayBuffer method) (ReplayBufferManager method) sample_reward() (PSRLModel method) sample_size (IQNParams attribute) sample_trans_prob() (PSRLModel method) save() (Experiment method) (ShArray method) save_best_fn (TrainerParams attribute) save_checkpoint_fn (TrainerParams attribute) save_data() (BaseLogger method) (LazyLogger method) (TensorboardLogger method) (WandbLogger method) save_hdf5() (HERReplayBuffer method) (HERReplayBufferManager method) (ReplayBuffer method) save_log() (TraceLog method) ScaledFloatFrame (class in tianshou.env.atari.atari_wrapper) ScaledObsInputActionReprNet (class in tianshou.env.atari.atari_network) seed (ExperimentConfig attribute) seed() (BaseVectorEnv method) (DummyEnvWorker method) (EnvWorker method) (PettingZooEnv method) (RayEnvWorker method) (SubprocEnvWorker method) (VectorEnvWrapper method) seeding_info_str_static() (Experiment static method) SegmentTree (class in tianshou.data.utils.segtree) send() (DummyEnvWorker method) (EnvWorker method) (RayEnvWorker method) (SubprocEnvWorker method) SequenceSummaryStats (class in tianshou.data.stats) SEQUENTIAL (RegisteredExpLauncher attribute) SequentialExpLauncher (class in tianshou.evaluation.launcher) set_array_at_key() (Batch method) (BatchProtocol method) (ReplayBuffer method) set_batch() (HERReplayBuffer method) (HERReplayBufferManager method) (ReplayBuffer method) (ReplayBufferManager method) set_beta() (PrioritizedReplayBuffer method) (PrioritizedVectorReplayBuffer method) set_collect_time() (CollectStats method) set_collector_factory() (AlgorithmFactory method) set_env_attr() (BaseVectorEnv method) (DummyEnvWorker method) (EnvWorker method) (RayEnvWorker method) (SubprocEnvWorker method) (VectorEnvWrapper method) set_eps_inference() (DiscreteQLearningPolicy method) set_eps_training() (DiscreteQLearningPolicy method) set_exploration_noise() (ContinuousPolicyWithExplorationNoise method) set_numerical_fields_to_precision() (in module tianshou.utils.logging) set_obs_rms() (VectorEnvNormObs method) set_on_episode_done_hook() (Collector method) set_on_step_hook() (Collector method) set_persistence() (Environments method) set_policy_wrapper_factory() (AlgorithmFactory method) set_postfix() (DummyTqdm method) set_trainer_callbacks() (AlgorithmFactory method) shape (Batch property) (BatchProtocol property) ShArray (class in tianshou.env.worker.subproc) ShmemVectorEnv (class in tianshou.env.venvs) should_stop() (AtariEpochStopCallback method) (EpochStopCallback method) (EpochStopCallbackRewardThreshold method) show_progress (TrainerParams attribute) SimpleLossTrainingStats (class in tianshou.algorithm.modelfree.reinforce) smoothed_loss (TrainingStats attribute) solve_policy() (PSRLModel method) source (LaggedNetworkPair attribute) space_info (RandomActor property) SpaceInfo (class in tianshou.utils.space_info) split() (Batch method) (BatchProtocol method) stack() (Batch static method) (BatchProtocol static method) stack_() (Batch method) (BatchProtocol method) start_timesteps (TrainingConfig attribute) start_timesteps_random (TrainingConfig attribute) state (ActStateBatchProtocol attribute) (ImitationBatchProtocol attribute) state_dict() (Algorithm method) (Algorithm.Optimizer method) std (LoggedSummaryData attribute) (SequenceSummaryStats attribute) std() (MovAvg method) step() (Algorithm.Optimizer method) (BaseVectorEnv method) (EnvWorker method) (EpisodicLifeEnv method) (FrameStack method) (MaxAndSkipEnv method) (PettingZooEnv method) (TruncatedAsTerminated method) (VectorEnvNormObs method) (VectorEnvWrapper method) step_size (TRPOTrainingStats attribute) StepHook (class in tianshou.data.collector) StepHookAddActionDistribution (class in tianshou.data.collector) StepHookProtocol (class in tianshou.data.collector) stop_fn (TrainerParams attribute) subbuffer_edges (ReplayBuffer property) (ReplayBufferManager property) SUBPROC (VectorEnvType attribute) SUBPROC_SHARED_MEM_AUTO (VectorEnvType attribute) SUBPROC_SHARED_MEM_DEFAULT_CONTEXT (VectorEnvType attribute) SUBPROC_SHARED_MEM_FORK_CONTEXT (VectorEnvType attribute) SubprocEnvWorker (class in tianshou.env.worker.subproc) SubprocVectorEnv (class in tianshou.env.venvs) subset_size (REDQParams attribute) T target (LaggedNetworkPair attribute) target_mode (REDQParams attribute) target_sample_size (IQNParams attribute) target_update_freq (QLearningOffPolicyParams attribute) tau (ParamsMixinTau attribute) taus (QuantileRegressionBatchProtocol attribute) TD3 (class in tianshou.algorithm.modelfree.td3) TD3AlgorithmFactory (class in tianshou.highlevel.algorithm) TD3BC (class in tianshou.algorithm.imitation.td3_bc) TD3ExperimentBuilder (class in tianshou.highlevel.experiment) TD3Params (class in tianshou.highlevel.params.algorithm_params) TD3TrainingStats (class in tianshou.algorithm.modelfree.td3) TensorboardLogger (class in tianshou.utils.logger.tensorboard) terminated (RolloutBatchProtocol attribute) TEST (DataScope attribute) (EnvMode attribute) test_collect_stat (EpochStats attribute) test_collector (TrainerParams attribute) (World attribute) test_env_steps_E (MultiRunExperimentResult attribute) test_episode (InfoStats attribute) test_episode_returns_RE (MultiRunExperimentResult attribute) test_fn (TrainerParams attribute) test_in_training (OnlineTrainerParams attribute) (OnlineTrainingConfig attribute) test_step (InfoStats attribute) test_step_num_episodes (TrainerParams attribute) (TrainingConfig attribute) test_time (TimingStats attribute) tianshou.algorithm.algorithm_base module tianshou.algorithm.imitation.bcq module tianshou.algorithm.imitation.cql module tianshou.algorithm.imitation.discrete_bcq module tianshou.algorithm.imitation.discrete_cql module tianshou.algorithm.imitation.discrete_crr module tianshou.algorithm.imitation.gail module tianshou.algorithm.imitation.imitation_base module tianshou.algorithm.imitation.td3_bc module tianshou.algorithm.modelbased.icm module tianshou.algorithm.modelbased.psrl module tianshou.algorithm.modelfree.a2c module tianshou.algorithm.modelfree.bdqn module tianshou.algorithm.modelfree.c51 module tianshou.algorithm.modelfree.ddpg module tianshou.algorithm.modelfree.discrete_sac module tianshou.algorithm.modelfree.dqn module tianshou.algorithm.modelfree.fqf module tianshou.algorithm.modelfree.iqn module tianshou.algorithm.modelfree.npg module tianshou.algorithm.modelfree.ppo module tianshou.algorithm.modelfree.qrdqn module tianshou.algorithm.modelfree.rainbow module tianshou.algorithm.modelfree.redq module tianshou.algorithm.modelfree.reinforce module tianshou.algorithm.modelfree.sac module tianshou.algorithm.modelfree.td3 module tianshou.algorithm.modelfree.trpo module tianshou.algorithm.multiagent.marl module tianshou.algorithm.optim module tianshou.algorithm.random module tianshou.config module tianshou.data.batch module tianshou.data.buffer.buffer_base module tianshou.data.buffer.cached module tianshou.data.buffer.her module tianshou.data.buffer.manager module tianshou.data.buffer.prio module tianshou.data.buffer.vecbuf module tianshou.data.collector module tianshou.data.stats module tianshou.data.types module tianshou.data.utils.converter module tianshou.data.utils.segtree module tianshou.env.atari.atari_network module tianshou.env.atari.atari_wrapper module tianshou.env.gym_wrappers module tianshou.env.pettingzoo_env module tianshou.env.utils module tianshou.env.venv_wrappers module tianshou.env.venvs module tianshou.env.worker.dummy module tianshou.env.worker.ray module tianshou.env.worker.subproc module tianshou.env.worker.worker_base module tianshou.evaluation.launcher module tianshou.evaluation.rliable_evaluation module tianshou.exploration.random module tianshou.highlevel.algorithm module tianshou.highlevel.config module tianshou.highlevel.env module tianshou.highlevel.experiment module tianshou.highlevel.logger module tianshou.highlevel.module.actor module tianshou.highlevel.module.core module tianshou.highlevel.module.critic module tianshou.highlevel.module.intermediate module tianshou.highlevel.module.special module tianshou.highlevel.params.algorithm_params module tianshou.highlevel.params.algorithm_wrapper module tianshou.highlevel.params.alpha module tianshou.highlevel.params.collector module tianshou.highlevel.params.dist_fn module tianshou.highlevel.params.env_param module tianshou.highlevel.params.lr_scheduler module tianshou.highlevel.params.noise module tianshou.highlevel.params.optim module tianshou.highlevel.persistence module tianshou.highlevel.trainer module tianshou.highlevel.world module tianshou.trainer module tianshou.utils.conversion module tianshou.utils.determinism module tianshou.utils.lagged_network module tianshou.utils.logger.logger_base module tianshou.utils.logger.tensorboard module tianshou.utils.logger.wandb module tianshou.utils.logging module tianshou.utils.net.common module tianshou.utils.net.continuous module tianshou.utils.net.discrete module tianshou.utils.print module tianshou.utils.progress_bar module tianshou.utils.space_info module tianshou.utils.statistics module tianshou.utils.torch_utils module tianshou.utils.warning module timing (InfoStats attribute) TimingStats (class in tianshou.data.stats) to_at_least_2d() (Batch method) (BatchProtocol method) to_dict() (Batch method) (BatchProtocol method) to_evaluation_sequence() (MultiRunExperimentResult method) to_hdf5() (in module tianshou.data.utils.converter) to_list_of_dicts() (Batch method) (BatchProtocol method) to_numpy() (Batch method) (BatchProtocol method) (in module tianshou.data.utils.converter) to_numpy_() (Batch method) (BatchProtocol method) to_optional_float() (in module tianshou.utils.conversion) to_torch() (Batch method) (BatchProtocol method) (in module tianshou.data.utils.converter) to_torch_() (Batch method) (BatchProtocol method) to_torch_as() (in module tianshou.data.utils.converter) torch_device() (in module tianshou.utils.torch_utils) torch_param_hash() (in module tianshou.utils.determinism) torch_train_mode() (in module tianshou.utils.torch_utils) TorchOptimizerFactory (class in tianshou.algorithm.optim) total_time (TimingStats attribute) TraceDeterminismTest (class in tianshou.utils.determinism) TraceDeterminismTest.Result (class in tianshou.utils.determinism) TraceLog (class in tianshou.utils.determinism) TraceLogger (class in tianshou.utils.determinism) TraceLoggerContext (class in tianshou.utils.determinism) train (ExperimentConfig attribute) train() (EvalModeModuleWrapper method) train_collect_stat (EpochStats attribute) train_episode (InfoStats attribute) train_step (InfoStats attribute) train_time (TimingStats attribute) (TrainingStats attribute) train_time_collect (TimingStats attribute) train_time_update (TimingStats attribute) Trainer (class in tianshou.trainer) trainer (World attribute) trainer_result (ExperimentResult attribute) TrainerCallbacks (class in tianshou.highlevel.trainer) TrainerParams (class in tianshou.trainer) TRAINING (DataScope attribute) (EnvMode attribute) training_collector (OnlineTrainerParams attribute) (World attribute) training_config (ExperimentBuilder property) training_env_steps_E (MultiRunExperimentResult attribute) training_episode_returns_RE (MultiRunExperimentResult attribute) training_fn (TrainerParams attribute) training_stat (EpochStats attribute) TrainingConfig (class in tianshou.highlevel.config) TrainingContext (class in tianshou.highlevel.trainer) TrainingStats (class in tianshou.algorithm.algorithm_base) TrainingStatsWrapper (class in tianshou.algorithm.algorithm_base) transform() (ParamTransformer method) (ParamTransformerAutoAlpha method) (ParamTransformerChangeValue method) (ParamTransformerDrop method) (ParamTransformerOptimFactory method) (ParamTransformerRename method) TRPO (class in tianshou.algorithm.modelfree.trpo) TRPOAlgorithmFactory (class in tianshou.highlevel.algorithm) TRPOExperimentBuilder (class in tianshou.highlevel.experiment) TRPOParams (class in tianshou.highlevel.params.algorithm_params) TRPOTrainingStats (class in tianshou.algorithm.modelfree.trpo) truncated (RolloutBatchProtocol attribute) TruncatedAsTerminated (class in tianshou.env.gym_wrappers) trust_region_size (NPGParams attribute) U unfinished_index() (ReplayBuffer method) (ReplayBufferManager method) UNSUPPORTED (ContinuousActorType attribute) UPDATE (DataScope attribute) update() (Alpha method) (AutoAlpha method) (Batch method) (BatchProtocol method) (DummyTqdm method) (FixedAlpha method) (HERReplayBuffer method) (HERReplayBufferManager method) (OfflineAlgorithm method) (OffPolicyAlgorithm method) (OnPolicyAlgorithm method) (PrioritizedReplayBuffer method) (ReplayBuffer method) (ReplayBufferManager method) (RunningMeanStd method) update_actor_freq (TD3Params attribute) update_at_episode_done() (CollectStats method) update_at_step_batch() (CollectStats method) update_speed (TimingStats attribute) update_step (InfoStats attribute) update_step_num_gradient_steps_per_sample (OffPolicyTrainerParams attribute) (OffPolicyTrainingConfig attribute) update_step_num_repetitions (OnPolicyTrainerParams attribute) (OnPolicyTrainingConfig attribute) update_weight() (PrioritizedReplayBuffer method) USE_SOFTMAX_OUTPUT (ActorFactoryAtariDQN attribute) use_target_network (QLearningOffPolicyAlgorithm property) V v_s (BatchWithAdvantagesProtocol attribute) VAE (class in tianshou.utils.net.continuous) vae_loss (BCQTrainingStats attribute) value (Alpha property) (AutoAlpha property) (FixedAlpha property) value_clip (PPOParams attribute) value_iteration() (PSRLModel static method) value_mask() (Algorithm static method) VectorEnvNormObs (class in tianshou.env.venv_wrappers) VectorEnvType (class in tianshou.highlevel.env) VectorEnvWrapper (class in tianshou.env.venv_wrappers) VectorReplayBuffer (class in tianshou.data.buffer.vecbuf) verbose (JoblibConfig attribute) (TraceLogger attribute) (TrainerParams attribute) vf_coef (A2CParams attribute) vf_loss (A2CTrainingStats attribute) (NPGTrainingStats attribute) W wait() (DummyEnvWorker static method) (EnvWorker static method) (RayEnvWorker static method) (SubprocEnvWorker static method) WandbLogger (class in tianshou.utils.logger.wandb) WarpFrame (class in tianshou.env.atari.atari_wrapper) WATCH (EnvMode attribute) watch (ExperimentConfig attribute) watch_num_episodes (ExperimentConfig attribute) watch_render (ExperimentConfig attribute) weight (PrioBatchProtocol attribute) with_a2c_params() (A2CExperimentBuilder method) with_algorithm_wrapper_factory() (ExperimentBuilder method) with_autogenerated_stats() (CollectStats class method) with_collector_factory() (ExperimentBuilder method) with_ddpg_params() (DDPGExperimentBuilder method) with_dqn_params() (DQNExperimentBuilder method) with_epoch_stop_callback() (ExperimentBuilder method) with_epoch_test_callback() (ExperimentBuilder method) with_epoch_train_callback() (ExperimentBuilder method) with_iqn_params() (IQNExperimentBuilder method) with_logger_factory() (ExperimentBuilder method) with_lr_scheduler_factory() (OptimizerFactory method) with_model_factory() (DQNExperimentBuilder method) with_model_factory_default() (DQNExperimentBuilder method) with_name() (ExperimentBuilder method) with_npg_params() (NPGExperimentBuilder method) with_optim_default() (ExperimentBuilder method) with_ppo_params() (PPOExperimentBuilder method) with_preprocess_network_factory() (IQNExperimentBuilder method) with_redq_params() (REDQExperimentBuilder method) with_reinforce_params() (ReinforceExperimentBuilder method) with_sac_params() (DiscreteSACExperimentBuilder method) (SACExperimentBuilder method) with_td3_params() (TD3ExperimentBuilder method) with_trpo_params() (TRPOExperimentBuilder method) World (class in tianshou.highlevel.world) world (ExperimentResult attribute) wrap_deepmind() (in module tianshou.env.atari.atari_wrapper) wrapped_stats (TrainingStatsWrapper property) write() (BaseLogger method) (LazyLogger method) (TensorboardLogger method) (WandbLogger method)