Index _ | A | B | C | D | E | F | G | H | I | K | L | M | N | O | P | R | S | T | U | V | W | Z _ __init__() (imitation.algorithms.adversarial.airl.AIRL method) (imitation.algorithms.adversarial.common.AdversarialTrainer method) (imitation.algorithms.adversarial.gail.GAIL method) (imitation.algorithms.adversarial.gail.RewardNetFromDiscriminatorLogit method) (imitation.algorithms.base.BaseImitationAlgorithm method) (imitation.algorithms.base.DemonstrationAlgorithm method) (imitation.algorithms.bc.BatchIteratorWithEpochEndCallback method) (imitation.algorithms.bc.BC method) (imitation.algorithms.bc.BCLogger method) (imitation.algorithms.bc.BCTrainingMetrics method) (imitation.algorithms.bc.BehaviorCloningLossCalculator method) (imitation.algorithms.bc.RolloutStatsComputer method) (imitation.algorithms.dagger.DAggerTrainer method) (imitation.algorithms.dagger.ExponentialBetaSchedule method) (imitation.algorithms.dagger.InteractiveTrajectoryCollector method) (imitation.algorithms.dagger.LinearBetaSchedule method) (imitation.algorithms.dagger.SimpleDAggerTrainer method) (imitation.algorithms.density.DensityAlgorithm method) (imitation.algorithms.mce_irl.MCEIRL method) (imitation.algorithms.mce_irl.TabularPolicy method) (imitation.algorithms.preference_comparisons.ActiveSelectionFragmenter method) (imitation.algorithms.preference_comparisons.AgentTrainer method) (imitation.algorithms.preference_comparisons.BasicRewardTrainer method) (imitation.algorithms.preference_comparisons.CrossEntropyRewardLoss method) (imitation.algorithms.preference_comparisons.EnsembleTrainer method) (imitation.algorithms.preference_comparisons.Fragmenter method) (imitation.algorithms.preference_comparisons.PreferenceComparisons method) (imitation.algorithms.preference_comparisons.PreferenceDataset method) (imitation.algorithms.preference_comparisons.PreferenceGatherer method) (imitation.algorithms.preference_comparisons.PreferenceModel method) (imitation.algorithms.preference_comparisons.RandomFragmenter method) (imitation.algorithms.preference_comparisons.RewardTrainer method) (imitation.algorithms.preference_comparisons.SyntheticGatherer method) (imitation.algorithms.preference_comparisons.TrajectoryDataset method) (imitation.algorithms.preference_comparisons.TrajectoryGenerator method) (imitation.algorithms.sqil.SQIL method) (imitation.algorithms.sqil.SQILReplayBuffer method) (imitation.data.buffer.Buffer method) (imitation.data.buffer.ReplayBuffer method) (imitation.data.huggingface_utils.TrajectoryDatasetSequence method) (imitation.data.rollout.TrajectoryAccumulator method) (imitation.data.types.DictObs method) (imitation.data.types.Trajectory method) (imitation.data.types.TrajectoryWithRew method) (imitation.data.types.Transitions method) (imitation.data.types.TransitionsMinimal method) (imitation.data.types.TransitionsWithRew method) (imitation.data.wrappers.BufferingWrapper method) (imitation.data.wrappers.RolloutInfoWrapper method) (imitation.policies.base.FeedForward32Policy method) (imitation.policies.base.NonTrainablePolicy method) (imitation.policies.base.NormalizeFeaturesExtractor method) (imitation.policies.base.SAC1024Policy method) (imitation.policies.base.ZeroPolicy method) (imitation.policies.exploration_wrapper.ExplorationWrapper method) (imitation.policies.interactive.AtariInteractivePolicy method) (imitation.policies.interactive.DiscreteInteractivePolicy method) (imitation.policies.replay_buffer_wrapper.ReplayBufferRewardWrapper method) (imitation.policies.serialize.SavePolicyCallback method) (imitation.regularization.regularizers.LpRegularizer method) (imitation.regularization.regularizers.Regularizer method) (imitation.regularization.regularizers.RegularizerFactory method) (imitation.regularization.updaters.IntervalParamScaler method) (imitation.regularization.updaters.LambdaUpdater method) (imitation.rewards.reward_function.RewardFn method) (imitation.rewards.reward_nets.AddSTDRewardWrapper method) (imitation.rewards.reward_nets.BasicPotentialCNN method) (imitation.rewards.reward_nets.BasicPotentialMLP method) (imitation.rewards.reward_nets.BasicRewardNet method) (imitation.rewards.reward_nets.BasicShapedRewardNet method) (imitation.rewards.reward_nets.CnnRewardNet method) (imitation.rewards.reward_nets.ForwardWrapper method) (imitation.rewards.reward_nets.NormalizedRewardNet method) (imitation.rewards.reward_nets.RewardEnsemble method) (imitation.rewards.reward_nets.RewardNet method) (imitation.rewards.reward_nets.RewardNetWrapper method) (imitation.rewards.reward_nets.ShapedRewardNet method) (imitation.rewards.reward_wrapper.RewardVecEnvWrapper method) (imitation.rewards.reward_wrapper.WrappedRewardCallback method) (imitation.rewards.serialize.ValidateRewardFn method) (imitation.scripts.eval_policy.InteractiveRender method) (imitation.testing.reward_nets.MockRewardNet method) (imitation.util.logger.HierarchicalLogger method) (imitation.util.logger.WandbOutputFormat method) (imitation.util.networks.BaseNorm method) (imitation.util.networks.EMANorm method) (imitation.util.registry.Registry method) (imitation.util.video_wrapper.VideoWrapper method) A accumulate_means() (imitation.util.logger.HierarchicalLogger method) actions (imitation.algorithms.sqil.SQILReplayBuffer attribute) (imitation.policies.replay_buffer_wrapper.ReplayBufferRewardWrapper attribute) ActiveSelectionFragmenter (class in imitation.algorithms.preference_comparisons) actor (imitation.policies.base.SAC1024Policy attribute) acts (imitation.data.types.Trajectory attribute) (imitation.data.types.TransitionMapping attribute) (imitation.data.types.TransitionMappingNoNextObs attribute) (imitation.data.types.TransitionsMinimal attribute) add() (imitation.algorithms.sqil.SQILReplayBuffer method) (imitation.policies.replay_buffer_wrapper.ReplayBufferRewardWrapper method) add_accumulate_prefix() (imitation.util.logger.HierarchicalLogger method) add_key_prefix() (imitation.util.logger.HierarchicalLogger method) add_step() (imitation.data.rollout.TrajectoryAccumulator method) add_steps_and_auto_finish() (imitation.data.rollout.TrajectoryAccumulator method) AddSTDRewardWrapper (class in imitation.rewards.reward_nets) AdversarialTrainer (class in imitation.algorithms.adversarial.common) AgentTrainer (class in imitation.algorithms.preference_comparisons) AIRL (class in imitation.algorithms.adversarial.airl) airl() (in module imitation.scripts.train_adversarial) allow_variable_horizon (imitation.algorithms.adversarial.gail.GAIL attribute) (imitation.algorithms.base.BaseImitationAlgorithm attribute) (imitation.algorithms.base.DemonstrationAlgorithm attribute) (imitation.algorithms.bc.BC attribute) (imitation.algorithms.dagger.SimpleDAggerTrainer attribute) (imitation.algorithms.preference_comparisons.PreferenceComparisons attribute) analyze_imitation() (in module imitation.scripts.analyze) assert_not_dictobs() (in module imitation.data.types) AtariInteractivePolicy (class in imitation.policies.interactive) B base (imitation.rewards.reward_nets.RewardNetWrapper property) BaseImitationAlgorithm (class in imitation.algorithms.base) BaseNorm (class in imitation.util.networks) BasicPotentialCNN (class in imitation.rewards.reward_nets) BasicPotentialMLP (class in imitation.rewards.reward_nets) BasicRewardNet (class in imitation.rewards.reward_nets) BasicRewardTrainer (class in imitation.algorithms.preference_comparisons) BasicShapedRewardNet (class in imitation.rewards.reward_nets) batch_loader (imitation.algorithms.bc.BatchIteratorWithEpochEndCallback attribute) batch_size (imitation.algorithms.dagger.DAggerTrainer property) BatchIteratorWithEpochEndCallback (class in imitation.algorithms.bc) BC (class in imitation.algorithms.bc) bc() (in module imitation.scripts.train_imitation) BCLogger (class in imitation.algorithms.bc) BCTrainingMetrics (class in imitation.algorithms.bc) BehaviorCloningLossCalculator (class in imitation.algorithms.bc) BetaSchedule (class in imitation.algorithms.dagger) Buffer (class in imitation.data.buffer) buffering_wrapper (imitation.algorithms.density.DensityAlgorithm attribute) BufferingWrapper (class in imitation.data.wrappers) build_cnn() (in module imitation.util.networks) build_loader_fn_require_env() (in module imitation.util.registry) build_loader_fn_require_space() (in module imitation.util.registry) build_mlp() (in module imitation.util.networks) build_sacred_symlink() (in module imitation.util.sacred) C capacity (imitation.data.buffer.Buffer attribute) (imitation.data.buffer.ReplayBuffer attribute) clear_screen() (in module imitation.util.util) close() (imitation.util.logger.HierarchicalLogger method) (imitation.util.logger.WandbOutputFormat method) (imitation.util.video_wrapper.VideoWrapper method) cnn_transpose() (in module imitation.rewards.reward_nets) CnnRewardNet (class in imitation.rewards.reward_nets) compute_train_stats() (in module imitation.algorithms.adversarial.common) concatenate() (imitation.data.types.DictObs class method) concatenate_maybe_dictobs() (in module imitation.data.types) config (imitation.util.sacred.SacredDicts attribute) config_hook() (in module imitation.scripts.ingredients.expert) (in module imitation.scripts.ingredients.reward) (in module imitation.scripts.ingredients.rl) configure() (in module imitation.util.logger) count (imitation.util.networks.BaseNorm attribute) (imitation.util.networks.RunningNorm attribute) create() (imitation.regularization.regularizers.Regularizer class method) create_trajectory_collector() (imitation.algorithms.dagger.DAggerTrainer method) critic (imitation.policies.base.SAC1024Policy attribute) critic_target (imitation.policies.base.SAC1024Policy attribute) CrossEntropyRewardLoss (class in imitation.algorithms.preference_comparisons) current_logger (imitation.util.logger.HierarchicalLogger attribute) D dagger() (in module imitation.scripts.train_imitation) DAggerTrainer (class in imitation.algorithms.dagger) dataclass_quick_asdict() (in module imitation.data.types) dataset (imitation.data.huggingface_utils.TrajectoryDatasetSequence property) default_logger (imitation.util.logger.HierarchicalLogger attribute) DEFAULT_N_EPOCHS (imitation.algorithms.dagger.DAggerTrainer attribute) demo_state_om (imitation.algorithms.mce_irl.MCEIRL attribute) DemonstrationAlgorithm (class in imitation.algorithms.base) density_type (imitation.algorithms.density.DensityAlgorithm attribute) DensityAlgorithm (class in imitation.algorithms.density) DensityType (class in imitation.algorithms.density) device (imitation.rewards.reward_nets.RewardNet property) (imitation.rewards.reward_nets.RewardNetWrapper property) dict_get_nested() (in module imitation.util.sacred) dict_len (imitation.data.types.DictObs property) DictObs (class in imitation.data.types) dir_contains_sacred_jsons() (in module imitation.util.sacred) directory (imitation.util.video_wrapper.VideoWrapper attribute) discounted_sum() (in module imitation.data.rollout) DiscreteInteractivePolicy (class in imitation.policies.interactive) docstring_parameter() (in module imitation.util.util) dones (imitation.algorithms.sqil.SQILReplayBuffer attribute) (imitation.data.types.TransitionMapping attribute) (imitation.data.types.Transitions attribute) (imitation.policies.replay_buffer_wrapper.ReplayBufferRewardWrapper attribute) dtype (imitation.data.types.DictObs property) (imitation.rewards.reward_nets.RewardNet property) (imitation.rewards.reward_nets.RewardNetWrapper property) dump() (imitation.util.logger.HierarchicalLogger method) E EMANorm (class in imitation.util.networks) endless_iter() (in module imitation.util.util) EnsembleTrainer (class in imitation.algorithms.preference_comparisons) ent_loss (imitation.algorithms.bc.BCTrainingMetrics attribute) ent_weight (imitation.algorithms.bc.BehaviorCloningLossCalculator attribute) entropy (imitation.algorithms.bc.BCTrainingMetrics attribute) enumerate_batches() (in module imitation.algorithms.bc) envs (imitation.rewards.reward_wrapper.RewardVecEnvWrapper property) episode_id (imitation.util.video_wrapper.VideoWrapper attribute) error_on_premature_event (imitation.data.wrappers.BufferingWrapper attribute) eval_policy() (in module imitation.scripts.eval_policy) (in module imitation.scripts.ingredients.policy_evaluation) evaluate_trial() (in module imitation.scripts.tuning) evaluating() (in module imitation.util.networks) expert_buffer (imitation.algorithms.sqil.SQIL attribute) ExplorationWrapper (class in imitation.policies.exploration_wrapper) ExponentialBetaSchedule (class in imitation.algorithms.dagger) extend_and_update() (imitation.algorithms.dagger.DAggerTrainer method) F features_extractor (imitation.policies.base.FeedForward32Policy attribute) (imitation.policies.base.NonTrainablePolicy attribute) (imitation.policies.base.RandomPolicy attribute) (imitation.policies.base.ZeroPolicy attribute) (imitation.policies.interactive.AtariInteractivePolicy attribute) (imitation.policies.interactive.DiscreteInteractivePolicy attribute) (imitation.policies.interactive.ImageObsDiscreteInteractivePolicy attribute) FeedForward32Policy (class in imitation.policies.base) filter_subdirs() (in module imitation.util.sacred) find_best_trial() (in module imitation.scripts.tuning) find_sacred_runs() (in module imitation.util.sacred_file_parsing) finish_trajectory() (imitation.data.rollout.TrajectoryAccumulator method) flatten_trajectories() (in module imitation.data.rollout) flatten_trajectories_with_rew() (in module imitation.data.rollout) format_strs (imitation.util.logger.HierarchicalLogger attribute) forward() (imitation.algorithms.adversarial.gail.RewardNetFromDiscriminatorLogit method) (imitation.algorithms.mce_irl.TabularPolicy method) (imitation.algorithms.preference_comparisons.CrossEntropyRewardLoss method) (imitation.algorithms.preference_comparisons.PreferenceModel method) (imitation.algorithms.preference_comparisons.RewardLoss method) (imitation.policies.base.NonTrainablePolicy method) (imitation.policies.base.NormalizeFeaturesExtractor method) (imitation.rewards.reward_nets.BasicPotentialCNN method) (imitation.rewards.reward_nets.BasicPotentialMLP method) (imitation.rewards.reward_nets.BasicRewardNet method) (imitation.rewards.reward_nets.CnnRewardNet method) (imitation.rewards.reward_nets.PredictProcessedWrapper method) (imitation.rewards.reward_nets.RewardEnsemble method) (imitation.rewards.reward_nets.RewardNet method) (imitation.rewards.reward_nets.ShapedRewardNet method) (imitation.testing.reward_nets.MockRewardNet method) (imitation.util.networks.BaseNorm method) (imitation.util.networks.SqueezeLayer method) ForwardWrapper (class in imitation.rewards.reward_nets) Fragmenter (class in imitation.algorithms.preference_comparisons) from_data() (imitation.data.buffer.Buffer class method) (imitation.data.buffer.ReplayBuffer class method) from_obs_list() (imitation.data.types.DictObs class method) full (imitation.policies.replay_buffer_wrapper.ReplayBufferRewardWrapper property) G GAIL (class in imitation.algorithms.adversarial.gail) gail() (in module imitation.scripts.train_adversarial) gather_tb_directories() (in module imitation.scripts.analyze) generate_expert_trajectories() (in module imitation.testing.expert_trajectories) generate_trajectories() (in module imitation.data.rollout) generate_transitions() (in module imitation.data.rollout) get() (imitation.data.types.DictObs method) (imitation.util.registry.Registry method) get_accumulate_prefixes() (imitation.util.logger.HierarchicalLogger method) get_base_model() (in module imitation.algorithms.preference_comparisons) get_dir() (imitation.util.logger.HierarchicalLogger method) get_expert_policy() (in module imitation.scripts.ingredients.expert) get_expert_trajectories() (in module imitation.scripts.ingredients.demonstrations) get_first_iter_element() (in module imitation.util.util) get_num_channels_obs() (imitation.rewards.reward_nets.CnnRewardNet method) get_sacred_dir_from_run() (in module imitation.util.sacred) group_runs_by_algo_and_env() (in module imitation.util.sacred_file_parsing) gym_spaces (in module imitation.testing.hypothesis_strategies) H HierarchicalLogger (class in imitation.util.logger) hook() (in module imitation.scripts.ingredients.logging) I ImageObsDiscreteInteractivePolicy (class in imitation.policies.interactive) imitation module imitation.algorithms module imitation.algorithms.adversarial module imitation.algorithms.adversarial.airl module imitation.algorithms.adversarial.common module imitation.algorithms.adversarial.gail module imitation.algorithms.base module imitation.algorithms.bc module imitation.algorithms.dagger module imitation.algorithms.density module imitation.algorithms.mce_irl module imitation.algorithms.preference_comparisons module imitation.algorithms.sqil module imitation.data module imitation.data.buffer module imitation.data.huggingface_utils module imitation.data.rollout module imitation.data.serialize module imitation.data.types module imitation.data.wrappers module imitation.policies module imitation.policies.base module imitation.policies.exploration_wrapper module imitation.policies.interactive module imitation.policies.replay_buffer_wrapper module imitation.policies.serialize module imitation.regularization module imitation.regularization.regularizers module imitation.regularization.updaters module imitation.rewards module imitation.rewards.reward_function module imitation.rewards.reward_nets module imitation.rewards.reward_wrapper module imitation.rewards.serialize module imitation.scripts module imitation.scripts.analyze module imitation.scripts.config module imitation.scripts.config.analyze module imitation.scripts.config.eval_policy module imitation.scripts.config.parallel module imitation.scripts.config.train_adversarial module imitation.scripts.config.train_imitation module imitation.scripts.config.train_preference_comparisons module imitation.scripts.config.train_rl module imitation.scripts.config.tuning module imitation.scripts.convert_trajs module imitation.scripts.eval_policy module imitation.scripts.ingredients module imitation.scripts.ingredients.bc module imitation.scripts.ingredients.demonstrations module imitation.scripts.ingredients.environment module imitation.scripts.ingredients.expert module imitation.scripts.ingredients.logging module imitation.scripts.ingredients.policy module imitation.scripts.ingredients.policy_evaluation module imitation.scripts.ingredients.reward module imitation.scripts.ingredients.rl module imitation.scripts.ingredients.sqil module imitation.scripts.ingredients.wb module imitation.scripts.parallel module imitation.scripts.train_adversarial module imitation.scripts.train_imitation module imitation.scripts.train_preference_comparisons module imitation.scripts.train_rl module imitation.scripts.tuning module imitation.testing module imitation.testing.expert_trajectories module imitation.testing.hypothesis_strategies module imitation.testing.reward_improvement module imitation.testing.reward_nets module imitation.util module imitation.util.logger module imitation.util.networks module imitation.util.registry module imitation.util.sacred module imitation.util.sacred_file_parsing module imitation.util.util module imitation.util.video_wrapper module info_dict_contents (in module imitation.testing.hypothesis_strategies) infos (imitation.data.types.Trajectory attribute) (imitation.data.types.TransitionsMinimal attribute) InteractiveRender (class in imitation.scripts.eval_policy) InteractiveTrajectoryCollector (class in imitation.algorithms.dagger) IntervalParamScaler (class in imitation.regularization.updaters) inv_learning_rate (imitation.util.networks.EMANorm attribute) is_significant_reward_improvement() (in module imitation.testing.reward_improvement) is_stationary (imitation.algorithms.density.DensityAlgorithm attribute) items() (imitation.data.types.DictObs method) K kernel (imitation.algorithms.density.DensityAlgorithm attribute) kernel_bandwidth (imitation.algorithms.density.DensityAlgorithm attribute) keys() (imitation.data.types.DictObs method) (imitation.util.registry.Registry method) L l2_loss (imitation.algorithms.bc.BCTrainingMetrics attribute) l2_norm (imitation.algorithms.bc.BCTrainingMetrics attribute) l2_weight (imitation.algorithms.bc.BehaviorCloningLossCalculator attribute) lambda_ (imitation.regularization.regularizers.LossRegularizer attribute) (imitation.regularization.regularizers.Regularizer attribute) (imitation.regularization.regularizers.WeightDecayRegularizer attribute) (imitation.regularization.regularizers.WeightRegularizer attribute) lambda_updater (imitation.regularization.regularizers.LossRegularizer attribute) (imitation.regularization.regularizers.Regularizer attribute) (imitation.regularization.regularizers.WeightDecayRegularizer attribute) (imitation.regularization.regularizers.WeightRegularizer attribute) LambdaUpdater (class in imitation.regularization.updaters) lazy_generate_expert_trajectories() (in module imitation.testing.expert_trajectories) LinearBetaSchedule (class in imitation.algorithms.dagger) load() (imitation.algorithms.preference_comparisons.PreferenceDataset static method) (in module imitation.data.serialize) load_attr() (in module imitation.util.registry) load_from_dir() (imitation.util.sacred.SacredDicts class method) load_policy() (in module imitation.policies.serialize) load_reward() (in module imitation.rewards.serialize) load_rl_algo_from_path() (in module imitation.scripts.ingredients.rl) load_stable_baselines_model() (in module imitation.policies.serialize) load_with_rewards() (in module imitation.data.serialize) load_zero() (in module imitation.rewards.serialize) LoaderFn (in module imitation.util.registry) log() (imitation.util.logger.HierarchicalLogger method) log_batch() (imitation.algorithms.bc.BCLogger method) log_epoch() (imitation.algorithms.bc.BCLogger method) logger (imitation.algorithms.base.BaseImitationAlgorithm property) (imitation.algorithms.dagger.DAggerTrainer property) (imitation.algorithms.preference_comparisons.AgentTrainer property) (imitation.algorithms.preference_comparisons.EnsembleTrainer property) (imitation.algorithms.preference_comparisons.RewardTrainer property) (imitation.algorithms.preference_comparisons.TrajectoryGenerator property) (imitation.regularization.regularizers.LossRegularizer attribute) (imitation.regularization.regularizers.Regularizer attribute) (imitation.regularization.regularizers.WeightDecayRegularizer attribute) (imitation.regularization.regularizers.WeightRegularizer attribute) logits_expert_is_high() (imitation.algorithms.adversarial.airl.AIRL method) (imitation.algorithms.adversarial.common.AdversarialTrainer method) (imitation.algorithms.adversarial.gail.GAIL method) loss (imitation.algorithms.bc.BCTrainingMetrics attribute) (imitation.algorithms.preference_comparisons.LossAndMetrics attribute) LossAndMetrics (class in imitation.algorithms.preference_comparisons) LossRegularizer (class in imitation.regularization.regularizers) LpRegularizer (class in imitation.regularization.regularizers) M main() (in module imitation.scripts.convert_trajs) main_console() (in module imitation.scripts.analyze) (in module imitation.scripts.eval_policy) (in module imitation.scripts.parallel) (in module imitation.scripts.train_adversarial) (in module imitation.scripts.train_imitation) (in module imitation.scripts.train_preference_comparisons) (in module imitation.scripts.train_rl) (in module imitation.scripts.tuning) make_bc() (in module imitation.scripts.ingredients.bc) make_data_loader() (in module imitation.algorithms.base) make_ensemble() (in module imitation.testing.reward_nets) make_expert_transition_loader() (in module imitation.testing.expert_trajectories) make_log_callback() (imitation.rewards.reward_wrapper.RewardVecEnvWrapper method) make_log_dir() (in module imitation.scripts.ingredients.logging) make_min_episodes() (in module imitation.data.rollout) make_min_timesteps() (in module imitation.data.rollout) make_or_load_policy() (in module imitation.scripts.ingredients.bc) make_output_format() (in module imitation.util.logger) make_policy() (in module imitation.scripts.ingredients.policy) make_reward_net() (in module imitation.scripts.ingredients.reward) make_rl_algo() (in module imitation.scripts.ingredients.rl) make_rollout_venv() (in module imitation.scripts.ingredients.environment) make_sample_until() (in module imitation.data.rollout) make_seeds() (in module imitation.util.util) make_unique_timestamp() (in module imitation.util.util) make_vec_env() (in module imitation.util.util) make_venv() (in module imitation.scripts.ingredients.environment) map_arrays() (imitation.data.types.DictObs method) map_maybe_dict() (in module imitation.data.types) maybe_unwrap_dictobs() (in module imitation.data.types) maybe_wrap_in_dictobs() (in module imitation.data.types) mce_occupancy_measures() (in module imitation.algorithms.mce_irl) mce_partition_fh() (in module imitation.algorithms.mce_irl) MCEIRL (class in imitation.algorithms.mce_irl) mean_reward_improved_by() (in module imitation.testing.reward_improvement) members (imitation.rewards.reward_nets.RewardEnsemble attribute) metrics (imitation.algorithms.preference_comparisons.LossAndMetrics attribute) MockRewardNet (class in imitation.testing.reward_nets) model (imitation.policies.serialize.SavePolicyCallback attribute) (imitation.rewards.reward_wrapper.WrappedRewardCallback attribute) module imitation imitation.algorithms imitation.algorithms.adversarial imitation.algorithms.adversarial.airl imitation.algorithms.adversarial.common imitation.algorithms.adversarial.gail imitation.algorithms.base imitation.algorithms.bc imitation.algorithms.dagger imitation.algorithms.density imitation.algorithms.mce_irl imitation.algorithms.preference_comparisons imitation.algorithms.sqil imitation.data imitation.data.buffer imitation.data.huggingface_utils imitation.data.rollout imitation.data.serialize imitation.data.types imitation.data.wrappers imitation.policies imitation.policies.base imitation.policies.exploration_wrapper imitation.policies.interactive imitation.policies.replay_buffer_wrapper imitation.policies.serialize imitation.regularization imitation.regularization.regularizers imitation.regularization.updaters imitation.rewards imitation.rewards.reward_function imitation.rewards.reward_nets imitation.rewards.reward_wrapper imitation.rewards.serialize imitation.scripts imitation.scripts.analyze imitation.scripts.config imitation.scripts.config.analyze imitation.scripts.config.eval_policy imitation.scripts.config.parallel imitation.scripts.config.train_adversarial imitation.scripts.config.train_imitation imitation.scripts.config.train_preference_comparisons imitation.scripts.config.train_rl imitation.scripts.config.tuning imitation.scripts.convert_trajs imitation.scripts.eval_policy imitation.scripts.ingredients imitation.scripts.ingredients.bc imitation.scripts.ingredients.demonstrations imitation.scripts.ingredients.environment imitation.scripts.ingredients.expert imitation.scripts.ingredients.logging imitation.scripts.ingredients.policy imitation.scripts.ingredients.policy_evaluation imitation.scripts.ingredients.reward imitation.scripts.ingredients.rl imitation.scripts.ingredients.sqil imitation.scripts.ingredients.wb imitation.scripts.parallel imitation.scripts.train_adversarial imitation.scripts.train_imitation imitation.scripts.train_preference_comparisons imitation.scripts.train_rl imitation.scripts.tuning imitation.testing imitation.testing.expert_trajectories imitation.testing.hypothesis_strategies imitation.testing.reward_improvement imitation.testing.reward_nets imitation.util imitation.util.logger imitation.util.networks imitation.util.registry imitation.util.sacred imitation.util.sacred_file_parsing imitation.util.util imitation.util.video_wrapper N n_batches (imitation.algorithms.bc.BatchIteratorWithEpochEndCallback attribute) n_episodes (imitation.algorithms.bc.RolloutStatsComputer attribute) n_epochs (imitation.algorithms.bc.BatchIteratorWithEpochEndCallback attribute) n_transitions (imitation.data.wrappers.BufferingWrapper attribute) NeedsDemosException neglogp (imitation.algorithms.bc.BCTrainingMetrics attribute) next_obs (imitation.data.types.TransitionMapping attribute) (imitation.data.types.Transitions attribute) next_observations (imitation.algorithms.sqil.SQILReplayBuffer attribute) (imitation.policies.replay_buffer_wrapper.ReplayBufferRewardWrapper attribute) NonTrainablePolicy (class in imitation.policies.base) NormalizedRewardNet (class in imitation.rewards.reward_nets) NormalizeFeaturesExtractor (class in imitation.policies.base) num_batches (imitation.util.networks.EMANorm attribute) num_members (imitation.rewards.reward_nets.RewardEnsemble property) num_samples() (in module imitation.data.buffer) O obs (imitation.data.types.Trajectory attribute) (imitation.data.types.TransitionMapping attribute) (imitation.data.types.TransitionMappingNoNextObs attribute) (imitation.data.types.TransitionsMinimal attribute) observations (imitation.algorithms.sqil.SQILReplayBuffer attribute) (imitation.policies.replay_buffer_wrapper.ReplayBufferRewardWrapper attribute) on_epoch_end (imitation.algorithms.bc.BatchIteratorWithEpochEndCallback attribute) optimizer (imitation.policies.base.RandomPolicy attribute) (imitation.policies.base.ZeroPolicy attribute) (imitation.policies.interactive.AtariInteractivePolicy attribute) (imitation.policies.interactive.DiscreteInteractivePolicy attribute) (imitation.policies.interactive.ImageObsDiscreteInteractivePolicy attribute) (imitation.regularization.regularizers.LossRegularizer attribute) (imitation.regularization.regularizers.Regularizer attribute) (imitation.regularization.regularizers.WeightDecayRegularizer attribute) (imitation.regularization.regularizers.WeightRegularizer attribute) oric() (in module imitation.util.util) override_policy_cls() (in module imitation.scripts.ingredients.sqil) override_rl_cls() (in module imitation.scripts.ingredients.sqil) P p (imitation.regularization.regularizers.LpRegularizer attribute) parallel() (in module imitation.scripts.parallel) parse_optional_path() (in module imitation.util.util) parse_path() (in module imitation.util.util) pi (imitation.algorithms.mce_irl.TabularPolicy attribute) policy (imitation.algorithms.adversarial.common.AdversarialTrainer property) (imitation.algorithms.base.DemonstrationAlgorithm property) (imitation.algorithms.bc.BC property) (imitation.algorithms.dagger.DAggerTrainer property) (imitation.algorithms.density.DensityAlgorithm property) (imitation.algorithms.mce_irl.MCEIRL property) (imitation.algorithms.sqil.SQIL property) policy_registry (in module imitation.policies.serialize) policy_to_callable() (in module imitation.data.rollout) PolicyLoaderFn (in module imitation.policies.serialize) pop_finished_trajectories() (imitation.data.wrappers.BufferingWrapper method) pop_trajectories() (imitation.data.wrappers.BufferingWrapper method) pop_transitions() (imitation.data.wrappers.BufferingWrapper method) pos (imitation.policies.replay_buffer_wrapper.ReplayBufferRewardWrapper property) predict() (imitation.algorithms.mce_irl.TabularPolicy method) (imitation.rewards.reward_nets.PredictProcessedWrapper method) (imitation.rewards.reward_nets.RewardEnsemble method) (imitation.rewards.reward_nets.RewardNet method) predict_processed() (imitation.rewards.reward_nets.AddSTDRewardWrapper method) (imitation.rewards.reward_nets.NormalizedRewardNet method) (imitation.rewards.reward_nets.PredictProcessedWrapper method) (imitation.rewards.reward_nets.RewardEnsemble method) (imitation.rewards.reward_nets.RewardNet method) predict_processed_all() (imitation.rewards.reward_nets.RewardEnsemble method) predict_reward_moments() (imitation.rewards.reward_nets.RewardEnsemble method) (imitation.rewards.reward_nets.RewardNetWithVariance method) predict_th() (imitation.rewards.reward_nets.PredictProcessedWrapper method) (imitation.rewards.reward_nets.RewardNet method) PredictProcessedWrapper (class in imitation.rewards.reward_nets) preference_collate_fn() (in module imitation.algorithms.preference_comparisons) PreferenceComparisons (class in imitation.algorithms.preference_comparisons) PreferenceDataset (class in imitation.algorithms.preference_comparisons) PreferenceGatherer (class in imitation.algorithms.preference_comparisons) PreferenceModel (class in imitation.algorithms.preference_comparisons) preprocess() (imitation.rewards.reward_nets.RewardNet method) (imitation.rewards.reward_nets.RewardNetWrapper method) prob_true_act (imitation.algorithms.bc.BCTrainingMetrics attribute) probability() (imitation.algorithms.preference_comparisons.PreferenceModel method) push() (imitation.algorithms.preference_comparisons.PreferenceDataset method) R raise_uncertainty_on_not_supported() (imitation.algorithms.preference_comparisons.ActiveSelectionFragmenter method) RandomFragmenter (class in imitation.algorithms.preference_comparisons) RandomPolicy (class in imitation.policies.base) reconstruct_policy() (in module imitation.algorithms.bc) reconstruct_trainer() (in module imitation.algorithms.dagger) record() (imitation.util.logger.HierarchicalLogger method) record_mean() (imitation.util.logger.HierarchicalLogger method) register() (imitation.util.registry.Registry method) Registry (class in imitation.util.registry) regularize_and_backward() (imitation.regularization.regularizers.LossRegularizer method) (imitation.regularization.regularizers.Regularizer method) (imitation.regularization.regularizers.WeightRegularizer method) Regularizer (class in imitation.regularization.regularizers) regularizer (imitation.algorithms.preference_comparisons.BasicRewardTrainer attribute) (imitation.algorithms.preference_comparisons.EnsembleTrainer attribute) RegularizerFactory (class in imitation.regularization.regularizers) ReplayBuffer (class in imitation.data.buffer) ReplayBufferRewardWrapper (class in imitation.policies.replay_buffer_wrapper) requires_regularizer_update (imitation.algorithms.preference_comparisons.BasicRewardTrainer property) reset() (imitation.algorithms.dagger.InteractiveTrajectoryCollector method) (imitation.data.wrappers.BufferingWrapper method) (imitation.data.wrappers.RolloutInfoWrapper method) (imitation.rewards.reward_wrapper.RewardVecEnvWrapper method) (imitation.scripts.eval_policy.InteractiveRender method) (imitation.util.video_wrapper.VideoWrapper method) reset_running_stats() (imitation.util.networks.BaseNorm method) (imitation.util.networks.EMANorm method) reset_tensorboard_steps() (imitation.algorithms.bc.BCLogger method) rew (imitation.data.types.TransitionMapping attribute) reward_test (imitation.algorithms.adversarial.airl.AIRL property) (imitation.algorithms.adversarial.common.AdversarialTrainer property) (imitation.algorithms.adversarial.gail.GAIL property) reward_train (imitation.algorithms.adversarial.airl.AIRL property) (imitation.algorithms.adversarial.common.AdversarialTrainer property) (imitation.algorithms.adversarial.gail.GAIL property) RewardEnsemble (class in imitation.rewards.reward_nets) RewardFn (class in imitation.rewards.reward_function) RewardLoss (class in imitation.algorithms.preference_comparisons) RewardNet (class in imitation.rewards.reward_nets) RewardNetFromDiscriminatorLogit (class in imitation.algorithms.adversarial.gail) RewardNetWithVariance (class in imitation.rewards.reward_nets) RewardNetWrapper (class in imitation.rewards.reward_nets) rewards (imitation.algorithms.sqil.SQILReplayBuffer attribute) (imitation.policies.replay_buffer_wrapper.ReplayBufferRewardWrapper attribute) rewards() (imitation.algorithms.preference_comparisons.PreferenceModel method) RewardTrainer (class in imitation.algorithms.preference_comparisons) RewardVecEnvWrapper (class in imitation.rewards.reward_wrapper) rews (imitation.data.types.TrajectoryWithRew attribute) (imitation.data.types.TransitionsWithRew attribute) rl_algo (imitation.algorithms.density.DensityAlgorithm attribute) rng (imitation.algorithms.mce_irl.TabularPolicy attribute) rollout() (in module imitation.data.rollout) rollout_stats() (in module imitation.data.rollout) RolloutInfoWrapper (class in imitation.data.wrappers) RolloutStatsComputer (class in imitation.algorithms.bc) run (imitation.util.sacred.SacredDicts attribute) running_mean (imitation.util.networks.BaseNorm attribute) (imitation.util.networks.RunningNorm attribute) running_var (imitation.util.networks.BaseNorm attribute) (imitation.util.networks.RunningNorm attribute) RunningNorm (class in imitation.util.networks) S SAC1024Policy (class in imitation.policies.base) sacred_dir (imitation.util.sacred.SacredDicts attribute) SacredDicts (class in imitation.util.sacred) safe_to_numpy() (in module imitation.util.util) safe_to_tensor() (in module imitation.util.util) sample() (imitation.algorithms.preference_comparisons.AgentTrainer method) (imitation.algorithms.preference_comparisons.TrajectoryDataset method) (imitation.algorithms.preference_comparisons.TrajectoryGenerator method) (imitation.algorithms.sqil.SQILReplayBuffer method) (imitation.data.buffer.Buffer method) (imitation.data.buffer.ReplayBuffer method) (imitation.policies.replay_buffer_wrapper.ReplayBufferRewardWrapper method) sample_shapes (imitation.data.buffer.Buffer attribute) save() (imitation.algorithms.preference_comparisons.PreferenceDataset method) (in module imitation.data.serialize) (in module imitation.scripts.train_adversarial) save_checkpoint() (in module imitation.scripts.train_preference_comparisons) save_model() (in module imitation.scripts.train_preference_comparisons) save_policy() (in module imitation.util.util) save_stable_model() (in module imitation.policies.serialize) save_trainer() (imitation.algorithms.dagger.DAggerTrainer method) SavePolicyCallback (class in imitation.policies.serialize) seed() (imitation.algorithms.dagger.InteractiveTrajectoryCollector method) set_demonstrations() (imitation.algorithms.adversarial.common.AdversarialTrainer method) (imitation.algorithms.base.DemonstrationAlgorithm method) (imitation.algorithms.bc.BC method) (imitation.algorithms.density.DensityAlgorithm method) (imitation.algorithms.mce_irl.MCEIRL method) (imitation.algorithms.sqil.SQIL method) (imitation.algorithms.sqil.SQILReplayBuffer method) set_level() (imitation.util.logger.HierarchicalLogger method) set_pi() (imitation.algorithms.mce_irl.TabularPolicy method) setup_logging() (in module imitation.scripts.ingredients.logging) shape (imitation.data.types.DictObs property) ShapedRewardNet (class in imitation.rewards.reward_nets) SimpleDAggerTrainer (class in imitation.algorithms.dagger) single_video (imitation.util.video_wrapper.VideoWrapper attribute) size() (imitation.data.buffer.Buffer method) (imitation.data.buffer.ReplayBuffer method) split_in_half() (in module imitation.util.util) SQIL (class in imitation.algorithms.sqil) sqil() (in module imitation.scripts.train_imitation) SQILReplayBuffer (class in imitation.algorithms.sqil) squeeze_r() (in module imitation.algorithms.mce_irl) SqueezeLayer (class in imitation.util.networks) stack() (imitation.data.types.DictObs class method) stack_maybe_dictobs() (in module imitation.data.types) standardise (imitation.algorithms.density.DensityAlgorithm attribute) STATE_ACTION_DENSITY (imitation.algorithms.density.DensityType attribute) STATE_DENSITY (imitation.algorithms.density.DensityType attribute) STATE_STATE_DENSITY (imitation.algorithms.density.DensityType attribute) step() (imitation.data.wrappers.RolloutInfoWrapper method) (imitation.util.video_wrapper.VideoWrapper method) step_async() (imitation.algorithms.dagger.InteractiveTrajectoryCollector method) (imitation.data.wrappers.BufferingWrapper method) (imitation.rewards.reward_wrapper.RewardVecEnvWrapper method) step_wait() (imitation.algorithms.dagger.InteractiveTrajectoryCollector method) (imitation.data.wrappers.BufferingWrapper method) (imitation.rewards.reward_wrapper.RewardVecEnvWrapper method) (imitation.scripts.eval_policy.InteractiveRender method) store() (imitation.data.buffer.Buffer method) (imitation.data.buffer.ReplayBuffer method) SyntheticGatherer (class in imitation.algorithms.preference_comparisons) T TabularPolicy (class in imitation.algorithms.mce_irl) tensor_iter_norm() (in module imitation.util.util) terminal (imitation.data.types.Trajectory attribute) test_policy() (imitation.algorithms.density.DensityAlgorithm method) timeouts (imitation.algorithms.sqil.SQILReplayBuffer attribute) (imitation.policies.replay_buffer_wrapper.ReplayBufferRewardWrapper attribute) train() (imitation.algorithms.adversarial.common.AdversarialTrainer method) (imitation.algorithms.bc.BC method) (imitation.algorithms.dagger.SimpleDAggerTrainer method) (imitation.algorithms.density.DensityAlgorithm method) (imitation.algorithms.mce_irl.MCEIRL method) (imitation.algorithms.preference_comparisons.AgentTrainer method) (imitation.algorithms.preference_comparisons.PreferenceComparisons method) (imitation.algorithms.preference_comparisons.RewardTrainer method) (imitation.algorithms.preference_comparisons.TrajectoryGenerator method) (imitation.algorithms.sqil.SQIL method) train_adversarial() (in module imitation.scripts.train_adversarial) train_disc() (imitation.algorithms.adversarial.common.AdversarialTrainer method) train_gen() (imitation.algorithms.adversarial.common.AdversarialTrainer method) train_policy() (imitation.algorithms.density.DensityAlgorithm method) train_preference_comparisons() (in module imitation.scripts.train_preference_comparisons) train_rl() (in module imitation.scripts.train_rl) training (imitation.algorithms.adversarial.gail.RewardNetFromDiscriminatorLogit attribute) (imitation.algorithms.preference_comparisons.CrossEntropyRewardLoss attribute) (imitation.algorithms.preference_comparisons.PreferenceModel attribute) (imitation.algorithms.preference_comparisons.RewardLoss attribute) (imitation.policies.base.NormalizeFeaturesExtractor attribute) (imitation.policies.base.RandomPolicy attribute) (imitation.policies.base.ZeroPolicy attribute) (imitation.policies.interactive.AtariInteractivePolicy attribute) (imitation.policies.interactive.DiscreteInteractivePolicy attribute) (imitation.policies.interactive.ImageObsDiscreteInteractivePolicy attribute) (imitation.rewards.reward_nets.BasicPotentialCNN attribute) (imitation.rewards.reward_nets.BasicPotentialMLP attribute) (imitation.rewards.reward_nets.BasicRewardNet attribute) (imitation.rewards.reward_nets.BasicShapedRewardNet attribute) (imitation.rewards.reward_nets.CnnRewardNet attribute) (imitation.rewards.reward_nets.ForwardWrapper attribute) (imitation.rewards.reward_nets.NormalizedRewardNet attribute) (imitation.rewards.reward_nets.PredictProcessedWrapper attribute) (imitation.rewards.reward_nets.RewardNet attribute) (imitation.rewards.reward_nets.RewardNetWithVariance attribute) (imitation.rewards.reward_nets.RewardNetWrapper attribute) (imitation.rewards.reward_nets.ShapedRewardNet attribute) (imitation.testing.reward_nets.MockRewardNet attribute) (imitation.util.networks.RunningNorm attribute) (imitation.util.networks.SqueezeLayer attribute) training() (in module imitation.util.networks) training_mode() (in module imitation.util.networks) traj_accum (imitation.algorithms.dagger.InteractiveTrajectoryCollector attribute) trajectories_list (in module imitation.testing.hypothesis_strategies) trajectories_to_dataset() (in module imitation.data.huggingface_utils) trajectories_to_dict() (in module imitation.data.huggingface_utils) trajectories_with_reward_list (in module imitation.testing.hypothesis_strategies) trajectories_without_reward_list (in module imitation.testing.hypothesis_strategies) Trajectory (class in imitation.data.types) trajectory (in module imitation.testing.hypothesis_strategies) trajectory_length (in module imitation.testing.hypothesis_strategies) TrajectoryAccumulator (class in imitation.data.rollout) TrajectoryDataset (class in imitation.algorithms.preference_comparisons) TrajectoryDatasetSequence (class in imitation.data.huggingface_utils) TrajectoryGenerator (class in imitation.algorithms.preference_comparisons) TrajectoryWithRew (class in imitation.data.types) TransitionMapping (class in imitation.data.types) TransitionMappingNoNextObs (class in imitation.data.types) Transitions (class in imitation.data.types) transitions (imitation.algorithms.density.DensityAlgorithm attribute) transitions_collate_fn() (in module imitation.data.types) TransitionsMinimal (class in imitation.data.types) TransitionsWithRew (class in imitation.data.types) tune() (in module imitation.scripts.tuning) U uncertainty_on (imitation.algorithms.preference_comparisons.ActiveSelectionFragmenter property) unwrap() (imitation.data.types.DictObs method) unwrap_traj() (in module imitation.data.rollout) update_params() (imitation.regularization.regularizers.Regularizer method) update_stats() (imitation.util.networks.BaseNorm method) (imitation.util.networks.EMANorm method) (imitation.util.networks.RunningNorm method) update_traj_file_in_place() (in module imitation.scripts.convert_trajs) V val_split (imitation.regularization.regularizers.LossRegularizer attribute) (imitation.regularization.regularizers.Regularizer attribute) (imitation.regularization.regularizers.WeightDecayRegularizer attribute) (imitation.regularization.regularizers.WeightRegularizer attribute) ValidateRewardFn (class in imitation.rewards.serialize) values() (imitation.data.types.DictObs method) variance_estimate() (imitation.algorithms.preference_comparisons.ActiveSelectionFragmenter method) venv (imitation.algorithms.adversarial.airl.AIRL attribute) (imitation.algorithms.adversarial.common.AdversarialTrainer attribute) (imitation.algorithms.adversarial.gail.GAIL attribute) (imitation.algorithms.bc.RolloutStatsComputer attribute) (imitation.algorithms.density.DensityAlgorithm attribute) venv_train (imitation.algorithms.adversarial.airl.AIRL attribute) (imitation.algorithms.adversarial.common.AdversarialTrainer attribute) (imitation.algorithms.adversarial.gail.GAIL attribute) venv_wrapped (imitation.algorithms.adversarial.airl.AIRL attribute) (imitation.algorithms.adversarial.common.AdversarialTrainer attribute) (imitation.algorithms.adversarial.gail.GAIL attribute) (imitation.algorithms.density.DensityAlgorithm attribute) video_recorder (imitation.util.video_wrapper.VideoWrapper attribute) video_wrapper_factory() (in module imitation.scripts.eval_policy) VideoWrapper (class in imitation.util.video_wrapper) W wandb_init() (in module imitation.scripts.ingredients.wb) WandbOutputFormat (class in imitation.util.logger) WeightDecayRegularizer (class in imitation.regularization.regularizers) WeightRegularizer (class in imitation.regularization.regularizers) WrappedRewardCallback (class in imitation.rewards.reward_wrapper) wrapper_callback (imitation.algorithms.density.DensityAlgorithm attribute) write() (imitation.util.logger.WandbOutputFormat method) Z ZeroPolicy (class in imitation.policies.base)