Tianshou
v0.2.5
Tutorials
Deep Q Network
Basic concepts in Tianshou
Understand Batch
Multi-Agent RL
Train a model-free RL agent within 30s
Cheat Sheet
API Docs
tianshou.data
tianshou.env
tianshou.policy
tianshou.trainer
tianshou.exploration
tianshou.utils
Community
Contributing to Tianshou
Contributor
Tianshou
Docs
»
Index
Edit on GitHub
Index
_
|
A
|
B
|
C
|
D
|
E
|
F
|
G
|
I
|
K
|
L
|
M
|
N
|
O
|
P
|
R
|
S
|
T
|
U
|
V
_
__call__() (tianshou.exploration.BaseNoise method)
(tianshou.exploration.GaussianNoise method)
(tianshou.exploration.OUNoise method)
__getattr__() (tianshou.data.ReplayBuffer method)
(tianshou.env.BaseVectorEnv method)
(tianshou.env.RayVectorEnv method)
(tianshou.env.SubprocVectorEnv method)
(tianshou.env.VectorEnv method)
__getitem__() (tianshou.data.Batch method)
(tianshou.data.PrioritizedReplayBuffer method)
(tianshou.data.ReplayBuffer method)
__len__() (tianshou.data.Batch method)
(tianshou.data.ReplayBuffer method)
(tianshou.env.BaseVectorEnv method)
__setattr__() (tianshou.data.Batch method)
__setitem__() (tianshou.data.Batch method)
A
A2CPolicy (class in tianshou.policy)
Actor (class in tianshou.utils.net.continuous)
(class in tianshou.utils.net.discrete)
ActorProb (class in tianshou.utils.net.continuous)
add() (tianshou.data.PrioritizedReplayBuffer method)
(tianshou.data.ReplayBuffer method)
(tianshou.utils.MovAvg method)
B
BaseNoise (class in tianshou.exploration)
BasePolicy (class in tianshou.policy)
BaseVectorEnv (class in tianshou.env)
Batch (class in tianshou.data)
C
cat() (tianshou.data.Batch static method)
cat_() (tianshou.data.Batch method)
close() (tianshou.data.Collector method)
(tianshou.env.BaseVectorEnv method)
(tianshou.env.RayVectorEnv method)
(tianshou.env.SubprocVectorEnv method)
(tianshou.env.VectorEnv method)
collect() (tianshou.data.Collector method)
Collector (class in tianshou.data)
compute_episodic_return() (tianshou.policy.BasePolicy static method)
compute_nstep_return() (tianshou.policy.BasePolicy static method)
Critic (class in tianshou.utils.net.continuous)
(class in tianshou.utils.net.discrete)
D
DDPGPolicy (class in tianshou.policy)
DQN (class in tianshou.utils.net.discrete)
DQNPolicy (class in tianshou.policy)
E
empty() (tianshou.data.Batch static method)
empty_() (tianshou.data.Batch method)
F
forward() (tianshou.policy.A2CPolicy method)
(tianshou.policy.BasePolicy method)
(tianshou.policy.DDPGPolicy method)
(tianshou.policy.DQNPolicy method)
(tianshou.policy.ImitationPolicy method)
(tianshou.policy.MultiAgentPolicyManager method)
(tianshou.policy.PGPolicy method)
(tianshou.policy.PPOPolicy method)
(tianshou.policy.RandomPolicy method)
(tianshou.policy.SACPolicy method)
(tianshou.utils.net.common.Net method)
(tianshou.utils.net.common.Recurrent method)
(tianshou.utils.net.continuous.Actor method)
(tianshou.utils.net.continuous.ActorProb method)
(tianshou.utils.net.continuous.Critic method)
(tianshou.utils.net.continuous.RecurrentActorProb method)
(tianshou.utils.net.continuous.RecurrentCritic method)
(tianshou.utils.net.discrete.Actor method)
(tianshou.utils.net.discrete.Critic method)
(tianshou.utils.net.discrete.DQN method)
G
gather_info() (in module tianshou.trainer)
GaussianNoise (class in tianshou.exploration)
get() (tianshou.data.Batch method)
(tianshou.data.ReplayBuffer method)
(tianshou.utils.MovAvg method)
get_env_num() (tianshou.data.Collector method)
I
ImitationPolicy (class in tianshou.policy)
is_empty() (tianshou.data.Batch method)
items() (tianshou.data.Batch method)
K
keys() (tianshou.data.Batch method)
L
learn() (tianshou.policy.A2CPolicy method)
(tianshou.policy.BasePolicy method)
(tianshou.policy.DDPGPolicy method)
(tianshou.policy.DQNPolicy method)
(tianshou.policy.ImitationPolicy method)
(tianshou.policy.MultiAgentPolicyManager method)
(tianshou.policy.PGPolicy method)
(tianshou.policy.PPOPolicy method)
(tianshou.policy.RandomPolicy method)
(tianshou.policy.SACPolicy method)
(tianshou.policy.TD3Policy method)
ListReplayBuffer (class in tianshou.data)
M
mean() (tianshou.utils.MovAvg method)
module
tianshou.data
tianshou.env
tianshou.exploration
tianshou.policy
tianshou.trainer
tianshou.utils
tianshou.utils.net.common
tianshou.utils.net.continuous
tianshou.utils.net.discrete
MovAvg (class in tianshou.utils)
MultiAgentEnv (class in tianshou.env)
MultiAgentPolicyManager (class in tianshou.policy)
N
Net (class in tianshou.utils.net.common)
O
offpolicy_trainer() (in module tianshou.trainer)
onpolicy_trainer() (in module tianshou.trainer)
OUNoise (class in tianshou.exploration)
P
PGPolicy (class in tianshou.policy)
PPOPolicy (class in tianshou.policy)
PrioritizedReplayBuffer (class in tianshou.data)
process_fn() (tianshou.policy.A2CPolicy method)
(tianshou.policy.BasePolicy method)
(tianshou.policy.DDPGPolicy method)
(tianshou.policy.DQNPolicy method)
(tianshou.policy.MultiAgentPolicyManager method)
(tianshou.policy.PGPolicy method)
(tianshou.policy.PPOPolicy method)
R
RandomPolicy (class in tianshou.policy)
RayVectorEnv (class in tianshou.env)
Recurrent (class in tianshou.utils.net.common)
RecurrentActorProb (class in tianshou.utils.net.continuous)
RecurrentCritic (class in tianshou.utils.net.continuous)
render() (tianshou.data.Collector method)
(tianshou.env.BaseVectorEnv method)
(tianshou.env.RayVectorEnv method)
(tianshou.env.SubprocVectorEnv method)
(tianshou.env.VectorEnv method)
replace (tianshou.data.PrioritizedReplayBuffer property)
replace_policy() (tianshou.policy.MultiAgentPolicyManager method)
ReplayBuffer (class in tianshou.data)
reset() (tianshou.data.Collector method)
(tianshou.data.ListReplayBuffer method)
(tianshou.data.ReplayBuffer method)
(tianshou.env.BaseVectorEnv method)
(tianshou.env.MultiAgentEnv method)
(tianshou.env.RayVectorEnv method)
(tianshou.env.SubprocVectorEnv method)
(tianshou.env.VectorEnv method)
(tianshou.exploration.BaseNoise method)
(tianshou.exploration.OUNoise method)
reset_buffer() (tianshou.data.Collector method)
reset_env() (tianshou.data.Collector method)
S
SACPolicy (class in tianshou.policy)
sample() (tianshou.data.Collector method)
(tianshou.data.ListReplayBuffer method)
(tianshou.data.PrioritizedReplayBuffer method)
(tianshou.data.ReplayBuffer method)
seed() (tianshou.data.Collector method)
(tianshou.env.BaseVectorEnv method)
(tianshou.env.RayVectorEnv method)
(tianshou.env.SubprocVectorEnv method)
(tianshou.env.VectorEnv method)
set_agent_id() (tianshou.policy.BasePolicy method)
set_eps() (tianshou.policy.DQNPolicy method)
set_exp_noise() (tianshou.policy.DDPGPolicy method)
shape (tianshou.data.Batch property)
split() (tianshou.data.Batch method)
stack() (tianshou.data.Batch static method)
stack_() (tianshou.data.Batch method)
std() (tianshou.utils.MovAvg method)
step() (tianshou.env.BaseVectorEnv method)
(tianshou.env.MultiAgentEnv method)
(tianshou.env.RayVectorEnv method)
(tianshou.env.SubprocVectorEnv method)
(tianshou.env.VectorEnv method)
SubprocVectorEnv (class in tianshou.env)
sync_weight() (tianshou.policy.DDPGPolicy method)
(tianshou.policy.DQNPolicy method)
(tianshou.policy.SACPolicy method)
(tianshou.policy.TD3Policy method)
T
TD3Policy (class in tianshou.policy)
test_episode() (in module tianshou.trainer)
tianshou.data
module
tianshou.env
module
tianshou.exploration
module
tianshou.policy
module
tianshou.trainer
module
tianshou.utils
module
tianshou.utils.net.common
module
tianshou.utils.net.continuous
module
tianshou.utils.net.discrete
module
to_numpy() (in module tianshou.data)
(tianshou.data.Batch method)
to_torch() (in module tianshou.data)
(tianshou.data.Batch method)
to_torch_as() (in module tianshou.data)
train() (tianshou.policy.DDPGPolicy method)
(tianshou.policy.DQNPolicy method)
(tianshou.policy.SACPolicy method)
(tianshou.policy.TD3Policy method)
U
update() (tianshou.data.Batch method)
(tianshou.data.ReplayBuffer method)
update_weight() (tianshou.data.PrioritizedReplayBuffer method)
V
values() (tianshou.data.Batch method)
VectorEnv (class in tianshou.env)