Tianshou
v0.2.3
Tutorials
Deep Q Network
Basic concepts in Tianshou
Train a model-free RL agent within 30s
Cheat Sheet
API Docs
tianshou.data
tianshou.env
tianshou.policy
tianshou.trainer
tianshou.exploration
tianshou.utils
Community
Contributing to Tianshou
Contributor
Tianshou
Docs
»
Index
Edit on GitHub
Index
_
|
A
|
B
|
C
|
D
|
E
|
F
|
G
|
I
|
K
|
L
|
M
|
O
|
P
|
R
|
S
|
T
|
U
|
V
_
__call__() (tianshou.exploration.OUNoise method)
__getitem__() (tianshou.data.Batch method)
(tianshou.data.PrioritizedReplayBuffer method)
(tianshou.data.ReplayBuffer method)
__len__() (tianshou.data.Batch method)
(tianshou.data.ReplayBuffer method)
(tianshou.env.BaseVectorEnv method)
A
A2CPolicy (class in tianshou.policy)
add() (tianshou.data.PrioritizedReplayBuffer method)
(tianshou.data.ReplayBuffer method)
(tianshou.utils.MovAvg method)
append() (tianshou.data.Batch method)
B
BasePolicy (class in tianshou.policy)
BaseVectorEnv (class in tianshou.env)
Batch (class in tianshou.data)
C
close() (tianshou.data.Collector method)
(tianshou.env.BaseVectorEnv method)
(tianshou.env.RayVectorEnv method)
(tianshou.env.SubprocVectorEnv method)
(tianshou.env.VectorEnv method)
collect() (tianshou.data.Collector method)
Collector (class in tianshou.data)
compute_episodic_return() (tianshou.policy.BasePolicy static method)
D
DDPGPolicy (class in tianshou.policy)
DQNPolicy (class in tianshou.policy)
E
eval() (tianshou.policy.DDPGPolicy method)
(tianshou.policy.DQNPolicy method)
(tianshou.policy.SACPolicy method)
(tianshou.policy.TD3Policy method)
F
forward() (tianshou.policy.A2CPolicy method)
(tianshou.policy.BasePolicy method)
(tianshou.policy.DDPGPolicy method)
(tianshou.policy.DQNPolicy method)
(tianshou.policy.ImitationPolicy method)
(tianshou.policy.PGPolicy method)
(tianshou.policy.PPOPolicy method)
(tianshou.policy.SACPolicy method)
G
gather_info() (in module tianshou.trainer)
get() (tianshou.data.Batch method)
(tianshou.data.ReplayBuffer method)
(tianshou.utils.MovAvg method)
get_env_num() (tianshou.data.Collector method)
I
ImitationPolicy (class in tianshou.policy)
K
keys() (tianshou.data.Batch method)
L
learn() (tianshou.policy.A2CPolicy method)
(tianshou.policy.BasePolicy method)
(tianshou.policy.DDPGPolicy method)
(tianshou.policy.DQNPolicy method)
(tianshou.policy.ImitationPolicy method)
(tianshou.policy.PGPolicy method)
(tianshou.policy.PPOPolicy method)
(tianshou.policy.SACPolicy method)
(tianshou.policy.TD3Policy method)
ListReplayBuffer (class in tianshou.data)
M
mean() (tianshou.utils.MovAvg method)
module
tianshou.data
tianshou.env
tianshou.exploration
tianshou.policy
tianshou.trainer
tianshou.utils
MovAvg (class in tianshou.utils)
O
offpolicy_trainer() (in module tianshou.trainer)
onpolicy_trainer() (in module tianshou.trainer)
OUNoise (class in tianshou.exploration)
P
PGPolicy (class in tianshou.policy)
PPOPolicy (class in tianshou.policy)
PrioritizedReplayBuffer (class in tianshou.data)
process_fn() (tianshou.policy.A2CPolicy method)
(tianshou.policy.BasePolicy method)
(tianshou.policy.DDPGPolicy method)
(tianshou.policy.DQNPolicy method)
(tianshou.policy.PGPolicy method)
(tianshou.policy.PPOPolicy method)
R
RayVectorEnv (class in tianshou.env)
render() (tianshou.data.Collector method)
(tianshou.env.BaseVectorEnv method)
(tianshou.env.RayVectorEnv method)
(tianshou.env.SubprocVectorEnv method)
(tianshou.env.VectorEnv method)
ReplayBuffer (class in tianshou.data)
reset() (tianshou.data.Collector method)
(tianshou.data.ListReplayBuffer method)
(tianshou.data.PrioritizedReplayBuffer method)
(tianshou.data.ReplayBuffer method)
(tianshou.env.BaseVectorEnv method)
(tianshou.env.RayVectorEnv method)
(tianshou.env.SubprocVectorEnv method)
(tianshou.env.VectorEnv method)
(tianshou.exploration.OUNoise method)
reset_buffer() (tianshou.data.Collector method)
reset_env() (tianshou.data.Collector method)
S
SACPolicy (class in tianshou.policy)
sample() (tianshou.data.Collector method)
(tianshou.data.PrioritizedReplayBuffer method)
(tianshou.data.ReplayBuffer method)
seed() (tianshou.data.Collector method)
(tianshou.env.BaseVectorEnv method)
(tianshou.env.RayVectorEnv method)
(tianshou.env.SubprocVectorEnv method)
(tianshou.env.VectorEnv method)
set_eps() (tianshou.policy.DDPGPolicy method)
(tianshou.policy.DQNPolicy method)
split() (tianshou.data.Batch method)
std() (tianshou.utils.MovAvg method)
step() (tianshou.env.BaseVectorEnv method)
(tianshou.env.RayVectorEnv method)
(tianshou.env.SubprocVectorEnv method)
(tianshou.env.VectorEnv method)
SubprocVectorEnv (class in tianshou.env)
sync_weight() (tianshou.policy.DDPGPolicy method)
(tianshou.policy.DQNPolicy method)
(tianshou.policy.SACPolicy method)
(tianshou.policy.TD3Policy method)
T
TD3Policy (class in tianshou.policy)
test_episode() (in module tianshou.trainer)
tianshou.data
module
tianshou.env
module
tianshou.exploration
module
tianshou.policy
module
tianshou.trainer
module
tianshou.utils
module
to_numpy() (in module tianshou.data)
(tianshou.data.Batch method)
to_torch() (in module tianshou.data)
(tianshou.data.Batch method)
train() (tianshou.policy.DDPGPolicy method)
(tianshou.policy.DQNPolicy method)
(tianshou.policy.SACPolicy method)
(tianshou.policy.TD3Policy method)
U
update() (tianshou.data.ReplayBuffer method)
update_weight() (tianshou.data.PrioritizedReplayBuffer method)
V
values() (tianshou.data.Batch method)
VectorEnv (class in tianshou.env)