[{"title":"(41个子文件11.42MB)imitation_learning:PyTorch实现的一些强化学习算法:优势演员评论(A2C),近距离策略优化(PPO),V-MPO,行为克隆(BC)。将添加更多算法-源码","children":[{"title":"imitation_learning-master","children":[{"title":"utils","children":[{"title":"vec_env.py <span style='color:#111;'>11.44KB</span>","children":null,"spread":false},{"title":"batch_crop.py <span style='color:#111;'>773B</span>","children":null,"spread":false},{"title":"utils.py <span style='color:#111;'>816B</span>","children":null,"spread":false},{"title":"__init__.py <span style='color:#111;'>0B</span>","children":null,"spread":false},{"title":"env_wrappers.py <span style='color:#111;'>8.27KB</span>","children":null,"spread":false}],"spread":true},{"title":"algorithms","children":[{"title":"agents","children":[{"title":"v_mpo.py <span style='color:#111;'>7.77KB</span>","children":null,"spread":false},{"title":"bc.py <span style='color:#111;'>3.01KB</span>","children":null,"spread":false},{"title":"ppo.py <span style='color:#111;'>7.62KB</span>","children":null,"spread":false},{"title":"agent_train.py <span style='color:#111;'>7.81KB</span>","children":null,"spread":false},{"title":"a2c.py <span style='color:#111;'>2.69KB</span>","children":null,"spread":false}],"spread":true},{"title":"kl_divergence.py <span style='color:#111;'>1.56KB</span>","children":null,"spread":false},{"title":"real_nvp.py <span style='color:#111;'>6.71KB</span>","children":null,"spread":false},{"title":"nn","children":[{"title":"conv_encoders.py <span style='color:#111;'>3.25KB</span>","children":null,"spread":false},{"title":"recurrent_encoders.py <span style='color:#111;'>2.48KB</span>","children":null,"spread":false},{"title":"actor_critic.py <span style='color:#111;'>3.31KB</span>","children":null,"spread":false},{"title":"agent_model.py <span style='color:#111;'>5.47KB</span>","children":null,"spread":false}],"spread":true},{"title":"normalization.py <span style='color:#111;'>2.82KB</span>","children":null,"spread":false},{"title":"distributions.py <span style='color:#111;'>9.36KB</span>","children":null,"spread":false}],"spread":true},{"title":"test.py <span style='color:#111;'>6.31KB</span>","children":null,"spread":false},{"title":"requirements.txt <span style='color:#111;'>92B</span>","children":null,"spread":false},{"title":"trainers","children":[{"title":"base_trainer.py <span style='color:#111;'>2.29KB</span>","children":null,"spread":false},{"title":"rollout.py <span style='color:#111;'>7.51KB</span>","children":null,"spread":false},{"title":"on_policy.py <span style='color:#111;'>9.09KB</span>","children":null,"spread":false},{"title":"behavior_cloning.py <span style='color:#111;'>1.51KB</span>","children":null,"spread":false}],"spread":true},{"title":"train_scripts","children":[{"title":"bc","children":[{"title":"cart_pole_10_episodes.py <span style='color:#111;'>1.62KB</span>","children":null,"spread":false}],"spread":true},{"title":"ppo","children":[{"title":"bipedal_rnn.py <span style='color:#111;'>2.38KB</span>","children":null,"spread":false},{"title":"car_racing.py <span style='color:#111;'>2.21KB</span>","children":null,"spread":false},{"title":"cart_pole.py <span style='color:#111;'>1.69KB</span>","children":null,"spread":false},{"title":"bipedal_hardcore.py <span style='color:#111;'>2.58KB</span>","children":null,"spread":false},{"title":"bipedal.py <span style='color:#111;'>1.80KB</span>","children":null,"spread":false},{"title":"humanoid.py <span style='color:#111;'>1.94KB</span>","children":null,"spread":false},{"title":"cart_pole_rnn.py <span style='color:#111;'>2.16KB</span>","children":null,"spread":false}],"spread":true},{"title":"a2c","children":[{"title":"cart_pole.py <span style='color:#111;'>1.61KB</span>","children":null,"spread":false},{"title":"cart_pole_rnn.py <span style='color:#111;'>2.13KB</span>","children":null,"spread":false}],"spread":true}],"spread":true},{"title":".gitignore <span style='color:#111;'>90B</span>","children":null,"spread":false},{"title":"gifs","children":[{"title":"cartpole.gif <span style='color:#111;'>84.82KB</span>","children":null,"spread":false},{"title":"car_racing.gif <span style='color:#111;'>5.93MB</span>","children":null,"spread":false},{"title":"humanoid.gif <span style='color:#111;'>3.67MB</span>","children":null,"spread":false},{"title":"bipedal.gif <span style='color:#111;'>1.78MB</span>","children":null,"spread":false}],"spread":true},{"title":"custom_environments","children":[{"title":"mario_wrapper.py <span style='color:#111;'>1.42KB</span>","children":null,"spread":false}],"spread":true},{"title":"readme.md <span style='color:#111;'>7.00KB</span>","children":null,"spread":false}],"spread":true}],"spread":true}]