[{"title":"( 41 个子文件 11.42MB ) imitation_learning:PyTorch实现的一些强化学习算法:优势演员评论(A2C),近距离策略优化(PPO),V-MPO,行为克隆(BC)。 将添加更多算法-源码","children":[{"title":"imitation_learning-master","children":[{"title":"utils","children":[{"title":"vec_env.py <span style='color:#111;'> 11.44KB </span>","children":null,"spread":false},{"title":"batch_crop.py <span style='color:#111;'> 773B </span>","children":null,"spread":false},{"title":"utils.py <span style='color:#111;'> 816B </span>","children":null,"spread":false},{"title":"__init__.py <span style='color:#111;'> 0B </span>","children":null,"spread":false},{"title":"env_wrappers.py <span style='color:#111;'> 8.27KB </span>","children":null,"spread":false}],"spread":true},{"title":"algorithms","children":[{"title":"agents","children":[{"title":"v_mpo.py <span style='color:#111;'> 7.77KB </span>","children":null,"spread":false},{"title":"bc.py <span style='color:#111;'> 3.01KB </span>","children":null,"spread":false},{"title":"ppo.py <span style='color:#111;'> 7.62KB </span>","children":null,"spread":false},{"title":"agent_train.py <span style='color:#111;'> 7.81KB </span>","children":null,"spread":false},{"title":"a2c.py <span style='color:#111;'> 2.69KB </span>","children":null,"spread":false}],"spread":true},{"title":"kl_divergence.py <span style='color:#111;'> 1.56KB </span>","children":null,"spread":false},{"title":"real_nvp.py <span style='color:#111;'> 6.71KB </span>","children":null,"spread":false},{"title":"nn","children":[{"title":"conv_encoders.py <span style='color:#111;'> 3.25KB </span>","children":null,"spread":false},{"title":"recurrent_encoders.py <span style='color:#111;'> 2.48KB </span>","children":null,"spread":false},{"title":"actor_critic.py <span style='color:#111;'> 3.31KB </span>","children":null,"spread":false},{"title":"agent_model.py <span style='color:#111;'> 5.47KB </span>","children":null,"spread":false}],"spread":true},{"title":"normalization.py <span style='color:#111;'> 2.82KB </span>","children":null,"spread":false},{"title":"distributions.py <span style='color:#111;'> 9.36KB </span>","children":null,"spread":false}],"spread":true},{"title":"test.py <span style='color:#111;'> 6.31KB </span>","children":null,"spread":false},{"title":"requirements.txt <span style='color:#111;'> 92B </span>","children":null,"spread":false},{"title":"trainers","children":[{"title":"base_trainer.py <span style='color:#111;'> 2.29KB </span>","children":null,"spread":false},{"title":"rollout.py <span style='color:#111;'> 7.51KB </span>","children":null,"spread":false},{"title":"on_policy.py <span style='color:#111;'> 9.09KB </span>","children":null,"spread":false},{"title":"behavior_cloning.py <span style='color:#111;'> 1.51KB </span>","children":null,"spread":false}],"spread":true},{"title":"train_scripts","children":[{"title":"bc","children":[{"title":"cart_pole_10_episodes.py <span style='color:#111;'> 1.62KB </span>","children":null,"spread":false}],"spread":true},{"title":"ppo","children":[{"title":"bipedal_rnn.py <span style='color:#111;'> 2.38KB </span>","children":null,"spread":false},{"title":"car_racing.py <span style='color:#111;'> 2.21KB </span>","children":null,"spread":false},{"title":"cart_pole.py <span style='color:#111;'> 1.69KB </span>","children":null,"spread":false},{"title":"bipedal_hardcore.py <span style='color:#111;'> 2.58KB </span>","children":null,"spread":false},{"title":"bipedal.py <span style='color:#111;'> 1.80KB </span>","children":null,"spread":false},{"title":"humanoid.py <span style='color:#111;'> 1.94KB </span>","children":null,"spread":false},{"title":"cart_pole_rnn.py <span style='color:#111;'> 2.16KB </span>","children":null,"spread":false}],"spread":true},{"title":"a2c","children":[{"title":"cart_pole.py <span style='color:#111;'> 1.61KB </span>","children":null,"spread":false},{"title":"cart_pole_rnn.py <span style='color:#111;'> 2.13KB </span>","children":null,"spread":false}],"spread":true}],"spread":true},{"title":".gitignore <span style='color:#111;'> 90B </span>","children":null,"spread":false},{"title":"gifs","children":[{"title":"cartpole.gif <span style='color:#111;'> 84.82KB </span>","children":null,"spread":false},{"title":"car_racing.gif <span style='color:#111;'> 5.93MB </span>","children":null,"spread":false},{"title":"humanoid.gif <span style='color:#111;'> 3.67MB </span>","children":null,"spread":false},{"title":"bipedal.gif <span style='color:#111;'> 1.78MB </span>","children":null,"spread":false}],"spread":true},{"title":"custom_environments","children":[{"title":"mario_wrapper.py <span style='color:#111;'> 1.42KB </span>","children":null,"spread":false}],"spread":true},{"title":"readme.md <span style='color:#111;'> 7.00KB </span>","children":null,"spread":false}],"spread":true}],"spread":true}]