[{"title":"( 60 个子文件 5.82MB ) 带有火炬的深度增强学习:DQN,AC,ACER,A2C,A3C,PG,DDPG,TRPO,PPO,SAC,TD3和PyTorch实施...-源码","children":[{"title":"Deep-reinforcement-learning-with-pytorch-master","children":[{"title":"figures","children":[{"title":"test.png <span style='color:#111;'> 11.38KB </span>","children":null,"spread":false}],"spread":true},{"title":"Char02 Policy Gradient","children":[{"title":"Run_Model.py <span style='color:#111;'> 2.32KB </span>","children":null,"spread":false},{"title":"pytorch_MountainCar-v0.py <span style='color:#111;'> 2.91KB </span>","children":null,"spread":false},{"title":"REINFORCE.py <span style='color:#111;'> 3.05KB </span>","children":null,"spread":false},{"title":"naive-policy-gradient.py <span style='color:#111;'> 3.78KB </span>","children":null,"spread":false},{"title":"PolicyGradient.py <span style='color:#111;'> 3.09KB </span>","children":null,"spread":false},{"title":"REINFORCE_with_Baseline.py <span style='color:#111;'> 3.96KB </span>","children":null,"spread":false}],"spread":true},{"title":"Char03 Actor-Critic","children":[{"title":"AC_MountainCar-v0.py <span style='color:#111;'> 3.60KB </span>","children":null,"spread":false},{"title":"AC_CartPole-v0.py <span style='color:#111;'> 3.26KB </span>","children":null,"spread":false}],"spread":true},{"title":"Char04 A2C","children":[{"title":"multiprocessing_env.py <span style='color:#111;'> 4.78KB </span>","children":null,"spread":false},{"title":"A2C.py <span style='color:#111;'> 3.85KB </span>","children":null,"spread":false}],"spread":true},{"title":"Char10 TD3","children":[{"title":"TD3_Pendulum-v0.png <span style='color:#111;'> 47.53KB </span>","children":null,"spread":false},{"title":"TD3_BipedalWalker-v2.py <span style='color:#111;'> 12.90KB </span>","children":null,"spread":false},{"title":"expTD3_BipedalWalker-v2.pyBipedalWalker-v2.","children":[{"title":"critic_1_target.pth <span style='color:#111;'> 517.48KB </span>","children":null,"spread":false},{"title":"critic_2.pth <span style='color:#111;'> 517.48KB </span>","children":null,"spread":false},{"title":"actor.pth <span style='color:#111;'> 514.76KB </span>","children":null,"spread":false},{"title":"critic_1.pth <span style='color:#111;'> 517.48KB </span>","children":null,"spread":false},{"title":"critic_2_target.pth <span style='color:#111;'> 517.48KB </span>","children":null,"spread":false},{"title":"actor_target.pth <span style='color:#111;'> 514.76KB </span>","children":null,"spread":false}],"spread":true},{"title":"expTD3.pyPendulum-v0.","children":[{"title":"critic_1_target.pth <span style='color:#111;'> 479.98KB </span>","children":null,"spread":false},{"title":"critic_2.pth <span style='color:#111;'> 479.98KB </span>","children":null,"spread":false},{"title":"actor.pth <span style='color:#111;'> 478.42KB </span>","children":null,"spread":false},{"title":"critic_1.pth <span style='color:#111;'> 479.98KB </span>","children":null,"spread":false},{"title":"critic_2_target.pth <span style='color:#111;'> 479.98KB </span>","children":null,"spread":false},{"title":"actor_target.pth <span style='color:#111;'> 478.42KB </span>","children":null,"spread":false}],"spread":true},{"title":"Episode_reward_TD3_BipedakWalker.png <span style='color:#111;'> 89.23KB </span>","children":null,"spread":false},{"title":"TD3.py <span style='color:#111;'> 12.71KB </span>","children":null,"spread":false}],"spread":true},{"title":"Char01 DQN","children":[{"title":"DQN","children":[{"title":"pic","children":[{"title":"finish_episode.jpg <span style='color:#111;'> 34.84KB </span>","children":null,"spread":false},{"title":"value_loss.jpg <span style='color:#111;'> 35.01KB </span>","children":null,"spread":false},{"title":"readme.md <span style='color:#111;'> 7B </span>","children":null,"spread":false}],"spread":true}],"spread":true},{"title":"DQN_CartPole-v0.py <span style='color:#111;'> 4.09KB </span>","children":null,"spread":false},{"title":"DQN.py <span style='color:#111;'> 4.77KB </span>","children":null,"spread":false},{"title":"DQN_MountainCar-v0.py <span style='color:#111;'> 4.09KB </span>","children":null,"spread":false},{"title":"DQN_mountain_car_v1.py <span style='color:#111;'> 4.21KB </span>","children":null,"spread":false},{"title":"readme.md <span style='color:#111;'> 997B </span>","children":null,"spread":false},{"title":"naiveDQN.py <span style='color:#111;'> 4.20KB </span>","children":null,"spread":false}],"spread":true},{"title":"requirements.txt <span style='color:#111;'> 70B </span>","children":null,"spread":false},{"title":"Char07 PPO","children":[{"title":"PPO_CartPole_v0.py <span style='color:#111;'> 6.11KB </span>","children":null,"spread":false},{"title":"PPO2.py <span style='color:#111;'> 6.64KB </span>","children":null,"spread":false},{"title":"PPO_pendulum.py <span style='color:#111;'> 6.26KB </span>","children":null,"spread":false},{"title":"PPO_MountainCar-v0.py <span style='color:#111;'> 6.14KB </span>","children":null,"spread":false},{"title":"readme.md <span style='color:#111;'> 185B </span>","children":null,"spread":false}],"spread":true},{"title":"LICENSE <span style='color:#111;'> 1.04KB </span>","children":null,"spread":false},{"title":"Char00 Conventional Algorithms","children":[{"title":"gridworld.py <span style='color:#111;'> 6.64KB </span>","children":null,"spread":false},{"title":"Sarsa.py <span style='color:#111;'> 2.89KB </span>","children":null,"spread":false},{"title":"Q-learning.py <span style='color:#111;'> 2.70KB </span>","children":null,"spread":false}],"spread":true},{"title":"Char08 ACER","children":[{"title":"readme.md <span style='color:#111;'> 44B </span>","children":null,"spread":false}],"spread":true},{"title":"Char09 SAC","children":[{"title":"SAC_ep_r_curve.png <span style='color:#111;'> 62.16KB </span>","children":null,"spread":false},{"title":"SAC_dual_Q_net.py <span style='color:#111;'> 11.69KB </span>","children":null,"spread":false},{"title":"SAC.py <span style='color:#111;'> 11.00KB </span>","children":null,"spread":false},{"title":"test_agent.py <span style='color:#111;'> 12.44KB </span>","children":null,"spread":false},{"title":"SAC_BipedalWalker-v2.py <span style='color:#111;'> 12.48KB </span>","children":null,"spread":false}],"spread":true},{"title":"Char05 DDPG","children":[{"title":"DDPG_exp.jpg <span style='color:#111;'> 61.21KB </span>","children":null,"spread":false},{"title":"README.md <span style='color:#111;'> 420B </span>","children":null,"spread":false},{"title":"DDPG.py <span style='color:#111;'> 10.02KB </span>","children":null,"spread":false}],"spread":true},{"title":"readme.md <span style='color:#111;'> 8.26KB </span>","children":null,"spread":false},{"title":"More","children":[{"title":"Application in real world","children":[{"title":"README.md <span style='color:#111;'> 274B </span>","children":null,"spread":false}],"spread":false},{"title":"MARL","children":[{"title":"README.md <span style='color:#111;'> 581B </span>","children":null,"spread":false}],"spread":false},{"title":"readme.md <span style='color:#111;'> 53B </span>","children":null,"spread":false},{"title":"plot.py <span style='color:#111;'> 1.40KB </span>","children":null,"spread":false}],"spread":false}],"spread":false}],"spread":true}]