[{"title":"( 58 个子文件 271KB ) 莫烦python RL代码","children":[{"title":"Reinforcement-learning-with-tensorflow-master","children":[{"title":"contents","children":[{"title":"5.2_Prioritized_Replay_DQN","children":[{"title":"RL_brain.py <span style='color:#111;'> 11.55KB </span>","children":null,"spread":false},{"title":"run_MountainCar.py <span style='color:#111;'> 2.06KB </span>","children":null,"spread":false}],"spread":true},{"title":"7_Policy_gradient_softmax","children":[{"title":"RL_brain.py <span style='color:#111;'> 4.24KB </span>","children":null,"spread":false},{"title":"run_MountainCar.py <span style='color:#111;'> 1.98KB </span>","children":null,"spread":false},{"title":"run_CartPole.py <span style='color:#111;'> 1.77KB </span>","children":null,"spread":false}],"spread":true},{"title":"5_Deep_Q_Network","children":[{"title":"RL_brain.py <span style='color:#111;'> 8.22KB </span>","children":null,"spread":false},{"title":"maze_env.py <span style='color:#111;'> 4.07KB </span>","children":null,"spread":false},{"title":"DQN_modified.py <span style='color:#111;'> 6.41KB </span>","children":null,"spread":false},{"title":"run_this.py <span style='color:#111;'> 1.31KB </span>","children":null,"spread":false}],"spread":true},{"title":"4_Sarsa_lambda_maze","children":[{"title":"RL_brain.py <span style='color:#111;'> 3.09KB </span>","children":null,"spread":false},{"title":"maze_env.py <span style='color:#111;'> 3.92KB </span>","children":null,"spread":false},{"title":"run_this.py <span style='color:#111;'> 1.56KB </span>","children":null,"spread":false}],"spread":true},{"title":"5.1_Double_DQN","children":[{"title":"RL_brain.py <span style='color:#111;'> 6.52KB </span>","children":null,"spread":false},{"title":"run_Pendulum.py <span style='color:#111;'> 2.08KB </span>","children":null,"spread":false}],"spread":true},{"title":"3_Sarsa_maze","children":[{"title":"RL_brain.py <span style='color:#111;'> 2.63KB </span>","children":null,"spread":false},{"title":"maze_env.py <span style='color:#111;'> 3.92KB </span>","children":null,"spread":false},{"title":"run_this.py <span style='color:#111;'> 1.47KB </span>","children":null,"spread":false}],"spread":true},{"title":"12_Proximal_Policy_Optimization","children":[{"title":"discrete_DPPO.py <span style='color:#111;'> 8.60KB </span>","children":null,"spread":false},{"title":"simply_PPO.py <span style='color:#111;'> 6.31KB </span>","children":null,"spread":false},{"title":"DPPO.py <span style='color:#111;'> 8.08KB </span>","children":null,"spread":false}],"spread":true},{"title":"11_Dyna_Q","children":[{"title":"RL_brain.py <span style='color:#111;'> 2.85KB </span>","children":null,"spread":false},{"title":"maze_env.py <span style='color:#111;'> 3.81KB </span>","children":null,"spread":false},{"title":"run_this.py <span style='color:#111;'> 1.46KB </span>","children":null,"spread":false}],"spread":true},{"title":"8_Actor_Critic_Advantage","children":[{"title":"AC_continue_Pendulum.py <span style='color:#111;'> 6.24KB </span>","children":null,"spread":false},{"title":"AC_CartPole.py <span style='color:#111;'> 5.72KB </span>","children":null,"spread":false}],"spread":true},{"title":"1_command_line_reinforcement_learning","children":[{"title":"treasure_on_right.py <span style='color:#111;'> 3.36KB </span>","children":null,"spread":false}],"spread":true},{"title":"2_Q_Learning_maze","children":[{"title":"RL_brain.py <span style='color:#111;'> 1.79KB </span>","children":null,"spread":false},{"title":"maze_env.py <span style='color:#111;'> 4.21KB </span>","children":null,"spread":false},{"title":"run_this.py <span style='color:#111;'> 1.36KB </span>","children":null,"spread":false}],"spread":true},{"title":"5.3_Dueling_DQN","children":[{"title":"RL_brain.py <span style='color:#111;'> 6.56KB </span>","children":null,"spread":false},{"title":"run_Pendulum.py <span style='color:#111;'> 2.11KB </span>","children":null,"spread":false}],"spread":true},{"title":"10_A3C","children":[{"title":"A3C_continuous_action.py <span style='color:#111;'> 7.97KB </span>","children":null,"spread":false},{"title":"A3C_RNN.py <span style='color:#111;'> 9.21KB </span>","children":null,"spread":false},{"title":"A3C_distributed_tf.py <span style='color:#111;'> 8.98KB </span>","children":null,"spread":false},{"title":"A3C_discrete_action.py <span style='color:#111;'> 7.70KB </span>","children":null,"spread":false}],"spread":false},{"title":"9_Deep_Deterministic_Policy_Gradient_DDPG","children":[{"title":"DDPG_update.py <span style='color:#111;'> 5.63KB </span>","children":null,"spread":false},{"title":"DDPG.py <span style='color:#111;'> 9.76KB </span>","children":null,"spread":false},{"title":"DDPG_update2.py <span style='color:#111;'> 5.55KB </span>","children":null,"spread":false}],"spread":false},{"title":"6_OpenAI_gym","children":[{"title":"RL_brain.py <span style='color:#111;'> 8.18KB </span>","children":null,"spread":false},{"title":"run_MountainCar.py <span style='color:#111;'> 1.32KB </span>","children":null,"spread":false},{"title":"run_CartPole.py <span style='color:#111;'> 1.44KB </span>","children":null,"spread":false}],"spread":false}],"spread":false},{"title":"experiments","children":[{"title":"Solve_BipedalWalker","children":[{"title":"A3C.py <span style='color:#111;'> 8.39KB </span>","children":null,"spread":false},{"title":"A3C_rnn.py <span style='color:#111;'> 9.84KB </span>","children":null,"spread":false},{"title":"log","children":[{"title":"events.out.tfevents.1490801027.Morvan <span style='color:#111;'> 1.07MB </span>","children":null,"spread":false}],"spread":true},{"title":"DDPG.py <span style='color:#111;'> 15.72KB </span>","children":null,"spread":false}],"spread":true},{"title":"Solve_LunarLander","children":[{"title":"A3C.py <span style='color:#111;'> 9.43KB </span>","children":null,"spread":false},{"title":"run_LunarLander.py <span style='color:#111;'> 1.67KB </span>","children":null,"spread":false},{"title":"DuelingDQNPrioritizedReplay.py <span style='color:#111;'> 12.72KB </span>","children":null,"spread":false}],"spread":true},{"title":"2D_car","children":[{"title":"car_env.py <span style='color:#111;'> 7.77KB </span>","children":null,"spread":false},{"title":"DDPG.py <span style='color:#111;'> 9.57KB </span>","children":null,"spread":false},{"title":"collision.py <span style='color:#111;'> 2.02KB </span>","children":null,"spread":false}],"spread":true},{"title":"Robot_arm","children":[{"title":"A3C.py <span style='color:#111;'> 8.42KB </span>","children":null,"spread":false},{"title":"arm_env.py <span style='color:#111;'> 8.28KB </span>","children":null,"spread":false},{"title":"DDPG.py <span style='color:#111;'> 10.13KB </span>","children":null,"spread":false},{"title":"DPPO.py <span style='color:#111;'> 7.84KB </span>","children":null,"spread":false}],"spread":true}],"spread":true},{"title":"LICENCE <span style='color:#111;'> 1.03KB </span>","children":null,"spread":false},{"title":"README.md <span style='color:#111;'> 6.96KB </span>","children":null,"spread":false},{"title":"RL_cover.jpg <span style='color:#111;'> 68.07KB </span>","children":null,"spread":false}],"spread":true}],"spread":true}]