[{"title":"( 15 个子文件 23KB ) RL Latest Tech分层强化学习:Option-Critic架构算法","children":[{"title":"option_critic-master","children":[{"title":"train_q.py <span style='color:#111;'> 1.43KB </span>","children":null,"spread":false},{"title":"init.py <span style='color:#111;'> 0B </span>","children":null,"spread":false},{"title":"learning.py <span style='color:#111;'> 3.55KB </span>","children":null,"spread":false},{"title":"run_best_model.py <span style='color:#111;'> 324B </span>","children":null,"spread":false},{"title":"train_agent.py <span style='color:#111;'> 16.14KB </span>","children":null,"spread":false},{"title":"exp_replay.py <span style='color:#111;'> 4.53KB </span>","children":null,"spread":false},{"title":"fourrooms","children":[{"title":"fourrooms.py <span style='color:#111;'> 2.79KB </span>","children":null,"spread":false},{"title":"transfer.py <span style='color:#111;'> 11.29KB </span>","children":null,"spread":false},{"title":"README.md <span style='color:#111;'> 1.66KB </span>","children":null,"spread":false}],"spread":true},{"title":"neural_net.py <span style='color:#111;'> 8.91KB </span>","children":null,"spread":false},{"title":".gitignore <span style='color:#111;'> 22B </span>","children":null,"spread":false},{"title":"nnet.py <span style='color:#111;'> 4.38KB </span>","children":null,"spread":false},{"title":"launcher.py <span style='color:#111;'> 10.59KB </span>","children":null,"spread":false},{"title":"README.md <span style='color:#111;'> 662B </span>","children":null,"spread":false},{"title":"plot_learning.py <span style='color:#111;'> 2.24KB </span>","children":null,"spread":false}],"spread":false}],"spread":true}]