[{"title":"( 103 个子文件 2MB ) Popular-RL-Algorithms:软参与者关键(SAC),双延迟DDPG(TD3),参与者关键(ACA2C),近端策略优化(PPO),QT-Opt,PointNet的PyTorch实施。","children":[{"title":".gitmodules <span style='color:#111;'> 239B </span>","children":null,"spread":false},{"title":"qt_opt_v3.py <span style='color:#111;'> 12.13KB </span>","children":null,"spread":false},{"title":"events.out.tfevents.1577364245.quantumiracle-G3-3579 <span style='color:#111;'> 237.07KB </span>","children":null,"spread":false},{"title":"ddpg.py <span style='color:#111;'> 12.31KB </span>","children":null,"spread":false},{"title":"_policies.py <span style='color:#111;'> 588B </span>","children":null,"spread":false},{"title":"CEM_Gaussian_test.ipynb <span style='color:#111;'> 75.99KB </span>","children":null,"spread":false},{"title":"cem.py <span style='color:#111;'> 3.34KB </span>","children":null,"spread":false},{"title":"RunJupyter.py <span style='color:#111;'> 159B </span>","children":null,"spread":false},{"title":"CEM_Categorical_test.ipynb <span style='color:#111;'> 51.67KB </span>","children":null,"spread":false},{"title":"CEM_Categorical_test-checkpoint.ipynb <span style='color:#111;'> 51.67KB </span>","children":null,"spread":false},{"title":"CEM_Gaussian_test-checkpoint.ipynb <span style='color:#111;'> 74.59KB </span>","children":null,"spread":false},{"title":"sdt_train.py <span style='color:#111;'> 1.29KB </span>","children":null,"spread":false},{"title":"sdt_train.cpython-36.pyc <span style='color:#111;'> 967B </span>","children":null,"spread":false},{"title":"SDT.cpython-36.pyc <span style='color:#111;'> 4.41KB </span>","children":null,"spread":false},{"title":"SDT.py <span style='color:#111;'> 5.88KB </span>","children":null,"spread":false},{"title":"ac.py <span style='color:#111;'> 17.55KB </span>","children":null,"spread":false},{"title":"sac_nonautoentropy.png <span style='color:#111;'> 64.00KB </span>","children":null,"spread":false},{"title":"td3_deterministic.png <span style='color:#111;'> 90.32KB </span>","children":null,"spread":false},{"title":"ac_cartpole.png <span style='color:#111;'> 121.48KB </span>","children":null,"spread":false},{"title":"td3_nondeterministic.png <span style='color:#111;'> 83.65KB </span>","children":null,"spread":false},{"title":"sac_autoentropy.png <span style='color:#111;'> 54.95KB </span>","children":null,"spread":false},{"title":"ppo_single_2 (copy).png <span style='color:#111;'> 22.65KB </span>","children":null,"spread":false},{"title":"pendulum.png <span style='color:#111;'> 41.92KB </span>","children":null,"spread":false},{"title":"ac.png <span style='color:#111;'> 46.49KB </span>","children":null,"spread":false},{"title":"ppo_single_2.png <span style='color:#111;'> 26.17KB </span>","children":null,"spread":false},{"title":"ppo_continuous3.py <span style='color:#111;'> 7.71KB </span>","children":null,"spread":false},{"title":"ppo_continuous_multiprocess.py <span style='color:#111;'> 15.24KB </span>","children":null,"spread":false},{"title":"ddpg_target_q <span style='color:#111;'> 35.36KB </span>","children":null,"spread":false},{"title":"ddpg_policy <span style='color:#111;'> 18.60KB </span>","children":null,"spread":false},{"title":"rdpg_policy <span style='color:#111;'> 149.30KB </span>","children":null,"spread":false},{"title":"rdpg_q <span style='color:#111;'> 149.55KB </span>","children":null,"spread":false},{"title":"ddpg_q <span style='color:#111;'> 35.36KB </span>","children":null,"spread":false},{"title":"rdpg_target_q <span style='color:#111;'> 149.55KB </span>","children":null,"spread":false},{"title":"plot.ipynb <span style='color:#111;'> 34.52KB </span>","children":null,"spread":false},{"title":"sac_v2_lstm.py <span style='color:#111;'> 12.98KB </span>","children":null,"spread":false},{"title":"reacher.cpython-36.pyc <span style='color:#111;'> 4.80KB </span>","children":null,"spread":false},{"title":"reacher.cpython-35.pyc <span style='color:#111;'> 5.40KB </span>","children":null,"spread":false},{"title":"sac_v2_multiprocess_multi_gpu.py <span style='color:#111;'> 26.95KB </span>","children":null,"spread":false},{"title":"ppo_continuous.py <span style='color:#111;'> 13.84KB </span>","children":null,"spread":false},{"title":"reward_compare_td3.pdf <span style='color:#111;'> 26.99KB </span>","children":null,"spread":false},{"title":"plot.ipynb <span style='color:#111;'> 68.00KB </span>","children":null,"spread":false},{"title":"sac_v2_lstm.py <span style='color:#111;'> 12.29KB </span>","children":null,"spread":false},{"title":"td3_lstm.py <span style='color:#111;'> 12.65KB </span>","children":null,"spread":false},{"title":"value_networks.py <span style='color:#111;'> 5.96KB </span>","children":null,"spread":false},{"title":"buffers.py <span style='color:#111;'> 6.89KB </span>","children":null,"spread":false},{"title":"utils.py <span style='color:#111;'> 686B </span>","children":null,"spread":false},{"title":"initialize.cpython-36.pyc <span style='color:#111;'> 826B </span>","children":null,"spread":false},{"title":"value_networks.cpython-36.pyc <span style='color:#111;'> 5.15KB </span>","children":null,"spread":false},{"title":"policy_networks.cpython-36.pyc <span style='color:#111;'> 14.25KB </span>","children":null,"spread":false},{"title":"utils.cpython-36.pyc <span style='color:#111;'> 930B </span>","children":null,"spread":false},{"title":"buffers.cpython-36.pyc <span style='color:#111;'> 6.13KB </span>","children":null,"spread":false},{"title":"optimizers.py <span style='color:#111;'> 4.78KB </span>","children":null,"spread":false},{"title":"policy_networks.py <span style='color:#111;'> 18.91KB </span>","children":null,"spread":false},{"title":"initialize.py <span style='color:#111;'> 515B </span>","children":null,"spread":false},{"title":"reward_compare_sac.pdf <span style='color:#111;'> 16.02KB </span>","children":null,"spread":false},{"title":"td3.py <span style='color:#111;'> 16.98KB </span>","children":null,"spread":false},{"title":"sac_v2.py <span style='color:#111;'> 16.83KB </span>","children":null,"spread":false},{"title":"plot-checkpoint.ipynb <span style='color:#111;'> 68.00KB </span>","children":null,"spread":false},{"title":"reward_compare_td3.pdf <span style='color:#111;'> 26.99KB </span>","children":null,"spread":false},{"title":"plot.ipynb <span style='color:#111;'> 68.39KB </span>","children":null,"spread":false},{"title":"ppo_discrete.py <span style='color:#111;'> 4.48KB </span>","children":null,"spread":false},{"title":"reacher.py <span style='color:#111;'> 7.69KB </span>","children":null,"spread":false},{"title":"LICENSE <span style='color:#111;'> 11.09KB </span>","children":null,"spread":false},{"title":"td3_lstm.py <span style='color:#111;'> 12.97KB </span>","children":null,"spread":false},{"title":"ppo_continuous2.py <span style='color:#111;'> 13.96KB </span>","children":null,"spread":false},{"title":"rdpg.py <span style='color:#111;'> 11.67KB </span>","children":null,"spread":false},{"title":"reward_compare.pdf <span style='color:#111;'> 12.24KB </span>","children":null,"spread":false},{"title":"value_networks.py <span style='color:#111;'> 7.67KB </span>","children":null,"spread":false},{"title":"buffers.py <span style='color:#111;'> 6.89KB </span>","children":null,"spread":false},{"title":"utils.py <span style='color:#111;'> 686B </span>","children":null,"spread":false},{"title":"initialize.cpython-36.pyc <span style='color:#111;'> 826B </span>","children":null,"spread":false},{"title":"value_networks.cpython-36.pyc <span style='color:#111;'> 6.54KB </span>","children":null,"spread":false},{"title":"policy_networks.cpython-36.pyc <span style='color:#111;'> 16.95KB </span>","children":null,"spread":false},{"title":"utils.cpython-36.pyc <span style='color:#111;'> 930B </span>","children":null,"spread":false},{"title":"buffers.cpython-36.pyc <span style='color:#111;'> 6.13KB </span>","children":null,"spread":false},{"title":"optimizers.py <span style='color:#111;'> 4.78KB </span>","children":null,"spread":false},{"title":"policy_networks.py <span style='color:#111;'> 22.37KB </span>","children":null,"spread":false},{"title":"initialize.py <span style='color:#111;'> 515B </span>","children":null,"spread":false},{"title":"ramble_sac.md <span style='color:#111;'> 5.48KB </span>","children":null,"spread":false},{"title":"ppo_gae_discrete.py <span style='color:#111;'> 4.22KB </span>","children":null,"spread":false},{"title":"sac_v2_multiprocess.py <span style='color:#111;'> 21.11KB </span>","children":null,"spread":false},{"title":"td3.py <span style='color:#111;'> 17.36KB </span>","children":null,"spread":false},{"title":"sac_pendulum.py <span style='color:#111;'> 10.03KB </span>","children":null,"spread":false},{"title":"requirements.txt <span style='color:#111;'> 2.55KB </span>","children":null,"spread":false},{"title":"td3_multiprocess.py <span style='color:#111;'> 21.53KB </span>","children":null,"spread":false},{"title":"ppo_continuous_tf.py <span style='color:#111;'> 9.06KB </span>","children":null,"spread":false},{"title":"checkpoint <span style='color:#111;'> 63B </span>","children":null,"spread":false},{"title":"ppo.index <span style='color:#111;'> 1.36KB </span>","children":null,"spread":false},{"title":"ppo.meta <span style='color:#111;'> 138.25KB </span>","children":null,"spread":false},{"title":"ppo.data-00000-of-00001 <span style='color:#111;'> 32.12KB </span>","children":null,"spread":false},{"title":"ppo_continuous_multiprocess2.py <span style='color:#111;'> 15.18KB </span>","children":null,"spread":false},{"title":".gitignore <span style='color:#111;'> 114B </span>","children":null,"spread":false},{"title":"ppo_gae_continuous_not_work.py <span style='color:#111;'> 5.99KB </span>","children":null,"spread":false},{"title":"sac_v2.py <span style='color:#111;'> 17.39KB </span>","children":null,"spread":false},{"title":"sac_v2_multithread.py <span style='color:#111;'> 17.96KB </span>","children":null,"spread":false},{"title":"sac_v2_gru.py <span style='color:#111;'> 13.24KB </span>","children":null,"spread":false},{"title":"plot-checkpoint.ipynb <span style='color:#111;'> 34.45KB </span>","children":null,"spread":false},{"title":"README.md <span style='color:#111;'> 6.63KB </span>","children":null,"spread":false},{"title":"sdt_ppo_gae_discrete.py <span style='color:#111;'> 5.56KB </span>","children":null,"spread":false},{"title":"sac.py <span style='color:#111;'> 15.60KB </span>","children":null,"spread":false},{"title":"......","children":null,"spread":false},{"title":"<span style='color:steelblue;'>文件过多,未全部展示</span>","children":null,"spread":false}],"spread":true}]