嘿,亲!知识可是无价之宝呢,但咱这精心整理的资料也耗费了不少心血呀。小小地破费一下,绝对物超所值哦!如有下载和支付问题,请联系我们QQ(微信同号):813200300
本次赞助数额为:2 元。微信扫码支付:2 元。
请留下您的邮箱,我们将在2小时内将文件发到您的邮箱
代码中包含 13 种强化学习算法。所调用的环境不仅包含 gym 提供的一些简单环境,还包括可以自行设计的环境(简单的迷宫游戏)。代码简洁明了,适合学习算法的同学使用;其中 A3C 与 PPO 还涉及并行运算的实现。
卷 软件 的文件夹 PATH 列表
卷序列号为 0D75-0D0C
D:.
└─Reinforcement-learning-with-tensorflow
│ LICENCE
│ README.md
│ RL_cover.jpg
│
├─.idea
│ misc.xml
│ modules.xml
│ Reinforcement-learning-with-tensorflow.iml
│ vcs.xml
│ workspace.xml
│
├─contents
│ ├─10_A3C
│ │ │ A3C_continuous_action.py
│ │ │ A3C_discrete_action.py
│ │ │ A3C_distributed_tf.py
│ │ │ A3C_RNN.py
│ │ │
│ │ └─log
│ │ events.out.tfevents.1551167889.DESKTOP-OSFDGN5
│ │
│ ├─11_Dyna_Q
│ │ maze_env.py
│ │ RL_brain.py
│ │ run_this.py
│ │
│ ├─12_Proximal_Policy_Optimization
│ │ │ discrete_DPPO.py
│ │ │ DPPO.py
│ │ │ PPO.py
│ │ │ simply_PPO.py
│ │ │ simply_PPO1.py
│ │ │
│ │ └─log
│ │ events.out.tfevents.1551178953.DESKTOP-OSFDGN5
│ │ events.out.tfevents.1551255571.DESKTOP-OSFDGN5
│ │ events.out.tfevents.1553224232.DESKTOP-OSFDGN5
│ │ events.out.tfevents.1553238324.DESKTOP-OSFDGN5
│ │ events.out.tfevents.1553837229.DESKTOP-OSFDGN5
│ │ events.out.tfevents.1554976756.DESKTOP-OSFDGN5
│ │ events.out.tfevents.1556507113.DESKTOP-OSFDGN5
│ │ events.out.tfevents.1556507732.DESKTOP-OSFDGN5
│ │ events.out.tfevents.1556518602.DESKTOP-OSFDGN5
│ │ events.out.tfevents.1556522855.DESKTOP-OSFDGN5
│ │ events.out.tfevents.1557300964.DESKTOP-OSFDGN5
│ │ events.out.tfevents.1557373659.DESKTOP-OSFDGN5
│ │ events.out.tfevents.1557891088.DESKTOP-OSFDGN5
│ │ events.out.tfevents.1557991550.DESKTOP-OSFDGN5
│ │ events.out.tfevents.1558410109.DESKTOP-OSFDGN5
│ │ events.out.tfevents.1558492818.DESKTOP-OSFDGN5
│ │ events.out.tfevents.1558493235.DESKTOP-OSFDGN5
│ │ events.out.tfevents.1558493411.DESKTOP-OSFDGN5
│ │ events.out.tfevents.1558523123.DESKTOP-OSFDGN5
│ │ events.out.tfevents.1558523249.DESKTOP-OSFDGN5
│ │ events.out.tfevents.1558523427.DESKTOP-OSFDGN5
│ │ events.out.tfevents.1558523705.DESKTOP-OSFDGN5
│ │ events.out.tfevents.1558523771.DESKTOP-OSFDGN5
│ │ events.out.tfevents.1558599329.DESKTOP-OSFDGN5
│ │ events.out.tfevents.1558601706.DESKTOP-OSFDGN5
│ │ events.out.tfevents.1558602205.DESKTOP-OSFDGN5
│ │ events.out.tfevents.1558602434.DESKTOP-OSFDGN5
│ │ events.out.tfevents.1558603717.DESKTOP-OSFDGN5
│ │ events.out.tfevents.1558604038.DESKTOP-OSFDGN5
│ │ events.out.tfevents.1558604207.DESKTOP-OSFDGN5
│ │ events.out.tfevents.1558604975.DESKTOP-OSFDGN5
│ │ events.out.tfevents.1558605865.DESKTOP-OSFDGN5
│ │ events.out.tfevents.1558606275.DESKTOP-OSFDGN5
│ │ events.out.tfevents.1558606399.DESKTOP-OSFDGN5
│ │ events.out.tfevents.1558607336.DESKTOP-OSFDGN5
│ │ events.out.tfevents.1558607454.DESKTOP-OSFDGN5
│ │ events.out.tfevents.1558607565.DESKTOP-OSFDGN5
│ │ events.out.tfevents.1558607756.DESKTOP-OSFDGN5
│ │ events.out.tfevents.1558607833.DESKTOP-OSFDGN5
│ │ events.out.tfevents.1558608089.DESKTOP-OSFDGN5
│ │ events.out.tfevents.1558608259.DESKTOP-OSFDGN5
│ │ events.out.tfevents.1558608468.DESKTOP-OSFDGN5
│ │ events.out.tfevents.1558608570.DESKTOP-OSFDGN5
│ │ events.out.tfevents.1558609087.DESKTOP-OSFDGN5
│ │ events.out.tfevents.1558609193.DESKTOP-OSFDGN5
│ │ events.out.tfevents.1558609349.DESKTOP-OSFDGN5
│ │ events.out.tfevents.1558609640.DESKTOP-OSFDGN5
│ │ events.out.tfevents.1558610084.DESKTOP-OSFDGN5
│ │ events.out.tfevents.1558610665.DESKTOP-OSFDGN5
│ │ events.out.tfevents.1558659163.DESKTOP-OSFDGN5
│ │ events.out.tfevents.1558659275.DESKTOP-OSFDGN5
│ │ events.out.tfevents.1558660352.DESKTOP-OSFDGN5
│ │ events.out.tfevents.1558661649.DESKTOP-OSFDGN5
│ │ events.out.tfevents.1558663823.DESKTOP-OSFDGN5
│ │ events.out.tfevents.1558664829.DESKTOP-OSFDGN5
│ │ events.out.tfevents.1558665334.DESKTOP-OSFDGN5
│ │ events.out.tfevents.1558667665.DESKTOP-OSFDGN5
│ │ events.out.tfevents.1558669203.DESKTOP-OSFDGN5
│ │ events.out.tfevents.1558672109.DESKTOP-OSFDGN5
│ │ events.out.tfevents.1558673239.DESKTOP-OSFDGN5
│ │ events.out.tfevents.1565602750.DESKTOP-OSFDGN5
│ │ events.out.tfevents.1565837491.DESKTOP-OSFDGN5
│ │ events.out.tfevents.1565837545.DESKTOP-OSFDGN5
│ │ events.out.tfevents.1565838580.DESKTOP-OSFDGN5
│ │ events.out.tfevents.1567677923.DESKTOP-OSFDGN5
│ │ events.out.tfevents.1567738605.DESKTOP-OSFDGN5
│ │ events.out.tfevents.1567738776.DESKTOP-OSFDGN5
│ │ events.out.tfevents.1567738924.DESKTOP-OSFDGN5
│ │ events.out.tfevents.1567738968.DESKTOP-OSFDGN5
│ │ events.out.tfevents.1568098203.DESKTOP-OSFDGN5
│ │
│ ├─13_saras
│ │ saras.py
│ │ __init__.py
│ │
│ ├─1_command_line_reinforcement_learning
│ │ treasure_on_right.py
│ │
│ ├─2_Q_Learning_maze
│ │ maze_env.py
│ │ RL_brain.py
│ │ run_this.py
│ │
│ ├─3_Sarsa_maze
│ │ │ maze_env.py
│ │ │ RL_brain.py
│ │ │ run_this.py
│ │ │
│ │ └─__pycache__
│ │ maze_env.cpython-35.pyc
│ │ RL_brain.cpython-35.pyc
│ │
│ ├─4_Sarsa_lambda_maze
│ │ maze_env.py
│ │ RL_brain.py
│ │ run_this.py
│ │
│ ├─5.1_Double_DQN
│ │ RL_brain.py
│ │ run_Pendulum.py
│ │
│ ├─5.2_Prioritized_Replay_DQN
│ │ RL_brain.py
│ │ run_MountainCar.py
│ │
│ ├─5.3_Dueling_DQN
│ │ RL_brain.py
│ │ run_Pendulum.py
│ │
│ ├─5_Deep_Q_Network
│ │ DQN_modified.py
│ │ maze_env.py
│ │ RL_brain.py
│ │ run_this.py
│ │
│ ├─6_OpenAI_gym
│ │ │ RL_brain.py
│ │ │ run_CartPole.py
│ │ │ run_MountainCar.py
│ │ │
│ │ └─__pycache__
│ │ RL_brain.cpython-35.pyc
│ │
│ ├─7_Policy_gradient_softmax
│ │ RL_brain.py
│ │ run_CartPole.py
│ │ run_MountainCar.py
│ │
│ ├─8_Actor_Critic_Advantage
│ │ AC_CartPole.py
│ │ AC_continue_Pendulum.py
│ │
│ ├─9_Deep_Deterministic_Policy_Gradient_DDPG
│ │ │ DDPG.py
│ │ │ DDPG_update.py
│ │ │ DDPG_update2.py
│ │ │
│ │ └─logs
│ │ events.out.tfevents.1553588612.DESKTOP-OSFDGN5
│ │ events.out.tfevents.1553664943.DESKTOP-OSFDGN5
│ │ events.out.tfevents.1553664974.DESKTOP-OSFDGN5
│ │ events.out.tfevents.1553665084.DESKTOP-OSFDGN5
│ │ events.out.tfevents.1553665248.DESKTOP-OSFDGN5
│ │ events.out.tfevents.1554974631.DESKTOP-OSFDGN5
│ │ events.out.tfevents.1556422021.DESKTOP-OSFDGN5
│ │ events.out.tfevents.1557133756.DESKTOP-OSFDGN5
│ │ events.out.tfevents.1561971410.DESKTOP-OSFDGN5
│ │ events.out.tfevents.1561971451.DESKTOP-OSFDGN5
│ │
│ └─Curiosity_Model
│ Curiosity.png
│ Curiosity.py
│ Random_Network_Distillation.py
│
└─experiments
├─2D_car
│ car_env.py
│ collision.py
│ DDPG.py
│
├─Robot_arm
│ │ A3C.py
│ │ arm_env.py
│ │ DDPG.py
│ │ DPPO.py
│ │
│ └─__pycache__
│ arm_env.cpython-35.pyc
│
├─Solve_BipedalWalker
│ │ A3C.py
│ │ A3C_rnn.py
│ │ DDPG.py
│ │
│ └─log
│ events.out.tfevents.1490801027.Morvan
│
└─Solve_LunarLander
A3C.py
DuelingDQNPrioritizedReplay.py
run_LunarLander.py