[{"title":"(11个子文件14.99MB)DavidSilver强化学习(reinforcementlearning)课程PPT","children":[{"title":"DavidSilver强化学习(reinforcementlearning)课程PPT","children":[{"title":"intergratinglearningandplanning.pdf <span style='color:#111;'>2.08MB</span>","children":null,"spread":false},{"title":"MC-TD.pdf <span style='color:#111;'>1.39MB</span>","children":null,"spread":false},{"title":"DP.pdf <span style='color:#111;'>804.66KB</span>","children":null,"spread":false},{"title":"model-freecontrol.pdf <span style='color:#111;'>1.43MB</span>","children":null,"spread":false},{"title":"MDP.pdf <span style='color:#111;'>815.74KB</span>","children":null,"spread":false},{"title":"ValueFunctionApproximation.pdf <span style='color:#111;'>1.90MB</span>","children":null,"spread":false},{"title":"intro_RL.pdf <span style='color:#111;'>2.86MB</span>","children":null,"spread":false},{"title":"classicgames.pdf <span style='color:#111;'>2.96MB</span>","children":null,"spread":false},{"title":"Easy21-Johannes.pdf <span style='color:#111;'>226.17KB</span>","children":null,"spread":false},{"title":"PolicyGradient.pdf <span style='color:#111;'>1.79MB</span>","children":null,"spread":false},{"title":"explorationandexploitation.pdf <span style='color:#111;'>1.28MB</span>","children":null,"spread":false}],"spread":false}],"spread":true}]