[{"title":"( 19 个子文件 12.16MB ) 强化学习PPT(赵世钰)","children":[{"title":"强化学习","children":[{"title":"L9_Policy gradient methods_With animation.pdf <span style='color:#111;'> 574.09KB </span>","children":null,"spread":false},{"title":"L1-Basic concepts-With animation.pdf <span style='color:#111;'> 660.75KB </span>","children":null,"spread":false},{"title":"L3-Bellman optimality equation.pdf <span style='color:#111;'> 548.79KB </span>","children":null,"spread":false},{"title":"L10-Actor Critic-With animation.pdf <span style='color:#111;'> 868.97KB </span>","children":null,"spread":false},{"title":"L6-Stochastic approximation.pdf <span style='color:#111;'> 861.99KB </span>","children":null,"spread":false},{"title":"L3-Bellman optimality equation-With animation.pdf <span style='color:#111;'> 624.35KB </span>","children":null,"spread":false},{"title":"L7-Temporal-Difference Learning.pdf <span style='color:#111;'> 749.57KB </span>","children":null,"spread":false},{"title":"L5-Monte Carlo methods.pdf <span style='color:#111;'> 856.16KB </span>","children":null,"spread":false},{"title":"L4-Value iteration and policy iteration.pdf <span style='color:#111;'> 573.70KB </span>","children":null,"spread":false},{"title":"L6-Stochastic approximation-With animation.pdf <span style='color:#111;'> 1.00MB </span>","children":null,"spread":false},{"title":"L2-Bellman equation.pdf <span style='color:#111;'> 611.87KB </span>","children":null,"spread":false},{"title":"L10-Actor Critic.pdf <span style='color:#111;'> 718.05KB </span>","children":null,"spread":false},{"title":"L8-Value function approximation.pdf <span style='color:#111;'> 1.18MB </span>","children":null,"spread":false},{"title":"L8-Value function approximation-With animation.pdf <span style='color:#111;'> 1.47MB </span>","children":null,"spread":false},{"title":"L1-Basic concepts.pdf <span style='color:#111;'> 570.75KB </span>","children":null,"spread":false},{"title":"L4-Value iteration and policy iteration-With animation.pdf <span style='color:#111;'> 677.63KB </span>","children":null,"spread":false},{"title":"L9_Policy gradient methods.pdf <span style='color:#111;'> 473.73KB </span>","children":null,"spread":false},{"title":"L5-Monte Carlo methods-With animation.pdf <span style='color:#111;'> 974.70KB </span>","children":null,"spread":false},{"title":"L7-Temporal-Difference Learning-With animation.pdf <span style='color:#111;'> 944.78KB </span>","children":null,"spread":false}],"spread":false}],"spread":true}]