Filename | Size | Date |
---|
reinforcement-learning-master | 0 | 2018-06-01
|
reinforcement-learning-master\.gitattributes | 66 | 2018-06-01
|
reinforcement-learning-master\MAL | 0 | 2018-06-01
|
reinforcement-learning-master\MAL\01 MA Centralized-Q | 0 | 2018-06-01
|
reinforcement-learning-master\MAL\01 MA Centralized-Q\LFAEstimator.m | 807 | 2018-06-01
|
reinforcement-learning-master\MAL\01 MA Centralized-Q\MAEnvironment.m | 7602 | 2018-06-01
|
reinforcement-learning-master\MAL\01 MA Centralized-Q\macq.m | 3115 | 2018-06-01
|
reinforcement-learning-master\MAL\01 MA Centralized-Q\maq_iterationCount.mat | 5988 | 2018-06-01
|
reinforcement-learning-master\MAL\01 MA Centralized-Q\maq_reward.mat | 5987 | 2018-06-01
|
reinforcement-learning-master\MAL\01 MA Centralized-Q\weights.mat | 1487 | 2018-06-01
|
reinforcement-learning-master\MAL\02 MA Hysteretic-Q | 0 | 2018-06-01
|
reinforcement-learning-master\MAL\02 MA Hysteretic-Q\LFAEstimator.m | 1003 | 2018-06-01
|
reinforcement-learning-master\MAL\02 MA Hysteretic-Q\MAEnvironment.m | 7775 | 2018-06-01
|
reinforcement-learning-master\MAL\02 MA Hysteretic-Q\a1_weights.mat | 536 | 2018-06-01
|
reinforcement-learning-master\MAL\02 MA Hysteretic-Q\a2_weights.mat | 535 | 2018-06-01
|
reinforcement-learning-master\MAL\02 MA Hysteretic-Q\mahq.m | 3720 | 2018-06-01
|
reinforcement-learning-master\MAL\02 MA Hysteretic-Q\maq_iterationCount.mat | 5739 | 2018-06-01
|
reinforcement-learning-master\MAL\02 MA Hysteretic-Q\maq_reward.mat | 5760 | 2018-06-01
|
reinforcement-learning-master\MAL\03 MAPG | 0 | 2018-06-01
|
reinforcement-learning-master\MAL\03 MAPG\MAEnvironment.m | 7775 | 2018-06-01
|
reinforcement-learning-master\MAL\03 MAPG\PolicyEstimator.m | 1122 | 2018-06-01
|
reinforcement-learning-master\MAL\03 MAPG\ValueEstimator.m | 844 | 2018-06-01
|
reinforcement-learning-master\MAL\03 MAPG\agent1_policy_weights.mat | 536 | 2018-06-01
|
reinforcement-learning-master\MAL\03 MAPG\agent2_policy_weights.mat | 537 | 2018-06-01
|
reinforcement-learning-master\MAL\03 MAPG\mapg.m | 3389 | 2018-06-01
|
reinforcement-learning-master\MAL\03 MAPG\mapg_iterationCount.mat | 3556 | 2018-06-01
|
reinforcement-learning-master\MAL\03 MAPG\mapg_reward.mat | 3608 | 2018-06-01
|
reinforcement-learning-master\MAL\03 MAPG\value_weights.mat | 216 | 2018-06-01
|
reinforcement-learning-master\MAL\Basic Functions | 0 | 2018-06-01
|
reinforcement-learning-master\MAL\Basic Functions\clcAngle.m | 463 | 2018-06-01
|
reinforcement-learning-master\MAL\Basic Functions\compare_fig.m | 1759 | 2018-06-01
|
reinforcement-learning-master\MAL\Basic Functions\ds2nfu.m | 2946 | 2018-06-01
|
reinforcement-learning-master\MAL\Basic Functions\make_epsilon_policy.m | 334 | 2018-06-01
|
reinforcement-learning-master\MAL\Basic Functions\make_greedy_policy.m | 277 | 2018-06-01
|
reinforcement-learning-master\MAL\Basic Functions\make_random_policy.m | 92 | 2018-06-01
|
reinforcement-learning-master\MAL\Basic Functions\q_value_or_policy2fig.m | 3218 | 2018-06-01
|
reinforcement-learning-master\MAL\Basic Functions\sigmoid.m | 51 | 2018-06-01
|
reinforcement-learning-master\README.md | 759 | 2018-06-01
|
reinforcement-learning-master\SAL | 0 | 2018-06-01
|
reinforcement-learning-master\SAL\01 DP | 0 | 2018-06-01
|
reinforcement-learning-master\SAL\01 DP\PE.m | 522 | 2018-06-01
|
reinforcement-learning-master\SAL\01 DP\PE_V.mat | 5034 | 2018-06-01
|
reinforcement-learning-master\SAL\01 DP\PI.m | 2383 | 2018-06-01
|
reinforcement-learning-master\SAL\01 DP\PI_P.mat | 696 | 2018-06-01
|
reinforcement-learning-master\SAL\01 DP\PI_P.svg | 56294 | 2018-06-01
|
reinforcement-learning-master\SAL\01 DP\PI_V.mat | 6922 | 2018-06-01
|
reinforcement-learning-master\SAL\01 DP\PI_simulationTime.mat | 192 | 2018-06-01
|
reinforcement-learning-master\SAL\01 DP\VI.m | 2456 | 2018-06-01
|
reinforcement-learning-master\SAL\01 DP\VI_P.mat | 361 | 2018-06-01
|
reinforcement-learning-master\SAL\01 DP\VI_P.svg | 54344 | 2018-06-01
|
reinforcement-learning-master\SAL\01 DP\VI_Q.mat | 25500 | 2018-06-01
|
reinforcement-learning-master\SAL\01 DP\VI_Q.svg | 56806 | 2018-06-01
|
reinforcement-learning-master\SAL\01 DP\VI_V.mat | 4881 | 2018-06-01
|
reinforcement-learning-master\SAL\01 DP\VI_simulationTime.mat | 192 | 2018-06-01
|
reinforcement-learning-master\SAL\01 DP\Values.xlsx | 26566 | 2018-06-01
|
reinforcement-learning-master\SAL\01 DP\policy_evaluation.m | 781 | 2018-06-01
|
reinforcement-learning-master\SAL\02 MC | 0 | 2018-06-01
|
reinforcement-learning-master\SAL\02 MC\offpmc.m | 4645 | 2018-06-01
|
reinforcement-learning-master\SAL\02 MC\offpmc_c.mat | 20341 | 2018-06-01
|
reinforcement-learning-master\SAL\02 MC\offpmc_iterationCount.mat | 109202 | 2018-06-01
|
reinforcement-learning-master\SAL\02 MC\offpmc_policy.mat | 1317 | 2018-06-01
|
reinforcement-learning-master\SAL\02 MC\offpmc_q.mat | 20092 | 2018-06-01
|
reinforcement-learning-master\SAL\02 MC\offpmc_reward.mat | 1885 | 2018-06-01
|
reinforcement-learning-master\SAL\02 MC\onpmc.m | 4255 | 2018-06-01
|
reinforcement-learning-master\SAL\02 MC\onpmc_iterationCount.mat | 78957 | 2018-06-01
|
reinforcement-learning-master\SAL\02 MC\onpmc_policy.mat | 2485 | 2018-06-01
|
reinforcement-learning-master\SAL\02 MC\onpmc_q.mat | 27688 | 2018-06-01
|
reinforcement-learning-master\SAL\02 MC\onpmc_returns.mat | 36066 | 2018-06-01
|
reinforcement-learning-master\SAL\02 MC\onpmc_reward.mat | 1015 | 2018-06-01
|
reinforcement-learning-master\SAL\03 TD | 0 | 2018-06-01
|
reinforcement-learning-master\SAL\03 TD\qLearning.m | 2976 | 2018-06-01
|
reinforcement-learning-master\SAL\03 TD\qLearning_iterationCount.mat | 90583 | 2018-06-01
|
reinforcement-learning-master\SAL\03 TD\qLearning_q.mat | 27502 | 2018-06-01
|
reinforcement-learning-master\SAL\03 TD\qLearning_reward.mat | 5288 | 2018-06-01
|
reinforcement-learning-master\SAL\03 TD\sarsa.m | 3327 | 2018-06-01
|
reinforcement-learning-master\SAL\03 TD\sarsa_iterationCount.mat | 91987 | 2018-06-01
|
reinforcement-learning-master\SAL\03 TD\sarsa_q.mat | 27541 | 2018-06-01
|
reinforcement-learning-master\SAL\03 TD\sarsa_reward.mat | 1559 | 2018-06-01
|
reinforcement-learning-master\SAL\04 LFA | 0 | 2018-06-01
|
reinforcement-learning-master\SAL\04 LFA\LFAEstimator.m | 807 | 2018-06-01
|
reinforcement-learning-master\SAL\04 LFA\linear_function_approximation.m | 3454 | 2018-06-01
|
reinforcement-learning-master\SAL\04 LFA\onp_lfa_iterationCount.mat | 125625 | 2018-06-01
|
reinforcement-learning-master\SAL\04 LFA\onp_lfa_reward.mat | 1702 | 2018-06-01
|
reinforcement-learning-master\SAL\04 LFA\onp_lfa_weights.mat | 328 | 2018-06-01
|
reinforcement-learning-master\SAL\05 DQN | 0 | 2018-06-01
|
reinforcement-learning-master\SAL\05 DQN\DQN.m | 4158 | 2018-06-01
|
reinforcement-learning-master\SAL\05 DQN\DQNEstimator.m | 3079 | 2018-06-01
|
reinforcement-learning-master\SAL\05 DQN\DQN_iterationCount.mat | 23638 | 2018-06-01
|
reinforcement-learning-master\SAL\05 DQN\DQN_reward.mat | 2976 | 2018-06-01
|
reinforcement-learning-master\SAL\05 DQN\DQN_simulationTime.mat | 241 | 2018-06-01
|
reinforcement-learning-master\SAL\05 DQN\DQN_weights.mat | 844598 | 2018-06-01
|
reinforcement-learning-master\SAL\05 DQN\dqn_rwd.png | 9910 | 2018-06-01
|
reinforcement-learning-master\SAL\06 LPG | 0 | 2018-06-01
|
reinforcement-learning-master\SAL\06 LPG\PolicyEstimator.m | 1135 | 2018-06-01
|
reinforcement-learning-master\SAL\06 LPG\ValueEstimator.m | 844 | 2018-06-01
|
reinforcement-learning-master\SAL\06 LPG\pg_iterationCount.mat | 103307 | 2018-06-01
|
reinforcement-learning-master\SAL\06 LPG\pg_reward.mat | 2130 | 2018-06-01
|
reinforcement-learning-master\SAL\06 LPG\policy_gradient.m | 3366 | 2018-06-01
|
reinforcement-learning-master\SAL\06 LPG\policy_weights.mat | 330 | 2018-06-01
|
reinforcement-learning-master\SAL\06 LPG\value_weights.mat | 211 | 2018-06-01 |