|
826 | 826 | ] |
827 | 827 | } |
828 | 828 | }, |
| 829 | + "pendulum_ddpg_nonoise": { |
| 830 | + "problem": "Pendulum-v0", |
| 831 | + "Agent": "DDPG", |
| 832 | + "HyperOptimizer": "GridSearch", |
| 833 | + "Memory": "LinearMemoryWithForgetting", |
| 834 | + "Optimizer": "AdamOptimizer", |
| 835 | + "Policy": "NoNoisePolicy", |
| 836 | + "PreProcessor": "NoPreProcessor", |
| 837 | + "param": { |
| 838 | + "batch_size": 64, |
| 839 | + "n_epoch": 1, |
| 840 | + "tau": 0.005, |
| 841 | + "lr": 0.001, |
| 842 | + "critic_lr": 0.001, |
| 843 | + "exploration_anneal_episodes": 50, |
| 844 | + "gamma": 0.97, |
| 845 | + "hidden_layers": [400, 300], |
| 846 | + "hidden_layers_activation": "relu", |
| 847 | + "output_layer_activation": "tanh" |
| 848 | + }, |
| 849 | + "param_range": { |
| 850 | + "lr": [0.0001, 0.0005, 0.001], |
| 851 | + "critic_lr": [0.001, 0.005], |
| 852 | + "gamma": [0.95, 0.97, 0.99], |
| 853 | + "hidden_layers": [ |
| 854 | + [400, 300], |
| 855 | + [800, 400, 200], |
| 856 | + [800, 600, 400, 200] |
| 857 | + ] |
| 858 | + } |
| 859 | + }, |
| 860 | + "pendulum_ddpg_per": { |
| 861 | + "problem": "Pendulum-v0", |
| 862 | + "Agent": "DDPG", |
| 863 | + "HyperOptimizer": "GridSearch", |
| 864 | + "Memory": "PrioritizedExperienceReplay", |
| 865 | + "Optimizer": "AdamOptimizer", |
| 866 | + "Policy": "NoNoisePolicy", |
| 867 | + "PreProcessor": "NoPreProcessor", |
| 868 | + "param": { |
| 869 | + "batch_size": 64, |
| 870 | + "n_epoch": 1, |
| 871 | + "tau": 0.001, |
| 872 | + "lr": 0.001, |
| 873 | + "critic_lr": 0.001, |
| 874 | + "exploration_anneal_episodes": 50, |
| 875 | + "gamma": 0.97, |
| 876 | + "hidden_layers": [400, 300], |
| 877 | + "hidden_layers_activation": "relu", |
| 878 | + "output_layer_activation": "tanh", |
| 879 | + "max_mem_len": 30000 |
| 880 | + }, |
| 881 | + "param_range": { |
| 882 | + "lr": [0.0001, 0.0005, 0.001], |
| 883 | + "critic_lr": [0.001, 0.005], |
| 884 | + "gamma": [0.95, 0.97, 0.99], |
| 885 | + "hidden_layers": [ |
| 886 | + [400, 300], |
| 887 | + [800, 400, 200], |
| 888 | + [800, 600, 400, 200] |
| 889 | + ] |
| 890 | + } |
| 891 | + }, |
| 892 | + "pendulum_ddpg_per_linearnoise": { |
| 893 | + "problem": "Pendulum-v0", |
| 894 | + "Agent": "DDPG", |
| 895 | + "HyperOptimizer": "GridSearch", |
| 896 | + "Memory": "PrioritizedExperienceReplay", |
| 897 | + "Optimizer": "AdamOptimizer", |
| 898 | + "Policy": "LinearNoisePolicy", |
| 899 | + "PreProcessor": "NoPreProcessor", |
| 900 | + "param": { |
| 901 | + "batch_size": 64, |
| 902 | + "n_epoch": 1, |
| 903 | + "tau": 0.005, |
| 904 | + "lr": 0.001, |
| 905 | + "critic_lr": 0.001, |
| 906 | + "exploration_anneal_episodes": 100, |
| 907 | + "gamma": 0.97, |
| 908 | + "hidden_layers": [400, 300], |
| 909 | + "hidden_layers_activation": "relu", |
| 910 | + "output_layer_activation": "tanh", |
| 911 | + "max_mem_len": 30000 |
| 912 | + }, |
| 913 | + "param_range": { |
| 914 | + "lr": [0.0001, 0.0005], |
| 915 | + "critic_lr": [0.001, 0.005], |
| 916 | + "gamma": [0.95, 0.97, 0.99], |
| 917 | + "hidden_layers": [ |
| 918 | + [200, 100], |
| 919 | + [400, 200], |
| 920 | + [400, 300], |
| 921 | + [800, 400] |
| 922 | + ] |
| 923 | + } |
| 924 | + }, |
| 925 | + "pendulum_ddpg_linearnoise": { |
| 926 | + "problem": "Pendulum-v0", |
| 927 | + "Agent": "DDPG", |
| 928 | + "HyperOptimizer": "GridSearch", |
| 929 | + "Memory": "LinearMemoryWithForgetting", |
| 930 | + "Optimizer": "AdamOptimizer", |
| 931 | + "Policy": "LinearNoisePolicy", |
| 932 | + "PreProcessor": "NoPreProcessor", |
| 933 | + "param": { |
| 934 | + "batch_size": 64, |
| 935 | + "n_epoch": 1, |
| 936 | + "tau": 0.005, |
| 937 | + "lr": 0.0001, |
| 938 | + "critic_lr": 0.005, |
| 939 | + "exploration_anneal_episodes": 50, |
| 940 | + "gamma": 0.97, |
| 941 | + "hidden_layers": [400, 300], |
| 942 | + "hidden_layers_activation": "relu", |
| 943 | + "output_layer_activation": "tanh" |
| 944 | + }, |
| 945 | + "param_range": { |
| 946 | + "lr": [0.0001, 0.0005, 0.001], |
| 947 | + "critic_lr": [0.001, 0.005], |
| 948 | + "gamma": [0.95, 0.97, 0.99], |
| 949 | + "hidden_layers": [ |
| 950 | + [400, 300], |
| 951 | + [800, 400, 200], |
| 952 | + [800, 600, 400, 200] |
| 953 | + ] |
| 954 | + } |
| 955 | + }, |
| 956 | + "pendulum_ddpg_ounoise": { |
| 957 | + "problem": "Pendulum-v0", |
| 958 | + "Agent": "DDPG", |
| 959 | + "HyperOptimizer": "GridSearch", |
| 960 | + "Memory": "LinearMemoryWithForgetting", |
| 961 | + "Optimizer": "AdamOptimizer", |
| 962 | + "Policy": "OUNoisePolicy", |
| 963 | + "PreProcessor": "NoPreProcessor", |
| 964 | + "param": { |
| 965 | + "batch_size": 64, |
| 966 | + "n_epoch": 1, |
| 967 | + "tau": 0.005, |
| 968 | + "lr": 0.001, |
| 969 | + "critic_lr": 0.001, |
| 970 | + "exploration_anneal_episodes": 50, |
| 971 | + "gamma": 0.97, |
| 972 | + "hidden_layers": [400, 300], |
| 973 | + "hidden_layers_activation": "relu", |
| 974 | + "output_layer_activation": "tanh" |
| 975 | + }, |
| 976 | + "param_range": { |
| 977 | + "lr": [0.0001, 0.0005, 0.001], |
| 978 | + "critic_lr": [0.001, 0.005], |
| 979 | + "gamma": [0.95, 0.97, 0.99], |
| 980 | + "hidden_layers": [ |
| 981 | + [400, 300], |
| 982 | + [800, 400, 200], |
| 983 | + [800, 600, 400, 200] |
| 984 | + ] |
| 985 | + } |
| 986 | + }, |
| 987 | + "pendulum_ddpg_gaussiannoise": { |
| 988 | + "problem": "Pendulum-v0", |
| 989 | + "Agent": "DDPG", |
| 990 | + "HyperOptimizer": "GridSearch", |
| 991 | + "Memory": "LinearMemoryWithForgetting", |
| 992 | + "Optimizer": "AdamOptimizer", |
| 993 | + "Policy": "GaussianWhiteNoisePolicy", |
| 994 | + "PreProcessor": "NoPreProcessor", |
| 995 | + "param": { |
| 996 | + "batch_size": 64, |
| 997 | + "n_epoch": 1, |
| 998 | + "tau": 0.005, |
| 999 | + "lr": 0.001, |
| 1000 | + "critic_lr": 0.001, |
| 1001 | + "exploration_anneal_episodes": 50, |
| 1002 | + "gamma": 0.97, |
| 1003 | + "hidden_layers": [400, 300], |
| 1004 | + "hidden_layers_activation": "relu", |
| 1005 | + "output_layer_activation": "tanh" |
| 1006 | + }, |
| 1007 | + "param_range": { |
| 1008 | + "lr": [0.0001, 0.0005, 0.001], |
| 1009 | + "critic_lr": [0.001, 0.005], |
| 1010 | + "gamma": [0.95, 0.97, 0.99], |
| 1011 | + "hidden_layers": [ |
| 1012 | + [400, 300], |
| 1013 | + [800, 400, 200], |
| 1014 | + [800, 600, 400, 200] |
| 1015 | + ] |
| 1016 | + } |
| 1017 | + }, |
829 | 1018 | "mountain_dqn": { |
830 | 1019 | "problem": "MountainCar-v0", |
831 | 1020 | "Agent": "DQN", |
|
880 | 1069 | ] |
881 | 1070 | } |
882 | 1071 | }, |
883 | | - "mountain_double_dqn_per": { |
| 1072 | + "mountain_dqn_per": { |
884 | 1073 | "problem": "MountainCar-v0", |
885 | | - "Agent": "DoubleDQN", |
| 1074 | + "Agent": "DQN", |
886 | 1075 | "HyperOptimizer": "GridSearch", |
887 | 1076 | "Memory": "PrioritizedExperienceReplay", |
888 | 1077 | "Optimizer": "AdamOptimizer", |
889 | | - "Policy": "DoubleDQNBoltzmannPolicy", |
| 1078 | + "Policy": "BoltzmannPolicy", |
890 | 1079 | "PreProcessor": "NoPreProcessor", |
891 | 1080 | "param": { |
892 | 1081 | "batch_size": 32, |
|
895 | 1084 | "hidden_layers": [128, 64], |
896 | 1085 | "hidden_layers_activation": "sigmoid", |
897 | 1086 | "output_layer_activation": "linear", |
898 | | - "exploration_anneal_episodes": 200, |
899 | | - "epi_change_lr": 500, |
900 | | - "max_mem_len": 20000 |
| 1087 | + "exploration_anneal_episodes": 50, |
| 1088 | + "epi_change_lr": 150, |
| 1089 | + "max_mem_len": 30000 |
901 | 1090 | }, |
902 | 1091 | "param_range": { |
903 | | - "lr": [0.01, 0.02, 0.03, 0.05], |
| 1092 | + "lr": [0.005, 0.01, 0.02, 0.05], |
904 | 1093 | "gamma": [0.99, 0.999], |
905 | 1094 | "hidden_layers": [ |
906 | 1095 | [400], |
907 | | - [800], |
908 | | - [400, 200] |
| 1096 | + [800] |
909 | 1097 | ] |
910 | 1098 | } |
911 | 1099 | }, |
|
951 | 1139 | "hidden_layers_activation": "sigmoid" |
952 | 1140 | }, |
953 | 1141 | "param_range": { |
954 | | - "lr": [0.005, 0.01, 0.05, 0.1], |
| 1142 | + "lr": [0.001, 0.005, 0.01], |
955 | 1143 | "gamma": [0.97, 0.99, 0.999], |
956 | 1144 | "hidden_layers": [ |
957 | 1145 | [200], |
958 | | - [400, 200], |
959 | | - [400, 200, 100] |
| 1146 | + [400] |
960 | 1147 | ] |
961 | 1148 | } |
962 | 1149 | } |
|
0 commit comments