Skip to content

Commit 5a9f21f

Browse files
committed
update configs for ilqr linear mpc lqr and pid.
1 parent fce6d19 commit 5a9f21f

File tree

4 files changed

+53
-58
lines changed

4 files changed

+53
-58
lines changed

examples/hpo/quadrotor/config_overrides/ilqr_quadrotor_2D_attitude_hpo.yaml

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -1,9 +1,9 @@
11
hpo_config:
22

33
load_if_exists: True # this should set to True if hpo is run in parallel
4-
objective: [exponentiated_rmse] # [other metrics defined in base_experiment.py]
5-
objective_bounds: [[0.0, 1.0]] # [bounds for each objective]. Worse value will be assigned if objective evaluation is None
6-
direction: [maximize] # [minimize, maximize]
4+
objective: [exponentiated_rmse, exponentiated_rms_action_change] # [other metrics defined in base_experiment.py]
5+
objective_bounds: [[0.0, 1.0], [0.0, 1.0]] # [bounds for each objective]. Worse value will be assigned if objective evaluation is None
6+
direction: [maximize, maximize] # [minimize, maximize]
77
repetitions: 5 # number of samples of performance for each objective query
88
n_episodes: 5 # number of episodes to evaluate each policy
99
use_gpu: True
Lines changed: 18 additions & 6 deletions
Original file line numberDiff line numberDiff line change
@@ -1,9 +1,9 @@
11
hpo_config:
22

33
load_if_exists: True # this should set to True if hpo is run in parallel
4-
objective: [exponentiated_rmse] # [other metrics defined in base_experiment.py]
5-
objective_bounds: [[0.0, 1.0]] # [bounds for each objective]. Worse value will be assigned if objective evaluation is None
6-
direction: [maximize] # [minimize, maximize]
4+
objective: [exponentiated_rmse, exponentiated_rms_action_change] # [other metrics defined in base_experiment.py]
5+
objective_bounds: [[0.0, 1.0], [0.0, 1.0]] # [bounds for each objective]. Worse value will be assigned if objective evaluation is None
6+
direction: [maximize, maximize] # [minimize, maximize]
77
repetitions: 5 # number of samples of performance for each objective query
88
n_episodes: 5 # number of episodes to evaluate each policy
99
use_gpu: True
@@ -14,6 +14,18 @@ hpo_config:
1414

1515
# hyperparameters
1616
hps_config:
17-
horizon: 40
18-
q_mpc: [5.0, 0.1, 5.0, 0.1, 0.5, 0.001]
19-
r_mpc: [0.8, 0.8]
17+
horizon: 25
18+
q_mpc: [15, 0.1, 15, 0.1, 0.5, 0.01]
19+
r_mpc: [15., 5.]
20+
vizier_hps:
21+
horizon: 30
22+
q_mpc:
23+
- 14.315870549815472
24+
- 2.5426733145296656
25+
- 15.0
26+
- 0.0001
27+
- 0.0001
28+
- 0.0001
29+
r_mpc:
30+
- 15.0
31+
- 6.471762097184253

examples/hpo/quadrotor/config_overrides/lqr_quadrotor_2D_attitude_hpo.yaml

Lines changed: 7 additions & 7 deletions
Original file line numberDiff line numberDiff line change
@@ -18,15 +18,15 @@ hpo_config:
1818
r_lqr: [1.0, 1.0]
1919
vizier_hps:
2020
q_lqr:
21-
- 14.974836994854666
22-
- 1.6803329734409302
23-
- 0.02535896270931672
24-
- 0.00028863807214684776
25-
- 1.1108878724895586
21+
- 5.88529216699797
2622
- 0.0001
27-
r_lqr:
28-
- 0.0003546601186005271
23+
- 5.00397782633266
24+
- 0.8618608985543565
25+
- 0.980013664114415
2926
- 0.0001
27+
r_lqr:
28+
- 1.2497823191792372
29+
- 0.8638794170664649
3030
optuna_hps:
3131
q_lqr:
3232
- 5.0

examples/hpo/quadrotor/config_overrides/pid_quadrotor_2D_attitude_hpo.yaml

Lines changed: 25 additions & 42 deletions
Original file line numberDiff line numberDiff line change
@@ -23,51 +23,34 @@ hpo_config:
2323
d_coeff_tor: [20000., 20000., 12000.]
2424
vizier_hps:
2525
d_coeff_for:
26-
- 2.129021744940595
27-
- 0.4640573281692209
28-
- 2.542887187784077
26+
- 0.1890092870696659
27+
- 1.0541122664300269
28+
- 1.1247264394469974
2929
d_coeff_tor:
30-
- 14998.998579124276
31-
- 10019.881571806687
32-
- 10534.570451701942
30+
- 14624.865780764232
31+
- 14735.949237321409
32+
- 12928.8956036557
3333
i_coeff_for:
34-
- 0.0014889448824393103
35-
- 2.1744158095428565
36-
- 0.0029573499100777104
34+
- 0.001
35+
- 0.4045145572372126
36+
- 0.6961573899435679
3737
i_coeff_tor:
38-
- 441.54939925530545
39-
- 0.5010238470068967
40-
- 444.3856421179262
38+
- 0.0
39+
- 7.906897732216709
40+
- 524.6539429699372
4141
p_coeff_for:
42-
- 4.886838283343341
43-
- 4.608092291879853
44-
- 4.996853766830539
42+
- 0.4458780003496436
43+
- 2.118873126448762
44+
- 1.2386787893322404
4545
p_coeff_tor:
46-
- 50002.195370586196
47-
- 79982.3047902415
48-
- 50006.91012411862
46+
- 64299.26234435173
47+
- 73880.50880762804
48+
- 59700.826209375475
4949
optuna_hps:
50-
d_coeff_for:
51-
- 1.5604761716915811
52-
- 1.3593133298420035
53-
- 3.2553437457217855
54-
d_coeff_tor:
55-
- 12782.496926017255
56-
- 13315.217714132743
57-
- 13650.965688467855
58-
i_coeff_for:
59-
- 2.4249337311042356
60-
- 0.5072768704878523
61-
- 4.280513008919815
62-
i_coeff_tor:
63-
- 518.9194229378894
64-
- 298.29551117414286
65-
- 332.42926926363987
66-
p_coeff_for:
67-
- 4.553904304026884
68-
- 3.439182803233737
69-
- 4.778645189386438
70-
p_coeff_tor:
71-
- 68371.22038933045
72-
- 69727.19131379195
73-
- 68354.19711764912
50+
p_coeff_for: [.4, .4, 1.25]
51+
i_coeff_for: [.05, .05, .05]
52+
d_coeff_for: [.2, .2, .5]
53+
54+
p_coeff_tor: [70000., 70000., 60000.]
55+
i_coeff_tor: [.0, .0, 500.]
56+
d_coeff_tor: [20000., 20000., 12000.]

0 commit comments

Comments
 (0)