Skip to content

Commit 4835f55

Browse files
author
pizarrob
committed
Adding DM3 with more noise but it also didn't work
1 parent 38c8a95 commit 4835f55

File tree

177 files changed

+2926
-6
lines changed

Some content is hidden

Large Commits have some content hidden by default. Use the searchbox below for content that may be hidden.

177 files changed

+2926
-6
lines changed

experiments/crazyflie/config_overrides/crazyflie_track.yaml

Lines changed: 4 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -28,8 +28,8 @@ task_config:
2828
inertial_prop_randomization_info:
2929
M:
3030
distrib: 'uniform'
31-
low: -0.0015
32-
high: 0.0015
31+
low: -0.0025
32+
high: 0.0025
3333
Ixx:
3434
distrib: 'uniform'
3535
low: -0.1e-5
@@ -135,7 +135,7 @@ task_config:
135135
disturbances:
136136
observation:
137137
- disturbance_func: white_noise
138-
std: 0.001
138+
std: 0.003
139139
dynamics:
140140
- disturbance_func: white_noise
141-
std: 0.1
141+
std: 0.3
Lines changed: 246 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,246 @@
1+
algo: ppo
2+
algo_config:
3+
activation: tanh
4+
actor_lr: 0.001
5+
clip_obs: 10
6+
clip_param: 0.2
7+
clip_reward: 10
8+
critic_lr: 0.001
9+
deque_size: 10
10+
entropy_coef: 0.01
11+
eval_batch_size: 10
12+
eval_interval: 10000
13+
eval_save_best: true
14+
filter_train_actions: true
15+
gae_lambda: 0.95
16+
gamma: 0.99
17+
hidden_dim: 128
18+
log_interval: 10000
19+
max_env_steps: 250000
20+
max_grad_norm: 0.5
21+
mini_batch_size: 256
22+
norm_obs: false
23+
norm_reward: false
24+
num_checkpoints: 0
25+
num_workers: 1
26+
opt_epochs: 20
27+
penalize_sf_diff: true
28+
rollout_batch_size: 1
29+
rollout_steps: 1000
30+
save_interval: 0
31+
sf_penalty: 0.1
32+
target_kl: 0.01
33+
tensorboard: false
34+
training: true
35+
use_clipped_value: false
36+
use_gae: true
37+
use_safe_reset: true
38+
device: cpu
39+
kv_overrides:
40+
- sf_config.cost_function=one_step_cost
41+
- algo_config.filter_train_actions=True
42+
- algo_config.penalize_sf_diff=True
43+
- algo_config.use_safe_reset=True
44+
- algo_config.sf_penalty=0.1
45+
- task_config.use_constraint_penalty=False
46+
output_dir: ./models/rl_models/ppo/mpsf_0.1_dm3
47+
overrides:
48+
- ./config_overrides/crazyflie_track.yaml
49+
- ./config_overrides/ppo_crazyflie.yaml
50+
- ./config_overrides/nl_mpsc.yaml
51+
restore: null
52+
safety_filter: nl_mpsc
53+
seed: null
54+
sf_config:
55+
cost_function: one_step_cost
56+
decay_factor: 0.85
57+
horizon: 10
58+
integration_algo: rk4
59+
mpsc_cost_horizon: 5
60+
n_samples: 600
61+
prior_info:
62+
prior_prop: null
63+
prior_prop_rand_info: null
64+
randomize_prior_prop: false
65+
q_lin:
66+
- 0.008
67+
- 1.85
68+
- 0.008
69+
- 1.85
70+
- 10
71+
- 10
72+
r_lin:
73+
- 2
74+
use_acados: true
75+
use_terminal_set: false
76+
warmstart: true
77+
tag: temp
78+
task: quadrotor
79+
task_config:
80+
adversary_disturbance: null
81+
adversary_disturbance_offset: 0.0
82+
adversary_disturbance_scale: 0.01
83+
camera_view:
84+
- 5
85+
- -40
86+
- -40
87+
- 0.5
88+
- -1
89+
- 0.5
90+
constraint_penalty: -1
91+
constraints:
92+
- active_dims:
93+
- 0
94+
- 1
95+
- 2
96+
- 3
97+
- 6
98+
- 7
99+
constrained_variable: state
100+
constraint_form: bounded_constraint
101+
lower_bounds:
102+
- -0.95
103+
- -2
104+
- -0.95
105+
- -2
106+
- -0.25
107+
- -0.25
108+
upper_bounds:
109+
- 0.95
110+
- 2
111+
- 0.95
112+
- 2
113+
- 0.25
114+
- 0.25
115+
- constrained_variable: input
116+
constraint_form: default_constraint
117+
cost: quadratic
118+
ctrl_freq: 500
119+
disturbances:
120+
dynamics:
121+
- disturbance_func: white_noise
122+
std: 0.3
123+
observation:
124+
- disturbance_func: white_noise
125+
std: 0.003
126+
done_on_out_of_bound: true
127+
done_on_violation: false
128+
episode_len_sec: 15
129+
gui: false
130+
inertial_prop:
131+
Ixx: 1.4e-05
132+
Iyy: 1.4e-05
133+
Izz: 2.17e-05
134+
M: 0.0345
135+
inertial_prop_randomization_info:
136+
Ixx:
137+
distrib: uniform
138+
high: 1.0e-06
139+
low: -1.0e-06
140+
Iyy:
141+
distrib: uniform
142+
high: 1.0e-06
143+
low: -1.0e-06
144+
Izz:
145+
distrib: uniform
146+
high: 1.0e-06
147+
low: -1.0e-06
148+
M:
149+
distrib: uniform
150+
high: 0.0025
151+
low: -0.0025
152+
info_in_reset: true
153+
init_state:
154+
init_p: 0
155+
init_phi: 0
156+
init_psi: 0
157+
init_q: 0
158+
init_r: 0
159+
init_theta: 0
160+
init_x: 0
161+
init_x_dot: 0
162+
init_y: 0
163+
init_y_dot: 0
164+
init_z: 1
165+
init_z_dot: 0
166+
init_state_randomization_info:
167+
init_p:
168+
distrib: uniform
169+
high: 0.5
170+
low: -0.5
171+
init_phi:
172+
distrib: uniform
173+
high: 0.25
174+
low: -0.25
175+
init_psi:
176+
distrib: uniform
177+
high: 0
178+
low: 0
179+
init_q:
180+
distrib: uniform
181+
high: 0.5
182+
low: -0.5
183+
init_r:
184+
distrib: uniform
185+
high: 0
186+
low: 0
187+
init_theta:
188+
distrib: uniform
189+
high: 0.25
190+
low: -0.25
191+
init_x:
192+
distrib: uniform
193+
high: 0.95
194+
low: -0.95
195+
init_x_dot:
196+
distrib: uniform
197+
high: 2
198+
low: -2
199+
init_y:
200+
distrib: uniform
201+
high: 0.95
202+
low: -0.95
203+
init_y_dot:
204+
distrib: uniform
205+
high: 2
206+
low: -2
207+
init_z:
208+
distrib: uniform
209+
high: 1
210+
low: 1
211+
init_z_dot:
212+
distrib: uniform
213+
high: 0
214+
low: 0
215+
norm_act_scale: 0.1
216+
normalized_rl_action_space: false
217+
obs_goal_horizon: 0
218+
physics: pyb
219+
pyb_freq: 1000
220+
quad_type: 3
221+
randomized_inertial_prop: true
222+
randomized_init: false
223+
rew_act_weight: 0.0001
224+
rew_exponential: true
225+
rew_state_weight: 1.0
226+
seed: 1337
227+
task: traj_tracking
228+
task_info:
229+
num_cycles: 1
230+
proj_normal:
231+
- 0
232+
- 1
233+
- 1
234+
proj_point:
235+
- 0
236+
- 0
237+
- 0.5
238+
trajectory_plane: xz
239+
trajectory_position_offset:
240+
- 0
241+
- 1
242+
trajectory_scale: 1
243+
trajectory_type: figure8
244+
use_constraint_penalty: false
245+
verbose: false
246+
use_gpu: false
Lines changed: 26 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,26 @@
1+
step,loss/approx_kl
2+
10000,0.014540497004054487
3+
20000,0.012409154457661012
4+
30000,0.011346515376741688
5+
40000,0.035299180285073825
6+
50000,0.021245106402784583
7+
60000,0.011667467308385918
8+
70000,0.006656894968667377
9+
80000,0.014440136899550756
10+
90000,0.023396018807155396
11+
100000,0.014779321589351944
12+
110000,0.023984983928191164
13+
120000,0.020489891265363745
14+
130000,0.01915428274078295
15+
140000,0.01767941640767579
16+
150000,0.015961797760489088
17+
160000,0.025441439830077194
18+
170000,0.011703287883816907
19+
180000,0.017753030012439316
20+
190000,0.017511220268594724
21+
200000,0.017385097426207117
22+
210000,0.021932779786099373
23+
220000,0.01595768651653392
24+
230000,0.023145760580276453
25+
240000,0.011205980827799066
26+
250000,0.018960489249244955
Lines changed: 26 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,26 @@
1+
step,loss/entropy_loss
2+
10000,-1.8106971601645152
3+
20000,-1.8322240412235256
4+
30000,-1.8304906249046329
5+
40000,-1.8484702567259472
6+
50000,-1.733134748538335
7+
60000,-1.7376533726851147
8+
70000,-1.6336932837963105
9+
80000,-1.59782941142718
10+
90000,-1.5392753720283507
11+
100000,-1.4729125042756397
12+
110000,-1.4312396665414173
13+
120000,-1.3802246312300364
14+
130000,-1.3919271488984426
15+
140000,-1.3630793670813244
16+
150000,-1.247284871339798
17+
160000,-1.2033760945002239
18+
170000,-1.1260549108187359
19+
180000,-1.1539814134438833
20+
190000,-1.0648897012074787
21+
200000,-1.0050092359383902
22+
210000,-0.9445812960465749
23+
220000,-0.8714521269003551
24+
230000,-0.8680322647094727
25+
240000,-0.7861478596925735
26+
250000,-0.8180636356274288
Lines changed: 26 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,26 @@
1+
step,loss/policy_loss
2+
10000,-0.005690815966606119
3+
20000,-0.01259742840586284
4+
30000,-0.009443554758569069
5+
40000,-0.007235572013100111
6+
50000,-0.015047529632433337
7+
60000,-0.017006347467995946
8+
70000,-0.002489459361173485
9+
80000,-0.012903842581236991
10+
90000,-0.003840118485633351
11+
100000,-0.007168129051580952
12+
110000,-0.0014811347991109526
13+
120000,-0.003636718594477153
14+
130000,-0.01774967541777613
15+
140000,-0.00125425776132927
16+
150000,-0.01088452067844718
17+
160000,-0.0027276332932849325
18+
170000,-0.013703564653057743
19+
180000,-0.009056110161266208
20+
190000,-0.010057948827489347
21+
200000,-0.010866868573943506
22+
210000,-0.00702074262882479
23+
220000,-0.007562065251478287
24+
230000,-0.00805554889624997
25+
240000,-0.014234422214343716
26+
250000,-0.011923532010163712
Lines changed: 26 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,26 @@
1+
step,loss/value_loss
2+
10000,13.269518279808343
3+
20000,13.763680027678394
4+
30000,8.96380062877704
5+
40000,14.288173564770474
6+
50000,10.736329231750975
7+
60000,12.9411191784862
8+
70000,23.509398347812912
9+
80000,24.774437726823308
10+
90000,23.809120391281493
11+
100000,12.89694149895158
12+
110000,42.12703010948331
13+
120000,27.93424511378899
14+
130000,42.34400811920298
15+
140000,24.363797277094278
16+
150000,18.025186236420705
17+
160000,13.754035599705697
18+
170000,11.474913011699913
19+
180000,46.118299395552796
20+
190000,36.187337796267904
21+
200000,5.288323052674792
22+
210000,37.57964238106247
23+
220000,6.2835994539467315
24+
230000,27.778048256723473
25+
240000,7.67200679565516
26+
250000,34.50073091352491

0 commit comments

Comments
 (0)