Skip to content

Commit

Permalink
Adding updated results with stricter constraints
Browse files Browse the repository at this point in the history
  • Loading branch information
pizarrob committed Nov 7, 2023
1 parent 21e3d86 commit c050e7f
Show file tree
Hide file tree
Showing 722 changed files with 54,172 additions and 54,169 deletions.
Original file line number Diff line number Diff line change
Expand Up @@ -8,7 +8,7 @@ algo_config:
critic_lr: 0.001
deque_size: 10
entropy_coef: 0.01
eval_batch_size: 10
eval_batch_size: 25
eval_interval: 10000
eval_save_best: true
filter_train_actions: true
Expand Down Expand Up @@ -69,20 +69,20 @@ sf_config:
prior_prop_rand_info: null
randomize_prior_prop: false
q_lin:
- 0.001
- 0.06
- 0.001
- 0.06
- 0.00025
- 80
- 0.1
- 0.006
- 3.0
- 1.0e-05
- 8.0
- 1.0e-05
- 0.75
- 1
- 1
- 1
- 1.0e-08
- 1.0e-08
- 0.01
- 0.5
- 0.5
- 0.5
r_lin:
- 90
- 10000
slack_cost: 250
soften_constraints: true
use_acados: true
Expand All @@ -99,31 +99,31 @@ task_config:
- constrained_variable: state
constraint_form: default_constraint
lower_bounds:
- -0.95
- -2
- -0.475
- -2
- 0.525
- -2
- -0.5
- -0.5
- -0.5
- -2
- -2
- -1
- -2
- -1
- 0
- -1
- -0.2
- -0.2
- -0.2
- -1
- -1
- -1
upper_bounds:
- 0.95
- 2
- 0
- 2
- 0.95
- 2
- 0.5
- 0.5
- 0.5
- 2
- 1
- 2
- 1
- 2
- 1
- 0.2
- 0.2
- 0.2
- 1
- 1
- 1
- constrained_variable: input
constraint_form: default_constraint
lower_bounds:
Expand Down Expand Up @@ -167,52 +167,52 @@ task_config:
init_state_randomization_info:
init_p:
distrib: uniform
high: 1
low: -1
high: 2
low: -2
init_phi:
distrib: uniform
high: 0.2
low: -0.2
high: 0.5
low: -0.5
init_psi:
distrib: uniform
high: 0.2
low: -0.2
high: 0.5
low: -0.5
init_q:
distrib: uniform
high: 1
low: -1
high: 2
low: -2
init_r:
distrib: uniform
high: 1
low: -1
high: 2
low: -2
init_theta:
distrib: uniform
high: 0.2
low: -0.2
high: 0.5
low: -0.5
init_x:
distrib: uniform
high: 2
low: -2
high: 0.95
low: -0.95
init_x_dot:
distrib: uniform
high: 1
low: -1
init_y:
distrib: uniform
high: 2
low: -2
init_y:
distrib: uniform
high: 0
low: -0.475
init_y_dot:
distrib: uniform
high: 1
low: -1
high: 2
low: -2
init_z:
distrib: uniform
high: 2
low: 0.3
high: 0.95
low: 0.525
init_z_dot:
distrib: uniform
high: 1
low: -1
high: 2
low: -2
norm_act_scale: 0.1
normalized_rl_action_space: true
obs_goal_horizon: 1
Expand Down
Original file line number Diff line number Diff line change
@@ -1,101 +1,101 @@
step,loss/approx_kl
10000,0.018229736884435018
20000,0.02127453736805668
30000,0.02370014371505628
40000,0.02065292401239276
50000,0.025316688713307185
60000,0.01826790439275404
70000,0.025006062878916657
80000,0.018720928160473705
90000,0.019625773886218664
100000,0.013361939182505009
110000,0.03154762430737416
120000,0.031806574435904615
130000,0.02165382777651151
140000,0.015200028227021298
150000,0.020803385553881525
160000,0.014369704714044928
170000,0.02885335066045324
180000,0.020664520297820364
190000,0.02774980144264797
200000,0.014654031302779914
210000,0.028576524602249263
220000,0.03024926499153177
230000,0.02645964035764336
240000,0.04079947238788009
250000,0.017594279488548636
260000,0.032765278577183685
270000,0.029457671707496042
280000,0.015534943140422305
290000,0.030238619043181342
300000,0.030985550116747612
310000,0.033439734640220806
320000,0.010407944504792491
330000,0.035565994260832665
340000,0.01913086099860569
350000,0.018777612193177147
360000,0.02521338181880613
370000,0.026439335926746334
380000,0.022027451839918895
390000,0.028303294302895667
400000,0.017139489576220517
410000,0.04025533202414711
420000,0.031722171915074183
430000,0.014261707291007042
440000,0.02689499178280433
450000,0.02678934750147164
460000,0.03554095750053724
470000,0.026956252986565225
480000,0.02715459933194021
490000,0.029161349792654313
500000,0.020614128513261675
510000,0.03876745159116884
520000,0.0294973047139744
530000,0.02062256399852534
540000,0.02528983733306328
550000,0.019311279663816096
560000,0.025200433749705552
570000,0.029168432097261155
580000,0.025244836416095495
590000,0.018281504170348246
600000,0.025952478436132277
610000,0.027890596538782113
620000,0.026617188627521198
630000,0.026978990544254584
640000,0.023182477817560238
650000,0.026558673909554888
660000,0.026973483727003138
670000,0.038929785757015146
680000,0.03427885382746656
690000,0.02805567579343915
700000,0.030999637239923078
710000,0.021579861144224805
720000,0.02489494209488233
730000,0.02404243256896734
740000,0.022397541472067434
750000,0.024323036956290397
760000,0.019284146217008434
770000,0.014312991220504043
780000,0.026891583390533918
790000,0.024835351140548783
800000,0.024412206746637823
810000,0.021250387715796633
820000,0.025366627704352142
830000,0.02246172120794654
840000,0.026730975322425365
850000,0.03421310999741157
860000,0.01983120329678059
870000,0.015500476863235236
880000,0.013675535159806412
890000,0.026640326157212256
900000,0.028744155572106446
910000,0.025880434301992255
920000,0.02237929714222749
930000,0.03249762508397301
940000,0.024294908437877894
950000,0.026201037224382162
960000,0.013028102368116379
970000,0.032526198371003075
980000,0.01626911209896207
990000,0.023152368733038504
1000000,0.023702411105235414
10000,0.017213520842293897
20000,0.02764010163179288
30000,0.01743585287282864
40000,0.017944027467941246
50000,0.018553049815818668
60000,0.023324231663718824
70000,0.024198097828775644
80000,0.013849695399403571
90000,0.020018802893658476
100000,0.020879797528808315
110000,0.020450342632830146
120000,0.034239981804663935
130000,0.026658428382749354
140000,0.022649019258096814
150000,0.022941715223714708
160000,0.007890155275041858
170000,0.014145796125133833
180000,0.021201497875154015
190000,0.01608441020362079
200000,0.020309033151715995
210000,0.03166960822418333
220000,0.02117745455664893
230000,0.026413527317345142
240000,0.02563850761701663
250000,0.030556447710841893
260000,0.02503080541888873
270000,0.015589506893108288
280000,0.022843319425980255
290000,0.02117375050050517
300000,0.0253074764739722
310000,0.015984897377590335
320000,0.028337029942000908
330000,0.01633354507697125
340000,0.03463563905097544
350000,0.024914210988208653
360000,0.019485377830763657
370000,0.020445223230247694
380000,0.014343827916309237
390000,0.0241228209498028
400000,0.02197242130835851
410000,0.024426490704839425
420000,0.012739477089295787
430000,0.025227935565635563
440000,0.02386964901039998
450000,0.029704142517099776
460000,0.02316980489219228
470000,0.018668918684124947
480000,0.01797391955430309
490000,0.017083619410792988
500000,0.021401571932559208
510000,0.016890498654296003
520000,0.019246815827985604
530000,0.025200538026789825
540000,0.009884566161781547
550000,0.018769014471520983
560000,0.0193116427709659
570000,0.03082204340025783
580000,0.03612479014943043
590000,0.024618654077251754
600000,0.026440184066692983
610000,0.013226955570280552
620000,0.016506727163990337
630000,0.029131261756022764
640000,0.03199023871372143
650000,0.03162956436475117
660000,0.025987505105634533
670000,0.03066992412010829
680000,0.03358819276715318
690000,0.018738419531534115
700000,0.02501208819448948
710000,0.033234185290833315
720000,0.02395644110317032
730000,0.021680068410933014
740000,0.02534624853481849
750000,0.022559438801060122
760000,0.02713867419709761
770000,0.01857999600470066
780000,0.026966472839315726
790000,0.01576397685954968
800000,0.015534047378847995
810000,0.02498807981610298
820000,0.02157363562534253
830000,0.02366078707079093
840000,0.033624009167154634
850000,0.02301981703688701
860000,0.023170643423994382
870000,0.03527537065868576
880000,0.024989187065511943
890000,0.02142417756840587
900000,0.023315265898903214
910000,0.026628257675717276
920000,0.01719271431987484
930000,0.025014398898929358
940000,0.03365887276207407
950000,0.019868735255052648
960000,0.025951597404976684
970000,0.02967567397281527
980000,0.04032600869735082
990000,0.008862463602175314
1000000,0.02233600672334433
Loading

0 comments on commit c050e7f

Please sign in to comment.