Federico-PizarroBejarano
diff --git a/‎experiments/crazyflie/config_overrides/crazyflie_stab.yaml‎ renamed to ‎experiments/crazyflie/config_overrides/crazyflie_track.yaml‎
Lines changed: 12 additions & 7 deletions b/‎experiments/crazyflie/config_overrides/crazyflie_stab.yaml‎ renamed to ‎experiments/crazyflie/config_overrides/crazyflie_track.yaml‎
Lines changed: 12 additions & 7 deletions
diff --git a/‎experiments/crazyflie/config_overrides/nl_mpsc.yaml‎
Lines changed: 6 additions & 14 deletions b/‎experiments/crazyflie/config_overrides/nl_mpsc.yaml‎
Lines changed: 6 additions & 14 deletions
diff --git a/‎experiments/crazyflie/crazyflie_experiment.py‎
Lines changed: 112 additions & 52 deletions b/‎experiments/crazyflie/crazyflie_experiment.py‎
Lines changed: 112 additions & 52 deletions
diff --git a/‎experiments/crazyflie/crazyflie_utils.py‎
Lines changed: 20 additions & 1 deletion b/‎experiments/crazyflie/crazyflie_utils.py‎
Lines changed: 20 additions & 1 deletion
diff --git a/‎experiments/crazyflie/models/mpsc_parameters/linear_mpsc_crazyflie_stab.pkl‎
-188 Bytes b/‎experiments/crazyflie/models/mpsc_parameters/linear_mpsc_crazyflie_stab.pkl‎
-188 Bytes
diff --git a/‎experiments/crazyflie/models/mpsc_parameters/nl_mpsc_crazyflie_stab.pkl‎
-1.33 KB b/‎experiments/crazyflie/models/mpsc_parameters/nl_mpsc_crazyflie_stab.pkl‎
-1.33 KB
diff --git a/‎experiments/crazyflie/models/mpsc_parameters/nl_mpsc_crazyflie_track.pkl‎
1.22 KB b/‎experiments/crazyflie/models/mpsc_parameters/nl_mpsc_crazyflie_track.pkl‎
1.22 KB
diff --git a/‎experiments/crazyflie/models/mpsc_parameters/nl_mpsc_quadrotor_3D_stab.pkl‎
-4.97 KB b/‎experiments/crazyflie/models/mpsc_parameters/nl_mpsc_quadrotor_3D_stab.pkl‎
-4.97 KB
diff --git a/‎experiments/crazyflie/models/traj_data/errors.npy‎
313 KB b/‎experiments/crazyflie/models/traj_data/errors.npy‎
313 KB
diff --git a/‎experiments/crazyflie/models/traj_data/matlab_data.mat‎
1.07 MB b/‎experiments/crazyflie/models/traj_data/matlab_data.mat‎
1.07 MB
@@ -26,10 +26,15 @@ task_config:
   randomized_init: False
   randomized_inertial_prop: False
 
-  task: stabilization
+  task: traj_tracking
   task_info:
-    stabilization_goal: [0.5, -0.5, 2]
-    stabilization_goal_tolerance: 0.0
+    trajectory_type: figure8
+    num_cycles: 1
+    trajectory_plane: 'xz'
+    trajectory_position_offset: [0, 1]
+    trajectory_scale: 1
+    proj_point: [0, 0, 0.5]
+    proj_normal: [0, 1, 1]
 
   inertial_prop:
     M: 0.03775
@@ -43,8 +48,8 @@ task_config:
       upper_bounds:
         - 0.75
         - 0.5
-        - 1
-        - 1
+        - 0.75
+        - 0.5
         - 2
         - 1
         - 0.2
@@ -56,8 +61,8 @@ task_config:
       lower_bounds:
         - -0.75
         - -0.5
-        - -1
-        - -1
+        - -0.75
+        - -0.5
         - 0
         - -1
         - -0.2
 
@@ -2,26 +2,18 @@ safety_filter: nl_mpsc
 sf_config:
   # LQR controller parameters
   r_lin:
-    - 90
+    - 2
   q_lin:
-    - 0.001
-    - 0.06
-    - 0.001
-    - 0.06
-    - 0.00025
-    - 80
-    - 0.00001
-    - 0.00001
-    - 0.75
-    - 1
-    - 1
-    - 1
+    - 0.008
+    - 1.85
+    - 0.008
+    - 1.85
 
   # MPC Parameters
   horizon: 10
   warmstart: True
   integration_algo: rk4
-  use_terminal_set: True
+  use_terminal_set: False
 
   # Prior info
   prior_info:
 
@@ -10,7 +10,7 @@
 import numpy as np
 from scipy.io import savemat
 
-from experiments.crazyflie.crazyflie_utils import gen_traj
+from experiments.crazyflie.crazyflie_utils import gen_traj, gen_input_traj
 from safe_control_gym.envs.benchmark_env import Task
 from safe_control_gym.safety_filters.mpsc.mpsc_utils import Cost_Function, get_discrete_derivative
 from safe_control_gym.utils.configuration import ConfigFactory
@@ -27,12 +27,18 @@
     print('Module \'cffirmware\' available:', FIRMWARE_INSTALLED)
 
 
-A = np.array([[0.9987, 0.02872],
-              [0.006117, 0.8535]])
-B = np.array([[0.02309, 0.2854]]).T
+A = np.array([[ 1,           0.03659,   7.598e-07, -0.006083],
+              [-5.858e-06,   0.7886,    5.132e-06,  0.03174],
+              [ 3.259e-06,   0.0009138, 1,          0.03899],
+              [-1.735e-05,  -0.006111, -9.836e-06,  0.7786]])
 
+B = np.array([[ 0.003886,  0.01169],
+              [ 0.4229,   -0.06055],
+              [-0.001915, -0.0006503],
+              [ 0.01223,   0.4419]])
 
-def run(gui=False, plot=True, training=False, certify=False, traj='sine', curr_path='.'):
+
+def run(gui=False, plot=True, training=False, certify=True, curr_path='.'):
     '''The main function creating, running, and closing an environment over N episodes. '''
 
     # Define arguments.
@@ -58,23 +64,24 @@ def run(gui=False, plot=True, training=False, certify=False, traj='sine', curr_p
     actions_uncert = []
     actions_cert = []
 
-    errors = []
-
     # Create environment.
     firmware_wrapper = make('firmware', env_func_500, FIRMWARE_FREQ, CTRL_FREQ)
     obs, info = firmware_wrapper.reset()
     env = firmware_wrapper.env
 
     # Create trajectory.
     full_trajectory = gen_traj(CTRL_FREQ, env.EPISODE_LEN_SEC)
-    lqr_gain = 0.05 * np.array([[4, 0.1]])
+    full_trajectory = np.hstack((full_trajectory, full_trajectory))
+
+    lqr_gain = 0.05 * np.array([[4,  0.1,  0,  0],
+                                [0,  0,    4,  0.1]])
 
     # Setup controller.
     ctrl = make(config.algo,
                 env_func,
                 **config.algo_config)
     ctrl.gain = lqr_gain
-    ctrl.model.U_EQ = 0
+    ctrl.model.U_EQ = np.array([[0, 0]]).T
 
     ctrl.env.X_GOAL = full_trajectory
     ctrl.env.TASK = Task.TRAJ_TRACKING
@@ -88,9 +95,10 @@ def run(gui=False, plot=True, training=False, certify=False, traj='sine', curr_p
         if training is True:
             safety_filter.learn(env=env)
             safety_filter.save(path=f'{curr_path}/models/mpsc_parameters/{config.safety_filter}_crazyflie_{task}.pkl')
-            1 / 0
+            1/0
         else:
             safety_filter.load(path=f'{curr_path}/models/mpsc_parameters/{config.safety_filter}_crazyflie_{task}.pkl')
+            safety_filter.env.X_GOAL = full_trajectory
 
         if config.sf_config.cost_function == Cost_Function.PRECOMPUTED_COST:
             safety_filter.cost_function.uncertified_controller = ctrl
@@ -101,25 +109,21 @@ def run(gui=False, plot=True, training=False, certify=False, traj='sine', curr_p
     states.append(env.state)
     action = env.U_GOAL
     successes = 0
-    estimated_vel = []
-    bad_estimated_vel = []
-    prev_vel = 0
-    prev_x = 0
-    alpha = 0.3
+
     for i in range(CTRL_FREQ * env.EPISODE_LEN_SEC):
-        curr_obs = np.atleast_2d(np.array([obs[0], obs[1]])).T
+        curr_obs = np.atleast_2d(obs[0:4]).T
+        curr_obs = curr_obs.reshape((4, 1))
         info['current_step'] = i
-        new_act = ctrl.select_action(curr_obs, info)[0]
-        new_act = np.clip(new_act, -0.25, 0.25)
+        new_act = ctrl.select_action(curr_obs, info)
+        new_act = np.clip(new_act, np.array([[-0.25, -0.25]]).T, np.array([[0.25, 0.25]]).T)
         actions_uncert.append(new_act)
         if certify is True:
             certified_action, success = safety_filter.certify_action(curr_obs, new_act, info)
             if success:
                 successes += 1
                 new_act = certified_action
         actions_cert.append(new_act)
-        next_state = A @ curr_obs + B * new_act
-        pos = [(new_act + curr_obs[0])[0], 0, 1]
+        pos = [(new_act[0] + curr_obs[0])[0], (new_act[1] + curr_obs[2])[0], 1]
         vel = [0, 0, 0]
         acc = [0, 0, 0]
         yaw = 0
@@ -131,15 +135,6 @@ def run(gui=False, plot=True, training=False, certify=False, traj='sine', curr_p
 
         # Step the environment.
         obs, _, _, info, action = firmware_wrapper.step(curr_time, action)
-        x_obs = obs[0] + np.random.normal(0.0, 0.001)
-        est_vel = (x_obs - prev_x) / CTRL_DT
-        bad_estimated_vel.append(est_vel)
-        prev_vel = (1 - alpha) * prev_vel + alpha * est_vel
-        prev_x = x_obs
-        estimated_vel.append(prev_vel)
-        obs[0] = x_obs
-        obs[1] = prev_vel
-        errors.append(np.squeeze(np.array([obs[0], obs[1]])) - np.squeeze(next_state))
 
         states.append(obs)
         if obs[4] < 0.05:
@@ -154,29 +149,18 @@ def run(gui=False, plot=True, training=False, certify=False, traj='sine', curr_p
     actions_uncert = np.array(actions_uncert)
     print('Number of Max Inputs: ', np.sum(np.abs(actions_uncert) == 0.25))
     actions_cert = np.array(actions_cert)
-    errors = np.array(errors)
-    corrections = actions_cert - actions_uncert
+    corrections = np.squeeze(actions_cert) - np.squeeze(actions_uncert)
 
     # Close the environment
     env.close()
     print('Elapsed Time: ', time.time() - ep_start)
-    print('Model Errors: ', np.linalg.norm(errors))
-    print(f'Feasible steps: {successes}/{CTRL_FREQ*env.EPISODE_LEN_SEC}')
     print('NUM ERRORS POS: ', np.sum(np.abs(states[:, 0]) >= 0.75))
     print('NUM ERRORS VEL: ', np.sum(np.abs(states[:, 1]) >= 0.5))
     print('Rate of change (inputs): ', np.linalg.norm(get_discrete_derivative(np.atleast_2d(actions_cert).T, CTRL_FREQ)))
-    print('Max Correction: ', np.max(np.abs(corrections)))
-    print('Magnitude of Corrections: ', np.linalg.norm(corrections))
-
-    if certify is False:
-        np.save('./models/results/states_uncert.npy', states)
-        np.save('./models/results/actions_uncert.npy', actions_uncert)
-        np.save('./models/results/errors_uncert.npy', errors)
-    else:
-        np.save('./models/results/states_cert.npy', states)
-        np.save('./models/results/actions_uncert.npy', actions_uncert)
-        np.save('./models/results/actions_cert.npy', actions_cert)
-        np.save('./models/results/errors_cert.npy', errors)
+    if certify:
+        print(f'Feasible steps: {float(successes)}/{CTRL_FREQ*env.EPISODE_LEN_SEC}')
+        print('Max Correction: ', np.max(np.abs(corrections)))
+        print('Magnitude of Corrections: ', np.linalg.norm(corrections))
 
     if plot:
         plt.plot(states[:, 0], label='x')
@@ -190,16 +174,92 @@ def run(gui=False, plot=True, training=False, certify=False, traj='sine', curr_p
         plt.legend()
         plt.show()
 
-        plt.plot(states[:, 1], label='vel x')
-        plt.plot(full_trajectory[:, 1], label='ref vel')
-        plt.plot(estimated_vel, label='est vel')
-        plt.plot(bad_estimated_vel, label='bad est vel')
-        plt.legend()
-        plt.show()
+    print('Experiment Complete.')
+
+
+def identify_system(curr_path='.'):
+    '''Drives the firmware-wrapped environment with a random input trajectory and records data for system identification.
+
+    At every step the first four observation entries are compared against the one-step
+    prediction of the module-level linear model (A, B). The states and actions are written
+    to a .mat file, the prediction errors to a .npy file, and the states are plotted.
+
+    Args:
+        curr_path (str): Root directory under which the `models/traj_data/` outputs are written.
+    '''
+    # Define arguments.
+    fac = ConfigFactory()
+    config = fac.merge()
+
+    CTRL_FREQ = config.task_config['ctrl_freq']
+    CTRL_DT = 1 / CTRL_FREQ
+
+    # The underlying environment is created at the firmware frequency; the wrapper
+    # receives both the firmware and the control frequency.
+    FIRMWARE_FREQ = 500
+    config.task_config['ctrl_freq'] = FIRMWARE_FREQ
+    env_func_500 = partial(make,
+                           config.task,
+                           **config.task_config)
+
+    states = []
+    actions = []
+
+    # Create environment.
+    firmware_wrapper = make('firmware', env_func_500, FIRMWARE_FREQ, CTRL_FREQ)
+    obs, _ = firmware_wrapper.reset()
+    env = firmware_wrapper.env
+
+    # Create trajectory.
+    input_traj = gen_input_traj(CTRL_FREQ, env.EPISODE_LEN_SEC, num_channels=2)
+    # Iterate over exactly the samples that were generated instead of a hard-coded
+    # count, so a different control frequency or episode length cannot index past
+    # the end of the trajectory (or silently ignore part of it).
+    num_steps = input_traj.shape[1]
+
+    states.append(env.state)
+    action = env.U_GOAL
+
+    errors = []
+
+    for i in range(num_steps):
+        curr_obs = np.atleast_2d(obs[0:4]).T
+        new_act = np.atleast_2d(input_traj[:, i]).T
+        actions.append(new_act)
+
+        # The two input channels are applied as offsets to observation entries 0 and 2;
+        # the third position component is held at 1.
+        pos = [(new_act[0] + curr_obs[0])[0], (new_act[1] + curr_obs[2])[0], 1]
+        args = [pos, [0, 0, 0], [0, 0, 0], 0, [0, 0, 0]]
+
+        curr_time = i * CTRL_DT
+        firmware_wrapper.sendFullStateCmd(*args, curr_time)
+
+        # Step the environment.
+        obs, _, _, _, action = firmware_wrapper.step(curr_time, action)
+        states.append(obs.copy())
+
+        # One-step prediction error of the linear model.
+        pred_next_state = A @ curr_obs + B @ new_act
+        errors.append(np.squeeze(obs[0:4] - np.squeeze(pred_next_state)))
+
+        if obs[4] < 0.05:
+            print('CRASHED!!!')
+            break
+
+    states = np.array(states)
+    actions = np.array(actions)
+    errors = np.array(errors)
+
+    normed_w = np.linalg.norm(errors, axis=1)
+    print('MAX ERROR:', np.max(normed_w))
+    print('MEAN ERROR:', np.mean(normed_w))
+    # Use magnitudes so that large negative errors are not hidden by a signed max.
+    print('MAX ERROR PER DIM:', np.max(np.abs(errors), axis=0))
+    print('TOTAL ERRORS BY CHANNEL:', np.sum(np.abs(errors), axis=0))
+
+    # Close the environment
+    env.close()
 
     print('Experiment Complete.')
-    savemat(f'{curr_path}/models/results/matlab_data.mat', {'states': states, 'actions': actions_cert})
+    savemat(f'{curr_path}/models/traj_data/matlab_data.mat', {'states': states, 'actions': actions})
+    # Save next to the .mat file, relative to curr_path rather than the working directory.
+    np.save(f'{curr_path}/models/traj_data/errors.npy', errors)
+
+    # NOTE(review): even-indexed state entries are plotted here and odd-indexed ones
+    # below, both with 'x'/'y'/'z' labels - presumably positions then velocities; confirm.
+    plt.plot(states[:, 0], label='x')
+    plt.plot(states[:, 2], label='y')
+    plt.plot(states[:, 4], label='z')
+    plt.legend()
+    plt.show()
+
+    plt.plot(states[:, 1], label='x')
+    plt.plot(states[:, 3], label='y')
+    plt.plot(states[:, 5], label='z')
+    plt.legend()
+    plt.show()
 
 
 if __name__ == '__main__':
     run()
+    # identify_system()
@@ -80,6 +80,24 @@ def plot_traj(CTRL_FREQ, TEST=0, CERTIFIED=False, COST_FUNCTION='one_step', M=2)
     plt.show()
 
 
+def gen_input_traj(CTRL_FREQ, EPISODE_LEN_SEC, num_channels=1, plot=False):
+    '''Generates random, varying-frequency sinusoidal input signals.
+
+    For every channel, 21 random frequency multipliers in [0, 4) are drawn and linearly
+    interpolated between consecutive values; the signal is 0.25 * sin(x * multiplier),
+    with x running from 0 to 12*pi.
+
+    Args:
+        CTRL_FREQ (int): Control frequency, used to size the trajectory.
+        EPISODE_LEN_SEC (int): Episode length, used to size the trajectory.
+        num_channels (int): Number of independently generated input signals.
+        plot (bool): If True, plot every generated channel.
+
+    Returns:
+        ndarray: One row per channel, each with 20 * CTRL_FREQ * EPISODE_LEN_SEC samples in [-0.25, 0.25].
+    '''
+    num_freqs = 20
+    samples_per_segment = CTRL_FREQ * EPISODE_LEN_SEC
+
+    # The sample grid is identical for every channel, so build it once.
+    x = np.linspace(0, 12*np.pi, num_freqs * samples_per_segment)
+
+    input_traj = []
+    for _ in range(num_channels):
+        # Squaring the draws from [0, 2) gives multipliers in [0, 4).
+        freqs = np.power(np.random.rand(num_freqs+1)*2, 2)
+        # Interpolate between each pair of consecutive multipliers, then concatenate the segments.
+        freqs = np.linspace(freqs[:-1], freqs[1:], samples_per_segment, axis=1).flatten()
+        input_traj.append(np.sin(np.multiply(x, freqs))*0.25)
+
+    if plot:
+        # Plot every channel rather than only the last one; this also avoids relying
+        # on a loop variable that is undefined when num_channels is 0.
+        for channel in input_traj:
+            plt.plot(channel)
+        plt.show()
+
+    return np.array(input_traj)
+
+
+
+
 def gen_traj(CTRL_FREQ, EPISODE_LEN_SEC, plot=False):
     CTRL_DT = 1.0 / CTRL_FREQ
 
@@ -133,6 +151,7 @@ def get_max_chatter(CERTIFIED, COST_FUNCTION, M):
     M = 10
 
     # gen_traj(CTRL_FREQ=25, EPISODE_LEN_SEC=20, plot=True)
-    plot_traj(CTRL_FREQ=25, TEST=TEST, CERTIFIED=CERTIFIED, COST_FUNCTION=COST_FUNCTION, M=M)
+    gen_input_traj(CTRL_FREQ=25, EPISODE_LEN_SEC=20, plot=True)
+    # plot_traj(CTRL_FREQ=25, TEST=TEST, CERTIFIED=CERTIFIED, COST_FUNCTION=COST_FUNCTION, M=M)
     # get_max_chatter(CERTIFIED=CERTIFIED, COST_FUNCTION=COST_FUNCTION, M=M)
     # calc_error(CTRL_FREQ=25, EPISODE_LEN_SEC=20, TEST=TEST, CERTIFIED=CERTIFIED, COST_FUNCTION=COST_FUNCTION, M=M)