From 6e06675778cff11e1014e1e858feffbc5bc87081 Mon Sep 17 00:00:00 2001 From: Federico-PizarroBejarano Date: Fri, 6 Dec 2024 16:40:56 -0500 Subject: [PATCH] Merging in latest changes from benchmark_mpsf which has nl_mpsc, changes to mpsc_acados, and some config changes --- .../ppo_quadrotor_2D_attitude.yaml | 6 +- .../quadrotor_2D_attitude_track.yaml | 6 +- .../mpsc_acados_quadrotor_2D_attitude.yaml | 1 + .../nl_mpsc_quadrotor_2D_attitude.yaml | 30 + .../ppo_quadrotor_2D_attitude.yaml | 6 +- .../quadrotor_2D_attitude_tracking.yaml | 1 + .../nl_mpsc_quadrotor_2D_attitude.pkl | Bin 0 -> 1872 bytes experiments/mpsc/mpsc_experiment.py | 6 +- experiments/mpsc/mpsc_experiment.sh | 1 + safe_control_gym/controllers/ppo/ppo.py | 17 +- safe_control_gym/safety_filters/__init__.py | 4 + .../safety_filters/mpsc/mpsc_acados.py | 165 ++- .../safety_filters/mpsc/nl_mpsc.py | 1051 +++++++++++++++++ 13 files changed, 1188 insertions(+), 106 deletions(-) create mode 100644 experiments/mpsc/config_overrides/nl_mpsc_quadrotor_2D_attitude.yaml create mode 100644 experiments/mpsc/models/mpsc_parameters/nl_mpsc_quadrotor_2D_attitude.pkl create mode 100644 safe_control_gym/safety_filters/mpsc/nl_mpsc.py diff --git a/examples/rl/config_overrides/quadrotor_2D_attitude/ppo_quadrotor_2D_attitude.yaml b/examples/rl/config_overrides/quadrotor_2D_attitude/ppo_quadrotor_2D_attitude.yaml index 099581cf8..383d80a3b 100644 --- a/examples/rl/config_overrides/quadrotor_2D_attitude/ppo_quadrotor_2D_attitude.yaml +++ b/examples/rl/config_overrides/quadrotor_2D_attitude/ppo_quadrotor_2D_attitude.yaml @@ -1,8 +1,8 @@ algo: ppo algo_config: # model args - hidden_dim: 128 - activation: tanh + hidden_dim: 64 + activation: relu # loss args gamma: 0.98 @@ -19,7 +19,7 @@ algo_config: critic_lr: 0.001 # runner args - max_env_steps: 2640000 + max_env_steps: 660000 rollout_batch_size: 1 rollout_steps: 660 eval_batch_size: 10 diff --git 
a/examples/rl/config_overrides/quadrotor_2D_attitude/quadrotor_2D_attitude_track.yaml b/examples/rl/config_overrides/quadrotor_2D_attitude/quadrotor_2D_attitude_track.yaml index 4110ab495..eab68983b 100644 --- a/examples/rl/config_overrides/quadrotor_2D_attitude/quadrotor_2D_attitude_track.yaml +++ b/examples/rl/config_overrides/quadrotor_2D_attitude/quadrotor_2D_attitude_track.yaml @@ -1,5 +1,4 @@ task_config: - seed: 1337 info_in_reset: True ctrl_freq: 60 pyb_freq: 60 @@ -36,13 +35,10 @@ task_config: # RL Reward rew_state_weight: [10, 0.1, 10, 0.1, 0.1, 0.001] rew_act_weight: [0.1, 0.1] + info_mse_metric_state_weight: [1, 0, 1, 0, 0, 0] rew_exponential: True constraints: - - constraint_form: default_constraint - constrained_variable: state - upper_bounds: [ 0.9, 2, 1.45, 2, 0.75, 3] - lower_bounds: [-0.9, -2, 0.55, -2, -0.75, -3] - constraint_form: default_constraint constrained_variable: input diff --git a/experiments/mpsc/config_overrides/mpsc_acados_quadrotor_2D_attitude.yaml b/experiments/mpsc/config_overrides/mpsc_acados_quadrotor_2D_attitude.yaml index 21146f069..a3cc8b21e 100644 --- a/experiments/mpsc/config_overrides/mpsc_acados_quadrotor_2D_attitude.yaml +++ b/experiments/mpsc/config_overrides/mpsc_acados_quadrotor_2D_attitude.yaml @@ -21,6 +21,7 @@ sf_config: warmstart: True integration_algo: rk4 use_terminal_set: False + max_w: 0.002 # Cost function cost_function: one_step_cost diff --git a/experiments/mpsc/config_overrides/nl_mpsc_quadrotor_2D_attitude.yaml b/experiments/mpsc/config_overrides/nl_mpsc_quadrotor_2D_attitude.yaml new file mode 100644 index 000000000..3df801790 --- /dev/null +++ b/experiments/mpsc/config_overrides/nl_mpsc_quadrotor_2D_attitude.yaml @@ -0,0 +1,30 @@ +safety_filter: nl_mpsc +sf_config: + # LQR controller parameters + q_mpc: [18, 0.1, 18, 0.5, 0.5, 0.0001] + r_mpc: [3., 3.] 
+ + # MPC Parameters + use_acados: True + horizon: 25 + warmstart: True + integration_algo: rk4 + use_terminal_set: False + + # Prior info + prior_info: + prior_prop: null + randomize_prior_prop: False + prior_prop_rand_info: null + + # Learning disturbance bounds + n_samples: 6000 + + # Cost function + cost_function: one_step_cost + mpsc_cost_horizon: 5 + decay_factor: 0.85 + + # Softening + soften_constraints: True + slack_cost: 250 diff --git a/experiments/mpsc/config_overrides/ppo_quadrotor_2D_attitude.yaml b/experiments/mpsc/config_overrides/ppo_quadrotor_2D_attitude.yaml index c9a8f8f93..638ab0f7f 100644 --- a/experiments/mpsc/config_overrides/ppo_quadrotor_2D_attitude.yaml +++ b/experiments/mpsc/config_overrides/ppo_quadrotor_2D_attitude.yaml @@ -1,8 +1,8 @@ algo: ppo algo_config: # model args - hidden_dim: 128 - activation: tanh + hidden_dim: 64 + activation: relu # loss args gamma: 0.98 @@ -19,7 +19,7 @@ algo_config: critic_lr: 0.001 # runner args - max_env_steps: 2640000 + max_env_steps: 660000 rollout_batch_size: 1 rollout_steps: 660 eval_batch_size: 10 diff --git a/experiments/mpsc/config_overrides/quadrotor_2D_attitude_tracking.yaml b/experiments/mpsc/config_overrides/quadrotor_2D_attitude_tracking.yaml index 4e127affa..2fe979028 100644 --- a/experiments/mpsc/config_overrides/quadrotor_2D_attitude_tracking.yaml +++ b/experiments/mpsc/config_overrides/quadrotor_2D_attitude_tracking.yaml @@ -34,6 +34,7 @@ task_config: # RL Reward rew_state_weight: [10, 0.1, 10, 0.1, 0.1, 0.001] rew_act_weight: [0.1, 0.1] + info_mse_metric_state_weight: [1, 0, 1, 0, 0, 0] rew_exponential: True constraints: diff --git a/experiments/mpsc/models/mpsc_parameters/nl_mpsc_quadrotor_2D_attitude.pkl b/experiments/mpsc/models/mpsc_parameters/nl_mpsc_quadrotor_2D_attitude.pkl new file mode 100644 index 0000000000000000000000000000000000000000..0c5896aa8894ab242cf875e27343ce92643ab441 GIT binary patch literal 1872 zcmZuxYfuwc7$t@f2(bp0K|nOYR?(>pjzw_XunQ5<1i@B8oFZumk$}WtNCXrrDu!23 
zM-~S~#l{v8%V;6iv1DB|g7{z@%u^~mHA6YJv20hR4x>wL2yHXQXl`LNkiKvl_*8%P9o>HMJ^bK^Z4f zC`75K#wJNDN)Rc~0#rjYLx>ooOih$b&CJ^6i{@l!q2Hk%0;+}rp&=n5{7K?7{{&V_ zG@55?(eK7lHGvaYNo}Oe=}Fi;DbY|OP^q_@#6WeNT+VNCC0* zD9WQmqZT=ez(!!BMy1T005-+S%9v8V=xF~NxUG>>mVvh5`A_Fwpfc!~m-p|%*IJiy z*_7%V&hEAN$H+5`_QOrnxXc41gk1{q!uP<{JJnv??Dm8*aeg3Hr+7PgpZ6Hod9h2I zTF0mP04`VEK(%AF*%3xl)IvQd<_b;abnr;jJ_-&;@(|R~b8Z$^QM5a9nBg z`?QuN-0KFb`9IltPx}M9fDhohK9mwZAHnixMfKv7?bG`J{(vsv12_XZPORe~C~*`T ziU5^5Nu8$(DRl*9oJE$A_rt)d#F*M32kyZVhG8trq<34GUo58niFYdteZp$$@I+~t zx?bnV<)%97IJ9EDecbL(H5aRJr|s_;lE5l_`}qi=slyTLtC-WJhP6;v<33%V;1zsU zyLZJ`!fM#!Vap62K0C^|PXAG1tO>r9#B&_Y>xR{VclWkOeT1~#;Vh=B8}`9;>_$V% zIJ~-u)l|jT!>37{x8~cPrpx{C!K96MpjQYMuFZQ?RW$--TT8ev>Em#~VE@E!87f*HEaRSaP544x=#J%`ydPv- z=7zndIz+$zdjxVOadvNJ4@}&90ngQzO{_L}VIC7{kAxd0^#i28Tv8X>cixAw$b%cx z+q*F8nHLr{d&9o;KirUSvXXP1&>q;6+{b#--?>!=zW-TwEM{-eHrwP$y*G)gbREB2 zsjjn>(Jn@kpcDxc#w&s^cGC@xgMvD}}U1XAX zXjs#k{R^3-B~K;ER1G$y!?l2rCKIIylgU(DRk5}6Ks33^S}crDn&D7cM3*shcp0~R z-V-fogh4Fo8a0nWOthjAPs9)m;>zmVp8U51Fo?>uW-}f{k-%gggP7FaXC8w{UE{lY zYjQ6PqPgv8u_BpFMEYkwS?Z%G8w9o5GF6WM-HXq9@(d>!7jFtj(hG1_2j-8Id*?rI z!~L<^x))={)J~|IT(v;TQ_Qy^` zKo{@G@Zu{Q+IT2XNGk*h4o$R7lJ5+O)-d#`Hdb zKcEZv08W0-T2kCMZ0Sj=V8%lJ_rS2BiCdSCoYKGhv|H{TZ-7iO3mw8j`|*x*YaO1^ z25>n>V{``BL4Iueii(hpdfm^3HjA%x;D=bZ0)|iY;u(CG5|_MOXoqa`hnm#mdVi-i zQ7w&Q_)4hKj=$^)Za!&-OitVlVRW2mrlz#9G^JO-Uul!eJxgz<=`Pr<$mHN#`*zq< lo}Txcm-*YBdE!C8QBGt)Nmb)b_T?)PVM~mDQ`9QYe*sPzZR`L5 literal 0 HcmV?d00001 diff --git a/experiments/mpsc/mpsc_experiment.py b/experiments/mpsc/mpsc_experiment.py index a82b0329b..14500fc17 100644 --- a/experiments/mpsc/mpsc_experiment.py +++ b/experiments/mpsc/mpsc_experiment.py @@ -153,8 +153,8 @@ def run_multiple_models(plot, all_models): all_cert_results[key].append(cert_results[key][0]) met = MetricExtractor() - uncert_metrics = met.compute_metrics(data=all_uncert_results) - cert_metrics = met.compute_metrics(data=all_cert_results) + uncert_metrics = met.compute_metrics(data=all_uncert_results, 
max_steps=660) + cert_metrics = met.compute_metrics(data=all_cert_results, max_steps=66) all_results = {'uncert_results': all_uncert_results, 'uncert_metrics': uncert_metrics, @@ -170,4 +170,4 @@ def run_multiple_models(plot, all_models): if __name__ == '__main__': # run(plot=True, training=False, model='none') - run_multiple_models(plot=True, all_models=['mpsf']) + run_multiple_models(plot=True, all_models=['mpsf7']) diff --git a/experiments/mpsc/mpsc_experiment.sh b/experiments/mpsc/mpsc_experiment.sh index 7b0bf4358..3b0350083 100755 --- a/experiments/mpsc/mpsc_experiment.sh +++ b/experiments/mpsc/mpsc_experiment.sh @@ -4,6 +4,7 @@ SYS='quadrotor_2D_attitude' TASK='tracking' ALGO='ppo' +# SAFETY_FILTER='nl_mpsc' SAFETY_FILTER='mpsc_acados' # MPSC_COST='one_step_cost' MPSC_COST='precomputed_cost' diff --git a/safe_control_gym/controllers/ppo/ppo.py b/safe_control_gym/controllers/ppo/ppo.py index c70fc5b0d..4dbf25931 100644 --- a/safe_control_gym/controllers/ppo/ppo.py +++ b/safe_control_gym/controllers/ppo/ppo.py @@ -238,14 +238,15 @@ def run(self, action = self.select_action(obs=obs, info=info) # Adding safety filter - success = False - physical_action = env.denormalize_action(action) - unextended_obs = np.squeeze(true_obs)[:env.symbolic.nx] - certified_action, success = self.safety_filter.certify_action(unextended_obs, physical_action, info) - if success: - action = env.normalize_action(certified_action) - else: - self.safety_filter.ocp_solver.reset() + if self.safety_filter is not None: + success = False + physical_action = env.denormalize_action(action) + unextended_obs = np.squeeze(true_obs)[:env.symbolic.nx] + certified_action, success = self.safety_filter.certify_action(unextended_obs, physical_action, info) + if success: + action = env.normalize_action(certified_action) + else: + self.safety_filter.ocp_solver.reset() action = np.atleast_2d(np.squeeze([action])) obs, rew, done, info = env.step(action) diff --git 
a/safe_control_gym/safety_filters/__init__.py b/safe_control_gym/safety_filters/__init__.py index 41527f16c..b82a4b201 100644 --- a/safe_control_gym/safety_filters/__init__.py +++ b/safe_control_gym/safety_filters/__init__.py @@ -6,6 +6,10 @@ entry_point='safe_control_gym.safety_filters.mpsc.linear_mpsc:LINEAR_MPSC', config_entry_point='safe_control_gym.safety_filters.mpsc:mpsc.yaml') +register(idx='nl_mpsc', + entry_point='safe_control_gym.safety_filters.mpsc.nl_mpsc:NL_MPSC', + config_entry_point='safe_control_gym.safety_filters.mpsc:mpsc.yaml') + register(idx='mpsc_acados', entry_point='safe_control_gym.safety_filters.mpsc.mpsc_acados:MPSC_ACADOS', config_entry_point='safe_control_gym.safety_filters.mpsc:mpsc.yaml') diff --git a/safe_control_gym/safety_filters/mpsc/mpsc_acados.py b/safe_control_gym/safety_filters/mpsc/mpsc_acados.py index 1846f85ca..ec32fbff5 100644 --- a/safe_control_gym/safety_filters/mpsc/mpsc_acados.py +++ b/safe_control_gym/safety_filters/mpsc/mpsc_acados.py @@ -3,12 +3,10 @@ import shutil from datetime import datetime -import casadi as cs import numpy as np import scipy from acados_template import AcadosModel, AcadosOcp, AcadosOcpSolver -from safe_control_gym.controllers.mpc.mpc_utils import set_acados_constraint_bound from safe_control_gym.safety_filters.mpsc.mpsc import MPSC from safe_control_gym.safety_filters.mpsc.mpsc_utils import Cost_Function from safe_control_gym.utils.utils import timing @@ -35,6 +33,7 @@ def __init__( cost_function: Cost_Function = Cost_Function.ONE_STEP_COST, mpsc_cost_horizon: int = 5, decay_factor: float = 0.85, + max_w: float = 0.0, **kwargs ): '''Creates task and controller. 
@@ -71,11 +70,71 @@ def __init__( # acados settings self.use_RTI = use_RTI + self.n = self.model.nx + self.m = self.model.nu + self.q = self.model.nx + + self.state_constraint = self.constraints.state_constraints[0] + self.input_constraint = self.constraints.input_constraints[0] + + [self.X_mid, L_x, l_x] = self.box2polytopic(self.state_constraint) + [self.U_mid, L_u, l_u] = self.box2polytopic(self.input_constraint) + + # number of constraints + p_x = l_x.shape[0] + p_u = l_u.shape[0] + self.p = p_x + p_u + + self.L_x = np.vstack((L_x, np.zeros((p_u, self.n)))) + self.L_u = np.vstack((np.zeros((p_x, self.m)), L_u)) + self.l_xu = np.concatenate([l_x, l_u]) + # Dynamics model. self.setup_acados_model() # Acados optimizer. self.setup_acados_optimizer() + def box2polytopic(self, constraint): + '''Convert constraints into an explicit polytopic form. This assumes that constraints contain the origin. + + Args: + constraint (Constraint): The constraint to be converted. + + Returns: + L (ndarray): The polytopic matrix. + l (ndarray): Whether the constraint is active. 
+ ''' + + Limit = [] + limit_active = [] + + Z_mid = (constraint.upper_bounds + constraint.lower_bounds) / 2.0 + Z_limits = np.array([[constraint.upper_bounds[i] - Z_mid[i], constraint.lower_bounds[i] - Z_mid[i]] for i in range(constraint.upper_bounds.shape[0])]) + + dim = Z_limits.shape[0] + eye_dim = np.eye(dim) + + for constraint_id in range(0, dim): + if Z_limits[constraint_id, 0] != -float('inf'): + if Z_limits[constraint_id, 0] == 0: + limit_active += [0] + Limit += [-eye_dim[constraint_id, :]] + else: + limit_active += [1] + factor = 1 / Z_limits[constraint_id, 0] + Limit += [factor * eye_dim[constraint_id, :]] + + if Z_limits[constraint_id, 1] != float('inf'): + if Z_limits[constraint_id, 1] == 0: + limit_active += [0] + Limit += [eye_dim[constraint_id, :]] + else: + limit_active += [1] + factor = 1 / Z_limits[constraint_id, 1] + Limit += [factor * eye_dim[constraint_id, :]] + + return Z_mid, np.array(Limit), np.array(limit_active) + @timing def reset(self): '''Prepares for training or evaluation.''' @@ -130,7 +189,6 @@ def setup_acados_optimizer(self): '''Sets up nonlinear optimization problem.''' nx, nu = self.model.nx, self.model.nu ny = nx + nu - ny_e = nx # create ocp object to formulate the OCP ocp = AcadosOcp() @@ -141,21 +199,17 @@ def setup_acados_optimizer(self): # set cost (NOTE: safe-control-gym uses quadratic cost) ocp.cost.cost_type = 'LINEAR_LS' - ocp.cost.cost_type_e = 'LINEAR_LS' Q_mat = np.zeros((nx, nx)) R_mat = np.eye(nu) - ocp.cost.W_e = np.zeros((nx, nx)) ocp.cost.W = scipy.linalg.block_diag(Q_mat, R_mat) ocp.cost.Vx = np.zeros((ny, nx)) ocp.cost.Vu = np.zeros((ny, nu)) ocp.cost.Vu[nx:nx + nu, :] = np.eye(nu) - ocp.cost.Vx_e = np.eye(nx) - # placeholder y_ref and y_ref_e (will be set in select_action) + # placeholder y_ref ocp.cost.yref = np.zeros((ny, )) - ocp.cost.yref_e = np.zeros((ny_e, )) # set up solver options ocp.solver_options.qp_solver = 'PARTIAL_CONDENSING_HPIPM' @@ -165,33 +219,20 @@ def setup_acados_optimizer(self): 
ocp.solver_options.nlp_solver_max_iter = 25 if not self.use_RTI else 1 ocp.solver_options.tf = self.horizon * self.dt # prediction horizon + ocp.constraints.constr_type = 'BGH' ocp.constraints.x0 = self.model.X_EQ - - # Constraints - # general constraint expressions - state_constraint_expr_list = [] - input_constraint_expr_list = [] - for state_constraint in self.state_constraints_sym: - state_constraint_expr_list.append(state_constraint(ocp.model.x)) - for input_constraint in self.input_constraints_sym: - input_constraint_expr_list.append(input_constraint(ocp.model.u)) - - h_expr_list = state_constraint_expr_list + input_constraint_expr_list - h_expr = cs.vertcat(*h_expr_list) - h0_expr = cs.vertcat(*h_expr_list) - he_expr = cs.vertcat(*state_constraint_expr_list) # terminal constraints are only state constraints - # pass the constraints to the ocp object - ocp = self.processing_acados_constraints_expression(ocp, h0_expr, h_expr, he_expr) + ocp.constraints.C = self.L_x + ocp.constraints.D = self.L_u + ocp.constraints.lg = -1000 * np.ones((self.p)) + ocp.constraints.ug = np.zeros((self.p)) # slack costs for nonlinear constraints if self.soften_constraints: - # slack variables for all constraints - ocp.constraints.Jsh = np.eye(2 * ny) - # slack penalty - ocp.cost.Zu = self.slack_cost * np.ones(2 * ny) - ocp.cost.Zl = self.slack_cost * np.ones(2 * ny) - ocp.cost.zl = self.slack_cost * np.ones(2 * ny) - ocp.cost.zu = self.slack_cost * np.ones(2 * ny) + ocp.constraints.Jsg = np.eye(self.p) + ocp.cost.Zu = self.slack_cost * np.ones(self.p) + ocp.cost.Zl = self.slack_cost * np.ones(self.p) + ocp.cost.zl = self.slack_cost * np.ones(self.p) + ocp.cost.zu = self.slack_cost * np.ones(self.p) solver_json = 'acados_ocp_mpsf.json' ocp_solver = AcadosOcpSolver(ocp, json_file=solver_json, generate=True, build=True) @@ -202,58 +243,14 @@ def setup_acados_optimizer(self): for stage in range(self.mpsc_cost_horizon, self.horizon): ocp_solver.cost_set(stage, 'W', 0 * ocp.cost.W) - 
self.ocp_solver = ocp_solver - self.ocp = ocp + g = np.zeros((self.horizon, self.p)) - def processing_acados_constraints_expression(self, ocp: AcadosOcp, h0_expr, h_expr, he_expr) -> AcadosOcp: - '''Preprocess the constraints to be compatible with acados. - Args: - ocp (AcadosOcp): acados ocp object - h0_expr (casadi expression): initial state constraints - h_expr (casadi expression): state and input constraints - he_expr (casadi expression): terminal state constraints - Returns: - ocp (AcadosOcp): acados ocp object with constraints set. - - An alternative way to set the constraints is to use bounded constraints of acados: - # bounded input constraints - idxbu = np.where(np.sum(self.env.constraints.input_constraints[0].constraint_filter, axis=0) != 0)[0] - ocp.constraints.Jbu = np.eye(nu) - ocp.constraints.lbu = self.env.constraints.input_constraints[0].lower_bounds - ocp.constraints.ubu = self.env.constraints.input_constraints[0].upper_bounds - ocp.constraints.idxbu = idxbu # active constraints dimension - ''' + for i in range(self.horizon): + for j in range(self.p): + tighten_by = (self.max_w * i) if (j < nx * 2) else 0 + g[i, j] = (self.l_xu[j] - tighten_by) + g[i, :] += (self.L_x @ self.X_mid) + (self.L_u @ self.U_mid) + ocp_solver.constraints_set(i, 'ug', g[i, :]) - ub = {'h': set_acados_constraint_bound(h_expr, 'ub', self.constraint_tol), - 'h0': set_acados_constraint_bound(h0_expr, 'ub', self.constraint_tol), - 'he': set_acados_constraint_bound(he_expr, 'ub', self.constraint_tol), } - - lb = {'h': set_acados_constraint_bound(h_expr, 'lb'), - 'h0': set_acados_constraint_bound(h0_expr, 'lb'), - 'he': set_acados_constraint_bound(he_expr, 'lb'), } - - # make sure all the ub and lb are 1D numpy arrays - # (see: https://discourse.acados.org/t/infeasible-qps-when-using-nonlinear-casadi-constraint-expressions/1595/5?u=mxche) - for key in ub.keys(): - ub[key] = ub[key].flatten() if ub[key].ndim != 1 else ub[key] - lb[key] = lb[key].flatten() if lb[key].ndim != 1 else 
lb[key] - # check ub and lb dimensions - for key in ub.keys(): - assert ub[key].ndim == 1, f'ub[{key}] is not 1D numpy array' - assert lb[key].ndim == 1, f'lb[{key}] is not 1D numpy array' - assert ub['h'].shape == lb['h'].shape, 'h_ub and h_lb have different shapes' - - # pass the constraints to the ocp object - ocp.model.con_h_expr_0, ocp.model.con_h_expr, ocp.model.con_h_expr_e = \ - h0_expr, h_expr, he_expr - ocp.dims.nh_0, ocp.dims.nh, ocp.dims.nh_e = \ - h0_expr.shape[0], h_expr.shape[0], he_expr.shape[0] - # assign constraints upper and lower bounds - ocp.constraints.uh_0 = ub['h0'] - ocp.constraints.lh_0 = lb['h0'] - ocp.constraints.uh = ub['h'] - ocp.constraints.lh = lb['h'] - ocp.constraints.uh_e = ub['he'] - ocp.constraints.lh_e = lb['he'] - - return ocp + self.ocp_solver = ocp_solver + self.ocp = ocp diff --git a/safe_control_gym/safety_filters/mpsc/nl_mpsc.py b/safe_control_gym/safety_filters/mpsc/nl_mpsc.py new file mode 100644 index 000000000..36b2f012c --- /dev/null +++ b/safe_control_gym/safety_filters/mpsc/nl_mpsc.py @@ -0,0 +1,1051 @@ +'''NL Model Predictive Safety Certification (NL MPSC). + +The core idea is that any learning controller input can be either certificated as safe or, if not safe, corrected +using an MPC controller based on Robust NL MPC. + +Based on + * K.P. Wabsersich and M.N. Zeilinger 'Linear model predictive safety certification for learning-based control' 2019 + https://arxiv.org/pdf/1803.08552.pdf + * J. Köhler, R. Soloperto, M. A. Müller, and F. Allgöwer, “A computationally efficient robust model predictive + control framework for uncertain nonlinear systems -- extended version,” IEEE Trans. Automat. Contr., vol. 66, + no. 2, pp. 794 801, Feb. 2021, doi: 10.1109/TAC.2020.2982585. 
http://arxiv.org/abs/1910.12081 +''' + +import pickle + +import casadi as cs +import cvxpy as cp +import numpy as np +from acados_template import AcadosOcp, AcadosOcpSolver +from acados_template.acados_model import AcadosModel +from pytope import Polytope +from scipy.linalg import block_diag, solve_discrete_are, sqrtm + +from safe_control_gym.controllers.mpc.mpc_utils import discretize_linear_system, rk_discrete +from safe_control_gym.envs.benchmark_env import Environment, Task +from safe_control_gym.safety_filters.cbf.cbf_utils import cartesian_product +from safe_control_gym.safety_filters.mpsc.mpsc import MPSC +from safe_control_gym.safety_filters.mpsc.mpsc_utils import Cost_Function + + +class NL_MPSC(MPSC): + '''Model Predictive Safety Certification Class.''' + + def __init__(self, + env_func, + horizon: int = 10, + q_mpc: list = None, + r_mpc: list = None, + integration_algo: str = 'rk4', + warmstart: bool = True, + additional_constraints: list = None, + use_terminal_set: bool = True, + n_samples: int = 600, + cost_function: Cost_Function = Cost_Function.ONE_STEP_COST, + mpsc_cost_horizon: int = 5, + decay_factor: float = 0.85, + soften_constraints: bool = False, + slack_cost: float = 250, + **kwargs + ): + '''Initialize the MPSC. + + Args: + env_func (partial BenchmarkEnv): Environment for the task. + horizon (int): The MPC horizon. + integration_algo (str): The algorithm used for integrating the dynamics, + either 'rk4', 'rk', or 'cvodes'. + warmstart (bool): If the previous MPC soln should be used to warmstart the next mpc step. + additional_constraints (list): List of additional constraints to consider. + use_terminal_set (bool): Whether to use a terminal set constraint or not. + n_samples (int): The number of state/action pairs to test when determining w_func. + cost_function (Cost_Function): A string (from Cost_Function) representing the cost function to be used. + mpsc_cost_horizon (int): How many steps forward to check for constraint violations. 
+ decay_factor (float): How much to discount future costs. + ''' + + self.model_bias = None + super().__init__(env_func, horizon, q_mpc, r_mpc, integration_algo, warmstart, additional_constraints, use_terminal_set, cost_function, mpsc_cost_horizon, decay_factor, **kwargs) + + self.n_samples = n_samples + self.soften_constraints = soften_constraints + self.slack_cost = slack_cost + + self.n = self.model.nx + self.m = self.model.nu + self.q = self.model.nx + + self.state_constraint = self.constraints.state_constraints[0] + self.input_constraint = self.constraints.input_constraints[0] + + [self.X_mid, L_x, l_x] = self.box2polytopic(self.state_constraint) + [self.U_mid, L_u, l_u] = self.box2polytopic(self.input_constraint) + + # number of constraints + p_x = l_x.shape[0] + p_u = l_u.shape[0] + self.p = p_x + p_u + + self.L_x = np.vstack((L_x, np.zeros((p_u, self.n)))) + self.L_u = np.vstack((np.zeros((p_x, self.m)), L_u)) + self.l_xu = np.concatenate([l_x, l_u]) + + def set_dynamics(self): + '''Compute the discrete dynamics.''' + + if self.integration_algo == 'LTI': + dfdxdfdu = self.model.df_func(x=self.X_EQ, u=self.U_EQ) + self.Ac = dfdxdfdu['dfdx'].toarray() + self.Bc = dfdxdfdu['dfdu'].toarray() + + delta_x = self.model.x_sym + delta_u = self.model.u_sym + delta_w = cs.MX.sym('delta_w', self.model.nx, 1) + + self.Ad, self.Bd = discretize_linear_system(self.Ac, self.Bc, self.dt, exact=True) + + x_dot_lin_vec = self.Ad @ delta_x + self.Bd @ delta_u + + if self.model_bias is not None: + x_dot_lin_vec = x_dot_lin_vec + self.model_bias + + dynamics_func = cs.Function('fd', + [delta_x, delta_u], + [x_dot_lin_vec], + ['x0', 'p'], + ['xf']) + + self.Ac = cs.Function('Ac', [delta_x, delta_u, delta_w], [self.Ac], ['x', 'u', 'w'], ['Ac']) + self.Bc = cs.Function('Bc', [delta_x, delta_u, delta_w], [self.Bc], ['x', 'u', 'w'], ['Bc']) + + self.Ad = cs.Function('Ad', [delta_x, delta_u, delta_w], [self.Ad], ['x', 'u', 'w'], ['Ad']) + self.Bd = cs.Function('Bd', [delta_x, delta_u, 
delta_w], [self.Bd], ['x', 'u', 'w'], ['Bd']) + elif self.integration_algo == 'rk4': + dynamics_func = rk_discrete(self.model.fc_func, + self.model.nx, + self.model.nu, + self.dt) + else: + dynamics_func = cs.integrator('fd', self.integration_algo, + {'x': self.model.x_sym, + 'p': self.model.u_sym, + 'ode': self.model.x_dot}, {'tf': self.dt} + ) + + self.dynamics_func = dynamics_func + + def learn(self, + env=None, + **kwargs + ): + '''Compute values used by the MPC. + + Args: + env (BenchmarkEnv): If a different environment is to be used for learning, can supply it here. + ''' + + if env is None: + env = self.training_env + + if self.env.NAME == Environment.CARTPOLE: + self.x_r = np.array([self.X_EQ[0], 0, 0, 0]) + elif self.env.NAME == Environment.QUADROTOR and self.env.QUAD_TYPE in [2, 4]: + self.x_r = np.array([self.X_EQ[0], 0, self.X_EQ[2], 0, 0, 0]) + elif self.env.NAME == Environment.QUADROTOR and self.env.QUAD_TYPE == 3: + self.x_r = np.array([self.X_EQ[0], 0, self.X_EQ[2], 0, self.X_EQ[4], 0, 0, 0, 0, 0, 0, 0]) + self.u_r = self.U_EQ + + x_sym = self.model.x_sym + u_sym = self.model.u_sym + w_sym = cs.MX.sym('delta_w', self.q, 1) + + self.get_error_function(env=env) + if self.integration_algo == 'rk4': + self.Ec = np.diag(self.max_w_per_dim) / self.dt + + self.f = cs.Function('f', [x_sym, u_sym, w_sym], [self.model.fc_func(x_sym + self.X_mid, u_sym + self.U_mid) + self.Ec @ w_sym], ['x', 'u', 'w'], ['f']) + phi_1 = cs.Function('phi_1', [x_sym, u_sym, w_sym], [self.f(x_sym, u_sym, w_sym)], ['x', 'u', 'w'], ['phi_1']) + phi_2 = cs.Function('phi_2', [x_sym, u_sym, w_sym], [self.f(x_sym + 0.5 * self.dt * phi_1(x_sym, u_sym, w_sym), u_sym, w_sym)], ['x', 'u', 'w'], ['phi_2']) + phi_3 = cs.Function('phi_3', [x_sym, u_sym, w_sym], [self.f(x_sym + 0.5 * self.dt * phi_2(x_sym, u_sym, w_sym), u_sym, w_sym)], ['x', 'u', 'w'], ['phi_3']) + phi_4 = cs.Function('phi_4', [x_sym, u_sym, w_sym], [self.f(x_sym + self.dt * phi_3(x_sym, u_sym, w_sym), u_sym, w_sym)], ['x', 
'u', 'w'], ['phi_4']) + rungeKutta = x_sym + self.dt / 6 * (phi_1(x_sym, u_sym, w_sym) + 2 * phi_2(x_sym, u_sym, w_sym) + 2 * phi_3(x_sym, u_sym, w_sym) + phi_4(x_sym, u_sym, w_sym)) + self.disc_f = cs.Function('disc_f', [x_sym, u_sym, w_sym], [rungeKutta + self.X_mid], ['x', 'u', 'w'], ['disc_f']) + + self.Ac = cs.Function('Ac', [x_sym, u_sym, w_sym], [cs.jacobian(self.f(x_sym, u_sym, w_sym), x_sym)], ['x', 'u', 'w'], ['Ac']) + self.Bc = cs.Function('Bc', [x_sym, u_sym, w_sym], [cs.jacobian(self.f(x_sym, u_sym, w_sym), u_sym)], ['x', 'u', 'w'], ['Bc']) + + self.Ad = cs.Function('Ad', [x_sym, u_sym, w_sym], [cs.jacobian(self.disc_f(x_sym, u_sym, w_sym), x_sym)], ['x', 'u', 'w'], ['Ad']) + self.Bd = cs.Function('Bd', [x_sym, u_sym, w_sym], [cs.jacobian(self.disc_f(x_sym, u_sym, w_sym), u_sym)], ['x', 'u', 'w'], ['Bd']) + elif self.integration_algo == 'LTI': + self.Ed = np.diag(self.max_w_per_dim) + self.Ec = self.Ed / self.dt + + self.f = cs.Function('disc_f', [x_sym, u_sym, w_sym], [self.Ac(x_sym, u_sym, w_sym) @ x_sym + self.Bc(x_sym, u_sym, w_sym) @ u_sym + self.Ec @ w_sym], ['x', 'u', 'w'], ['disc_f']) + self.disc_f = cs.Function('disc_f', [x_sym, u_sym, w_sym], [self.Ad(x_sym, u_sym, w_sym) @ x_sym + self.Bd(x_sym, u_sym, w_sym) @ u_sym + self.Ed @ w_sym], ['x', 'u', 'w'], ['disc_f']) + + self.synthesize_lyapunov() + self.get_terminal_ingredients() + + self.L_x_sym = cs.MX(self.L_x) + self.L_u_sym = cs.MX(self.L_u) + self.L_size = np.sum(np.abs(self.L_x), axis=1) + np.sum(np.abs(self.L_u), axis=1) + self.L_size_sym = cs.MX(self.L_size) + self.l_sym = cs.MX(self.l_xu) + self.setup_optimizer() + + def get_error_function(self, env): + '''Computes the maximum disturbance found in the training environment. + + Args: + env (BenchmarkEnv): If a different environment is to be used for learning, can supply it here. + ''' + + if env is None: + env = self.training_env + + # Create set of error residuals. 
+ w = np.zeros((self.n_samples, self.n)) + states = np.zeros((self.n_samples, self.n)) + actions = np.zeros((self.n_samples, self.m)) + + # Use uniform sampling of control inputs and states. + for i in range(self.n_samples): + init_state = env.reset()[0][:self.n] + states[i, :] = init_state + if self.env.NAME == Environment.QUADROTOR: + u = np.random.rand(self.model.nu) / 20 - 1 / 40 + self.U_EQ + else: + u = env.action_space.sample() # Will yield a random action within action space. + actions[i, :] = u + x_next_obs = env.step(u)[0][:self.n] + x_next_estimate = np.squeeze(self.dynamics_func(x0=init_state, p=u)['xf'].toarray()) + w[i, :] = x_next_obs - x_next_estimate + + print('MEAN ERROR PER DIM:', np.mean(w, axis=0)) + self.model_bias = np.mean(w, axis=0) + # self.model_bias = np.array([-4.938e-07, -3.543e-05, -8.896e-07, -1.934e-04, -1.112e-05, -2.644e-05]) + self.set_dynamics() + + num_stds = 2 + w = w - np.mean(w, axis=0) + normed_w = np.linalg.norm(w, axis=1) + self.max_w_per_dim = np.minimum(np.max(np.abs(w), axis=0), np.mean(np.abs(w), axis=0) + num_stds * np.std(np.abs(w), axis=0)) + self.max_w = min(np.max(normed_w), np.mean(normed_w) + num_stds * np.std(normed_w)) + # self.max_w_per_dim = np.array([0.00052966, 0.04261379, 0.00027445, 0.02223242, 0.00361825, 0.01043795])/10.0 + # self.max_w = 0.04483104869135911/10.0 + + print('MAX ERROR:', np.max(normed_w)) + print('STD ERROR:', np.mean(normed_w) + num_stds * np.std(normed_w)) + print('MEAN ERROR:', np.mean(normed_w)) + print('MAX ERROR PER DIM:', np.max(np.abs(w), axis=0)) + print('STD ERROR PER DIM:', np.mean(np.abs(w), axis=0) + num_stds * np.std(np.abs(w), axis=0)) + print('TOTAL ERRORS BY CHANNEL:', np.sum(np.abs(w), axis=0)) + + # if self.integration_algo == 'LTI': + # degree = 1 + # num_stds = 2 + # else: + # degree = 2 + # num_stds = 3 + # self.error_parameters = get_error_parameters(states, actions, normed_w, degree) + # def w_func(state, action): + # input_vec = cs.horzcat(state.T, action.T) + 
        # return error_function(*self.error_parameters, num_stds, input_vec)
        # self.w_func = w_func

    def synthesize_lyapunov(self):
        '''Synthesize the appropriate constants related to the lyapunov function of the system.

        Searches for a feasible S-procedure multiplier lambda (doubling from a small
        starting value), then line-searches lambda over a log-spaced grid for the
        lowest-cost tube SDP, and finally derives the discrete-time tube constants
        (rho, w_bar, s_bar_f, gamma, delta_loc) from the continuous-time solution.
        '''
        # Incremental Lyapunov function: Find upper bound for S-procedure variable lambda
        lamb_lb = None
        lamb_ub = None

        lamb = 0.008  # lambda lower bound
        self.rho_c = 0.192  # tuning parameter determines how fast the lyapunov function contracts

        # Vertices of the parameter set (e.g. pitch angle) over which the SDP must hold.
        if self.integration_algo == 'LTI':
            self.Theta = [0]
        elif self.env.NAME == Environment.CARTPOLE or (self.env.NAME == Environment.QUADROTOR and self.env.QUAD_TYPE in [2, 4]):
            self.Theta = [self.state_constraint.lower_bounds[-2], 0, self.state_constraint.upper_bounds[-2]]
        else:
            self.Theta = [self.state_constraint.lower_bounds[6], 0, self.state_constraint.upper_bounds[6]]

        # Double lambda until the SDP becomes infeasible again, bracketing the feasible range.
        while lamb < 100:
            lamb = lamb * 2
            [X, Y, cost, constraints] = self.setup_tube_optimization(lamb)
            prob = cp.Problem(cp.Minimize(cost), constraints)
            try:
                print(f'Attempting with lambda={lamb}.')
                cost = prob.solve(solver=cp.MOSEK, verbose=False)
                if prob.status == 'optimal' and cost != float('inf'):
                    print(f'Succeeded with cost={cost}.')
                    if lamb_lb is None:
                        lamb_lb = lamb
                    lamb_ub = lamb
                else:
                    raise Exception('Not optimal or cost is infinite.')
            except Exception as e:
                print('Error in optimization:', e)
                if lamb_lb is not None:
                    break

        # Incremental Lyapunov function: Determine optimal lambda
        lamb_lb = lamb_lb / 2
        lamb_ub = lamb_ub * 2

        num_candidates = 50

        lambda_candidates = np.logspace(np.log(lamb_lb) / np.log(10), np.log(lamb_ub) / np.log(10), num_candidates)
        cost_values = []

        for i in range(num_candidates):
            lambda_candidate = lambda_candidates[i]
            [X, Y, cost, constraints] = self.setup_tube_optimization(lambda_candidate)
            prob = cp.Problem(cp.Minimize(cost), constraints)
            try:
                cost = prob.solve(solver=cp.MOSEK, verbose=False)
                if prob.status != 'optimal' or cost == float('inf'):
                    raise cp.SolverError
            except Exception as e:
                print('Error in optimization:', e)
                cost = float('inf')
            cost_values += [cost]

        # Re-solve once at the best candidate to recover the optimizer values.
        best_index = cost_values.index(min(cost_values))
        best_lamb = lambda_candidates[best_index]
        [X, Y, cost, constraints] = self.setup_tube_optimization(best_lamb)
        prob = cp.Problem(cp.Minimize(cost), constraints)
        cost = prob.solve(solver=cp.MOSEK, verbose=False)
        if prob.status != 'optimal' or cost == float('inf'):
            raise cp.SolverError

        # Resulting continuous-time parameters (P is the Lyapunov matrix, K the tube controller).
        self.X = X.value
        self.P = np.linalg.pinv(self.X)
        self.K = Y.value @ self.P

        self.c_js = np.zeros(self.p)

        # Constraint tightening factors, one per polytopic constraint row.
        for j in range(self.p):
            self.c_js[j] = np.linalg.norm((self.L_x[j, :] + self.L_u[j, :] @ self.K) @ sqrtm(self.X))

        c_max = max(self.c_js)
        w_bar_c = np.sqrt(np.max(np.linalg.eig(self.Ec.T @ self.P @ self.Ec)[0]))

        # Get Discrete-time system values
        self.rho = np.exp(-self.rho_c * self.dt)
        self.w_bar = w_bar_c * (1 - self.rho) / self.rho_c  # even using rho_c from the paper yields different w_bar
        # self.w_bar = max(self.w_bar, self.max_w)
        horizon_multiplier = (1 - self.rho**self.horizon) / (1 - self.rho)
        self.s_bar_f = horizon_multiplier * self.w_bar
        # assert self.s_bar_f > self.max_w * horizon_multiplier, f'[ERROR] s_bar_f ({self.s_bar_f}) is too small with respect to max_w ({self.max_w}).'
        # assert self.max_w is too large and will overwhelm terminal set.' -- NOTE(review): original commented-out assert kept below verbatim.
        # assert self.max_w * horizon_multiplier < 1.0, '[ERROR] max_w is too large and will overwhelm terminal set.'
        self.gamma = 1 / c_max - self.s_bar_f

        self.delta_loc = (horizon_multiplier * self.w_bar)**2

        print(f'rho: {self.rho}')
        print(f'w_bar: {self.w_bar}')
        print(f's_bar_f: {self.s_bar_f}')
        print(f'gamma: {self.gamma}')

        self.check_decay_rate()
        self.check_lyapunov_func()

    def get_terminal_ingredients(self):
        '''Calculate the terminal ingredients of the MPC optimization.

        Solves a discrete-time algebraic Riccati equation at the reference point to
        obtain the terminal cost matrix P_f and terminal controller K_f.
        '''
        # Solve Lyapunov SDP using linearized discrete-time dynamics based on RK4 for terminal ingredients
        w_none = np.zeros((self.q, 1))
        A_lin = self.Ad(self.x_r - self.X_mid, self.u_r - self.U_mid, w_none).toarray()
        B_lin = self.Bd(self.x_r - self.X_mid, self.u_r - self.U_mid, w_none).toarray()

        self.P_f = solve_discrete_are(A_lin, B_lin, self.Q, self.R)
        btp = np.dot(B_lin.T, self.P_f)
        self.K_f = -np.dot(np.linalg.inv(self.R + np.dot(btp, B_lin)), np.dot(btp, A_lin))
        # self.check_terminal_ingredients()
        # self.check_terminal_constraints()

        if self.integration_algo == 'LTI' and self.use_terminal_set:
            self.get_terminal_constraint()

    def box2polytopic(self, constraint):
        '''Convert constraints into an explicit polytopic form. This assumes that constraints contain the origin.

        Args:
            constraint (Constraint): The constraint to be converted.

        Returns:
            Z_mid (ndarray): The midpoint of the constraint box.
            L (ndarray): The polytopic matrix (one row per one-sided bound).
            l (ndarray): Whether each constraint row is active (1) or degenerate/zero-width (0).
        '''

        Limit = []
        limit_active = []

        # Center the box at the origin; rows are scaled so each bound becomes <= 1.
        Z_mid = (constraint.upper_bounds + constraint.lower_bounds) / 2.0
        Z_limits = np.array([[constraint.upper_bounds[i] - Z_mid[i], constraint.lower_bounds[i] - Z_mid[i]] for i in range(constraint.upper_bounds.shape[0])])

        dim = Z_limits.shape[0]
        eye_dim = np.eye(dim)

        for constraint_id in range(0, dim):
            if Z_limits[constraint_id, 0] != -float('inf'):
                if Z_limits[constraint_id, 0] == 0:
                    limit_active += [0]
                    Limit += [-eye_dim[constraint_id, :]]
                else:
                    limit_active += [1]
                    factor = 1 / Z_limits[constraint_id, 0]
                    Limit += [factor * eye_dim[constraint_id, :]]

            if Z_limits[constraint_id, 1] != float('inf'):
                if Z_limits[constraint_id, 1] == 0:
                    limit_active += [0]
                    Limit += [eye_dim[constraint_id, :]]
                else:
                    limit_active += [1]
                    factor = 1 / Z_limits[constraint_id, 1]
                    Limit += [factor * eye_dim[constraint_id, :]]

        return Z_mid, np.array(Limit), np.array(limit_active)

    def setup_tube_optimization(self, lamb):
        '''Sets up the optimization to find the lyapunov function.

        Args:
            lamb (float): The S-procedure constant.

        Returns:
            X (cp.Variable): The X variable in the optimization.
            Y (cp.Variable): The Y variable in the optimization.
            Cost (cp.Expression): The cost function expression.
            Constraints (list): The list of cvxpy expressions representing the constraints.
        '''

        X = cp.Variable((self.n, self.n), PSD=True, name='X', complex=False)
        Y = cp.Variable((self.m, self.n), name='Y', complex=False)

        # Maximizing log det(X) maximizes the tube volume.
        Cost = -cp.log_det(X)

        Constraints = []

        x_test = np.zeros((self.n, 1))
        u_test = self.U_EQ
        w_test = np.zeros((self.q, 1))

        # Enforce the LMIs at each vertex of the parameter set Theta.
        for angle in self.Theta:
            if self.env.NAME == Environment.CARTPOLE or (self.env.NAME == Environment.QUADROTOR and self.env.QUAD_TYPE in [2, 4]):
                x_test[-2] = angle
            else:
                x_test[-4] = angle
                x_test[-5] = angle
                x_test[-6] = angle
            A_theta = self.Ac(x_test, u_test - self.U_mid, w_test).toarray()
            B_theta = self.Bc(x_test, u_test - self.U_mid, w_test).toarray()

            AXBY = A_theta @ X + B_theta @ Y

            # Contraction LMI and S-procedure disturbance LMI.
            constraint_1 = AXBY + AXBY.T + 2 * self.rho_c * X
            constraint_2 = cp.bmat([[AXBY + AXBY.T + lamb * X, self.Ec], [self.Ec.T, -lamb * np.eye(self.q)]])

            Constraints += [constraint_1 << 0]
            Constraints += [constraint_2 << 0]

        # Constraint-tightening LMIs, one per polytopic constraint row.
        for j in range(0, self.p):
            LXLY = self.L_x[j:j + 1, :] @ X + self.L_u[j:j + 1, :] @ Y

            constraint_3 = cp.bmat([[np.array([[1]]), LXLY], [LXLY.T, X]])
            Constraints += [constraint_3 >> 0]

        return X, Y, Cost, Constraints

    def randsphere(self, num, dim, r):
        '''This function returns a num by dim array in which
        each of the num rows has the dim Cartesian coordinates
        of a random point uniformly-distributed over the
        interior of a dim-dimensional hypersphere with
        radius r and center at the origin.

        Args:
            num (int): The number of vectors.
            dim (int): The dimension of the hypersphere.
            r (float): The radius of the hypersphere.

        Returns:
            vectors (ndarray): The resulting random points inside the hypersphere.
        '''

        vectors = []

        while len(vectors) < num:
            u = np.random.normal(0, 1, dim)  # an array of d normally distributed random variables
            norm = np.sum(u**2)**(0.5)
            # Scale by rand()^(1/dim) so points are uniform in volume, not just on the shell.
            radius = r * np.random.rand()**(1.0 / dim)
            vec = radius * u / norm
            vectors.append(vec)

        return np.vstack(vectors)

    def check_decay_rate(self):
        '''Check the decay rate.

        Asserts that the closed-loop continuous-time dynamics contract at rate rho_c
        (up to a small numerical tolerance) at every vertex of Theta.
        '''

        x_test = np.zeros((self.n, 1))
        u_test = self.U_EQ
        w_test = np.zeros((self.q, 1))

        X_sqrt = sqrtm(self.X)
        P_sqrt = sqrtm(self.P)
        for angle in self.Theta:
            if self.env.NAME == Environment.CARTPOLE or (self.env.NAME == Environment.QUADROTOR and self.env.QUAD_TYPE in [2, 4]):
                x_test[-2] = angle
            else:
                x_test[-4] = angle
                x_test[-5] = angle
                x_test[-6] = angle
            A_theta = self.Ac(x_test, u_test - self.U_mid, w_test).toarray()
            B_theta = self.Bc(x_test, u_test - self.U_mid, w_test).toarray()
            left_side = max(np.linalg.eig(X_sqrt @ (A_theta + B_theta @ self.K).T @ P_sqrt + P_sqrt @ (A_theta + B_theta @ self.K) @ X_sqrt)[0]) + 2 * self.rho_c
            assert left_side <= 0.0001, f'[ERROR] The solution {left_side} is not within the tolerance {0.0001}'

    def check_lyapunov_func(self):
        '''Check the incremental Lyapunov function.

        Monte-Carlo check: samples states inside the tube and bounded disturbances,
        and prints the fractions of samples satisfying the contraction condition,
        membership in the sub-level set, and robust invariance.
        '''

        # select the number of random vectors to check
        num_random_vectors = 10000

        # Sample random points inside the set V_delta(x, z) <= delta_loc
        delta_x = self.randsphere(num_random_vectors, self.n, self.delta_loc).T
        dx_transform = np.linalg.inv(sqrtm(self.P)) @ delta_x
        dx_transform = self.x_r[:, None] + dx_transform  # transform point from error to actual state

        # sample random disturbance bounded by max_w
        w_dist = self.randsphere(num_random_vectors, self.q, self.max_w).T

        # set arbitrary v that satisfies the constraints for testing
        v = np.array(self.constraints.input_constraints[0].upper_bounds) / 10

        # initialize counters
        num_valid = 0
        inside_set = 0
        is_invariant = 0

        for i in range(num_random_vectors):
            # get random state
            x_i = dx_transform[:, i]

            # set up control inputs (u_r is required to get f_kappa(0, 0) = 0)
            u_x = self.K @ x_i + v + self.u_r
            u_z = self.K @ self.x_r + v + self.u_r

            # get dynamics
            w_none = np.zeros((self.q, 1))
            x_dot = np.squeeze(self.f(x_i - self.X_mid, u_x - self.U_mid, w_none).toarray())
            z_dot = np.squeeze(self.f(self.x_r - self.X_mid, u_z - self.U_mid, w_none).toarray())

            # evaluate Lyapunov function and its time derivative
            V_d = (x_i - self.x_r).T @ self.P @ (x_i - self.x_r)
            dVdt = (x_i - self.x_r).T @ self.P @ (x_dot - z_dot)

            # Check incremental Lyapunov function condition
            if dVdt <= -self.rho_c * V_d:
                num_valid += 1

            # check if states are inside V_d(x_i, z) <= delta_loc
            if V_d <= self.delta_loc:
                inside_set += 1

            # get next state
            x_plus = np.squeeze(self.disc_f(x_i - self.X_mid, u_x - self.U_mid, w_dist[:, i]).toarray())
            V_d_plus = (x_plus - self.x_r).T @ self.P @ (x_plus - self.x_r)

            # check robust control invariance
            if V_d_plus <= self.delta_loc:
                is_invariant += 1

        print('NUM_VALID:', num_valid / num_random_vectors)
        print('INSIDE SET:', inside_set / num_random_vectors)
        print('IS INVARIANT:', is_invariant / num_random_vectors)

    def check_terminal_ingredients(self):
        '''Check the terminal ingredients.

        Monte-Carlo check of the terminal cost Lyapunov decrease and of whether
        disturbed successors remain inside the terminal set.
        '''

        w_none = np.zeros((self.q, 1))
        num_random_vectors = 10000

        # Sample points from gamma^2 * unit sphere
        delta_x = self.randsphere(num_random_vectors, self.n, self.gamma**2).T

        # Transform sampled points into ellipsoid to span the candidate terminal
        # set and shift around reference point x_r
        dx_transform = np.linalg.inv(sqrtm(self.P_f)) @ delta_x
        dx_transform = self.x_r[:, None] + dx_transform

        # sample random disturbance bounded by max_w
        w_dist = self.randsphere(num_random_vectors, self.q, self.max_w).T

        # initialize counter
        num_valid = 0
        inside_set = 0

        for i in range(num_random_vectors):
            # get sampled vector
            x_i = dx_transform[:, i]

            # get terminal control input
            u = self.K_f @ (x_i - self.x_r) + self.u_r

            # simulate system using control input
            x_plus = np.squeeze(self.disc_f(x_i - self.X_mid, u - self.U_mid, w_none).toarray())

            # disturbed x_plus
            x_plus_noisy = np.squeeze(self.disc_f(x_i - self.X_mid, u - self.U_mid, w_dist[:, i]).toarray())

            # evaluate stage cost and terminal costs
            stage = (x_i - self.x_r).T @ self.Q @ (x_i - self.x_r)
            V_f = (x_i - self.x_r).T @ self.P_f @ (x_i - self.x_r)
            V_f_plus = (x_plus - self.x_r).T @ self.P_f @ (x_plus - self.x_r)

            # check Lyapunov condition for terminal cost
            if V_f_plus <= V_f - stage:
                num_valid += 1

            # check if noisy state is still in terminal set
            V_f_plus_noisy = (x_plus_noisy - self.x_r).T @ self.P_f @ (x_plus_noisy - self.x_r)
            if V_f_plus_noisy <= self.gamma**2:
                inside_set += 1

        print('NUM_VALID:', num_valid / num_random_vectors)
        print('INSIDE SET:', inside_set / num_random_vectors)

    def check_terminal_constraints(self,
                                   num_points: int = 40,
                                   ):
        '''
        Check if the provided terminal set contains only valid states using a gridded approach.

        Args:
            num_points (int): The number of points in each dimension to check.

        Raises:
            ValueError: If the terminal set is not contained in the state constraint set,
                or the terminal controller produces inputs outside the input constraints.
        '''

        # Determine if terminal set inside state constraints
        terminal_max = np.sqrt(np.diag(np.linalg.inv(self.P_f / self.gamma**2)))
        terminal_min = -np.sqrt(np.diag(np.linalg.inv(self.P_f / self.gamma**2)))

        max_bounds = np.zeros((self.n))
        min_bounds = np.zeros((self.n))
        for i in range(self.n):
            tighten_by_max = self.c_js[i * 2] * self.s_bar_f
            tighten_by_min = self.c_js[i * 2 + 1] * self.s_bar_f
            max_bounds[i] = 1.0 / self.L_x[i * 2, i] * (self.l_xu[i * 2] - tighten_by_max)
            min_bounds[i] = 1.0 / self.L_x[i * 2 + 1, i] * (self.l_xu[i * 2 + 1] - tighten_by_min)

        if np.any(terminal_max > max_bounds) or np.any(terminal_min < min_bounds):
            raise ValueError('Terminal set is not constrained within the constraint set.')

        # Determine if the maximum input is within input constraints
        x = cp.Variable((self.n, 1))
        C = np.linalg.cholesky(self.P_f).T
        cost = cp.Maximize(self.K_f[0, :] @ x)
        constraint = [cp.norm(C @ x) <= self.gamma]
        prob = cp.Problem(cost, constraint)
        max_input = prob.solve(solver=cp.MOSEK)

        max_bounds = np.zeros((self.m))
        min_bounds = np.zeros((self.m))
        for i in range(self.m):
            tighten_by_max = self.c_js[self.n * 2 + i * 2] * self.s_bar_f
            tighten_by_min = self.c_js[self.n * 2 + i * 2 + 1] * self.s_bar_f
            max_bounds[i] = 1.0 / self.L_u[self.n * 2 + i * 2, i] * (self.l_xu[self.n * 2 + i * 2] - tighten_by_max)
            min_bounds[i] = 1.0 / self.L_u[self.n * 2 + i * 2 + 1, i] * (self.l_xu[self.n * 2 + i * 2 + 1] - tighten_by_min)

        if np.any(max_input + self.u_r > max_bounds + self.U_mid) or np.any(-max_input + self.u_r < min_bounds + self.U_mid):
            raise ValueError(f'Terminal controller causes inputs (max_input: {-max_input+self.u_r[0]}/{max_input+self.u_r[0]}) outside of input constraints (constraints: {min_bounds[0] + self.U_mid[0]}/{max_bounds[0] + self.U_mid[0]}).')

        # Make sure that every vertex is checked
        # NOTE(review): the rounding uses 2 * self.n but the division uses self.n — confirm this is intended.
        num_points = max(2 * self.n, num_points + num_points % (2 * self.n))
        num_points_per_dim = num_points // self.n

        # Create the lists of states to check
        # NOTE(review): only the upper half-box [X_mid, terminal_max + X_mid] is gridded — confirm intended.
        states_to_sample = [np.linspace(self.X_mid[i], terminal_max[i] + self.X_mid[i], num_points_per_dim) for i in range(self.n)]
        states_to_check = cartesian_product(*states_to_sample)

        num_states_inside_set = 0
        failed_checks = 0
        failed_29a = 0
        failed_29b = 0
        failed_29d = 0

        for state in states_to_check:
            terminal_cost = (state - self.X_mid).T @ self.P_f @ (state - self.X_mid)
            in_terminal_set = terminal_cost < self.gamma**2

            if in_terminal_set:
                num_states_inside_set += 1
                failed = False

                # Testing condition 29a
                stable_input = self.K_f @ (state - self.x_r) + self.u_r
                next_state = np.squeeze(self.disc_f(state - self.X_mid, stable_input - self.U_mid, np.zeros((self.q, 1))).toarray())
                stage_cost = (state.T - self.X_mid) @ self.Q @ (state - self.X_mid)
                next_terminal_cost = (next_state - self.X_mid).T @ self.P_f @ (next_state - self.X_mid)

                if terminal_cost - stage_cost != 0 and next_terminal_cost / (terminal_cost - stage_cost) > 1.01:
                    failed_29a += 1
                    failed = True

                # Testing condition 29b
                num_disturbances = 100
                disturbances = self.randsphere(num_disturbances, self.n, self.max_w).T
                for w in range(num_disturbances):
                    disturbed_state = next_state + disturbances[:, w]
                    terminal_cost = (disturbed_state - self.X_mid).T @ self.P_f @ (disturbed_state - self.X_mid)
                    in_terminal_set = terminal_cost < self.gamma**2

                    if not in_terminal_set:
                        failed_29b += 1
                        failed = True
                        break

                # Testing condition 29d
                for j in range(self.p):
                    constraint_satisfaction = self.L_x[j, :] @ (state - self.X_mid) + self.L_u[j, :] @ (stable_input - self.U_mid) - self.l_xu[j] + self.c_js[j] * self.s_bar_f <= 0
                    if not constraint_satisfaction:
                        failed_29d += 1
                        failed = True
                        break

                if failed:
                    failed_checks += 1

        print(f'Number of states checked: {len(states_to_check)}')
        print(f'Number of states inside terminal set: {num_states_inside_set}')
        print(f'Number of checks failed: {failed_checks}')
        print(f'Number of checks failed due to 29a: {failed_29a}')
        print(f'Number of checks failed due to 29b: {failed_29b}')
        print(f'Number of checks failed due to 29d: {failed_29d}')

    def get_terminal_constraint(self):
        '''Calculates the terminal set as a linear constraint.

        Samples states inside the terminal ellipsoid and builds a polytopic
        (A, b) representation of their convex hull.
        '''
        interior_points = []
        for _ in range(self.n_samples):
            state = np.random.uniform(self.state_constraint.lower_bounds, self.state_constraint.upper_bounds)
            if (state - self.X_mid).T @ self.P_f @ (state - self.X_mid) <= self.gamma**2:
                interior_points.append(state)
        self.terminal_set = Polytope(interior_points)
        self.terminal_set.minimize_V_rep()

        self.terminal_A = self.terminal_set.A
        self.terminal_b = self.terminal_set.b

    def load(self,
             path,
             ):
        '''Load values used by the MPSC.

        Args:
            path (str): Path to the required file.
        '''

        # NOTE(review): pickle.load is unsafe on untrusted files — only load trusted parameter files.
        with open(path, 'rb') as f:
            parameters = pickle.load(f)

        self.rho_c = parameters['rho_c']
        self.Theta = parameters['Theta']
        self.X = parameters['X']
        self.K = parameters['K']
        self.P = parameters['P']
        self.delta_loc = parameters['delta_loc']
        self.rho = parameters['rho']
        self.s_bar_f = parameters['s_bar_f']
        self.w_bar = parameters['w_bar']
        self.max_w = parameters['max_w']
        # self.error_parameters = parameters['error_parameters']
        # if self.integration_algo == 'LTI':
        # num_stds = 2
        # else:
        # num_stds = 3
        # def w_func(state, action):
        # input_vec = cs.horzcat(state.T, action.T)
        # return error_function(*self.error_parameters, num_stds, input_vec)
        # self.w_func = w_func
        self.c_js = parameters['c_js']
        self.gamma = parameters['gamma']
        self.P_f = parameters['P_f']
        self.K_f = parameters['K_f']
        self.model_bias = parameters['model_bias']

        self.set_dynamics()

        if self.integration_algo == 'LTI' and self.use_terminal_set is True:
            self.terminal_A = parameters['terminal_A']
            self.terminal_b = parameters['terminal_b']

        # Symbolic copies of the polytopic constraint matrices for the casadi optimizer.
        self.L_x_sym = cs.MX(self.L_x)
        self.L_u_sym = cs.MX(self.L_u)
        self.L_size = np.sum(np.abs(self.L_x), axis=1) + np.sum(np.abs(self.L_u), axis=1)
        self.L_size_sym = cs.MX(self.L_size)
        self.l_sym = cs.MX(self.l_xu)

        self.setup_optimizer()

    def save(self, path):
        '''Save values used by the MPSC.

        Args:
            path (str): Name of the file to be created.
        '''

        parameters = {}
        parameters['rho_c'] = self.rho_c
        parameters['Theta'] = self.Theta
        parameters['X'] = self.X
        parameters['K'] = self.K
        parameters['P'] = self.P
        parameters['delta_loc'] = self.delta_loc
        parameters['rho'] = self.rho
        parameters['s_bar_f'] = self.s_bar_f
        parameters['w_bar'] = self.w_bar
        parameters['max_w'] = self.max_w
        # parameters['error_parameters'] = self.error_parameters
        parameters['c_js'] = self.c_js
        parameters['gamma'] = self.gamma
        parameters['P_f'] = self.P_f
        parameters['K_f'] = self.K_f
        parameters['model_bias'] = self.model_bias

        if self.integration_algo == 'LTI' and self.use_terminal_set is True:
            parameters['terminal_A'] = self.terminal_A
            parameters['terminal_b'] = self.terminal_b

        with open(path, 'wb') as f:
            pickle.dump(parameters, f)

    def setup_casadi_optimizer(self):
        '''Setup the certifying MPC problem.'''

        # Horizon parameter.
        horizon = self.horizon
        nx, nu = self.model.nx, self.model.nu
        # Define optimizer and variables.
        if self.integration_algo == 'LTI':
            opti = cs.Opti('conic')
        elif self.integration_algo == 'rk4':
            opti = cs.Opti()
        # States.
        z_var = opti.variable(nx, horizon + 1)
        # Inputs.
        v_var = opti.variable(nu, horizon)
        # Lyapunov bound.
        s_var = opti.variable(1, horizon + 1)
        # Certified input.
        next_u = opti.variable(nu, 1)
        # Desired input.
        u_L = opti.parameter(nu, 1)
        # Current observed state.
        x_init = opti.parameter(nx, 1)
        # Reference trajectory and predicted LQR gains
        if self.env.TASK == Task.STABILIZATION:
            X_GOAL = opti.parameter(1, nx)
        elif self.env.TASK == Task.TRAJ_TRACKING:
            X_GOAL = opti.parameter(self.horizon, nx)

        # Slack variables are always created so opti_dict has a uniform shape;
        # when constraints are hard, they are pinned to zero.
        if self.soften_constraints:
            slack = opti.variable(1, 1)
            slack_term = opti.variable(1, 1)
        else:
            slack = opti.variable(1, 1)
            slack_term = opti.variable(1, 1)
            opti.subject_to(slack == 0)
            opti.subject_to(slack_term == 0)

        for i in range(self.horizon):
            # Dynamics constraints
            next_state = self.dynamics_func(x0=z_var[:, i], p=v_var[:, i])['xf']
            opti.subject_to(z_var[:, i + 1] == next_state)

            # Lyapunov size increase
            opti.subject_to(s_var[:, i + 1] == self.rho * s_var[:, i] + self.max_w)  # self.w_func(z_var[:, i], v_var[:, i]))
            opti.subject_to(s_var[:, i] <= self.s_bar_f)
            # opti.subject_to(self.w_func(z_var[:, i], v_var[:, i]) <= self.max_w)

            # Constraints
            for j in range(self.p):
                tighten_by = self.c_js[j] * s_var[:, i + 1]
                if self.soften_constraints:
                    opti.subject_to(self.L_x_sym[j, :] @ (z_var[:, i + 1] - self.X_mid) + self.L_u_sym[j, :] @ (v_var[:, i] - self.U_mid) - self.l_sym[j] + tighten_by <= slack)
                    opti.subject_to(slack >= 0)
                else:
                    opti.subject_to(self.L_x_sym[j, :] @ (z_var[:, i + 1] - self.X_mid) + self.L_u_sym[j, :] @ (v_var[:, i] - self.U_mid) - self.l_sym[j] + tighten_by <= 0)

        # Final state constraints
        if self.use_terminal_set:
            if self.integration_algo == 'LTI':
                if self.soften_constraints:
                    opti.subject_to(cs.vec(self.terminal_A @ (z_var[:, -1] - self.X_mid) - self.terminal_b) <= slack_term)
                    opti.subject_to(slack_term >= 0)
                else:
                    opti.subject_to(cs.vec(self.terminal_A @ (z_var[:, -1] - self.X_mid) - self.terminal_b) <= 0)
            elif self.integration_algo == 'rk4':
                terminal_cost = (z_var[:, -1] - self.X_mid).T @ self.P_f @ (z_var[:, -1] - self.X_mid)
                if self.soften_constraints:
                    opti.subject_to(terminal_cost <= self.gamma**2 + slack_term)
                    opti.subject_to(slack_term >= 0)
                else:
                    opti.subject_to(terminal_cost <= self.gamma**2)
        else:
            if self.soften_constraints:
                opti.subject_to(slack_term == 0)

        # Initial state constraints
        opti.subject_to(z_var[:, 0] == x_init)
        opti.subject_to(s_var[:, 0] == 0)

        # Real input
        opti.subject_to(next_u == v_var[:, 0])

        # Create solver (IPOPT solver as of this version).
        if self.integration_algo == 'LTI':
            opts = {'expand': True, 'printLevel': 'none'}
            opti.solver('qpoases', opts)
        elif self.integration_algo == 'rk4':
            opts = {'expand': True,
                    'ipopt.print_level': 0,
                    'ipopt.sb': 'yes',
                    'ipopt.max_iter': 50,
                    'print_time': 0}
            opti.solver('ipopt', opts)
        self.opti_dict = {
            'opti': opti,
            'z_var': z_var,
            'v_var': v_var,
            's_var': s_var,
            'u_L': u_L,
            'x_init': x_init,
            'next_u': next_u,
            'X_GOAL': X_GOAL,
            'slack': slack,
            'slack_term': slack_term,
        }

        # Cost (# eqn 5.a, note: using 2norm or sqrt makes this infeasible).
        cost = self.cost_function.get_cost(self.opti_dict)
        if self.soften_constraints:
            cost = cost + self.slack_cost * slack
            cost = cost + self.slack_cost * slack_term
        opti.minimize(cost)
        self.opti_dict['cost'] = cost

    def setup_acados_optimizer(self):
        '''Set up the certifying MPC problem using the acados OCP solver.'''
        # create ocp object to formulate the OCP
        ocp = AcadosOcp()

        # Setup model
        model = AcadosModel()
        model.x = self.model.x_sym
        model.u = self.model.u_sym
        model.f_expl_expr = self.model.x_dot

        # Build xdot symbols matching the environment's state dimension.
        if self.env.NAME == Environment.CARTPOLE:
            x1_dot = cs.MX.sym('x1_dot')
            v_dot = cs.MX.sym('v_dot')
            theta1_dot = cs.MX.sym('theta1_dot')
            dtheta_dot = cs.MX.sym('dtheta_dot')
            xdot = cs.vertcat(x1_dot, v_dot, theta1_dot, dtheta_dot)
        elif self.env.NAME == Environment.QUADROTOR and self.env.QUAD_TYPE in [2, 4]:
            x1_dot = cs.MX.sym('x1_dot')
            vx_dot = cs.MX.sym('vx_dot')
            z1_dot = cs.MX.sym('z1_dot')
            vz_dot = cs.MX.sym('vz_dot')
            theta1_dot = cs.MX.sym('theta1_dot')
            dtheta_dot = cs.MX.sym('dtheta_dot')
            xdot = cs.vertcat(x1_dot, vx_dot, z1_dot, vz_dot, theta1_dot, dtheta_dot)
        else:
            x1_dot = cs.MX.sym('x1_dot')
            vx_dot = cs.MX.sym('vx_dot')
            y1_dot = cs.MX.sym('y1_dot')
            vy_dot = cs.MX.sym('vy_dot')
            z1_dot = cs.MX.sym('z1_dot')
            vz_dot = cs.MX.sym('vz_dot')
            phi1_dot = cs.MX.sym('phi1_dot')  # Roll
            theta1_dot = cs.MX.sym('theta1_dot')  # Pitch
            psi1_dot = cs.MX.sym('psi1_dot')  # Yaw
            p1_body_dot = cs.MX.sym('p1_body_dot')  # Body frame roll rate
            q1_body_dot = cs.MX.sym('q1_body_dot')  # body frame pitch rate
            r1_body_dot = cs.MX.sym('r1_body_dot')  # body frame yaw rate
            xdot = cs.vertcat(x1_dot, vx_dot, y1_dot, vy_dot, z1_dot, vz_dot, phi1_dot, theta1_dot, psi1_dot, p1_body_dot, q1_body_dot, r1_body_dot)

        model.xdot = xdot
        model.f_impl_expr = model.xdot - model.f_expl_expr
        model.name = 'mpsf'
        ocp.model = model

        nx, nu = self.model.nx, self.model.nu
        ny = nx + nu

        ocp.dims.N = self.horizon

        # set cost module
        ocp.cost.cost_type = 'LINEAR_LS'

        # Only the input deviation is penalized (state weight is zero).
        Q_mat = np.zeros((nx, nx))
        R_mat = np.eye(nu)
        ocp.cost.W = block_diag(Q_mat, R_mat)

        ocp.cost.Vx = np.zeros((ny, nx))
        ocp.cost.Vu = np.zeros((ny, nu))
        ocp.cost.Vu[nx:nx + nu, :] = np.eye(nu)

        # Updated on each iteration
        ocp.cost.yref = np.concatenate((self.model.X_EQ, self.model.U_EQ))

        # set constraints
        ocp.constraints.constr_type = 'BGH'
        ocp.constraints.x0 = self.model.X_EQ
        ocp.constraints.C = self.L_x
        ocp.constraints.D = self.L_u
        ocp.constraints.lg = -1000 * np.ones((self.p))
        ocp.constraints.ug = np.zeros((self.p))

        # Slack
        if self.soften_constraints:
            ocp.constraints.Jsg = np.eye(self.p)
            ocp.cost.Zu = self.slack_cost * np.ones(self.p)
            ocp.cost.Zl = self.slack_cost * np.ones(self.p)
            ocp.cost.zl = self.slack_cost * np.ones(self.p)
            ocp.cost.zu = self.slack_cost * np.ones(self.p)

        # Options
        ocp.solver_options.qp_solver = 'FULL_CONDENSING_HPIPM'
        ocp.solver_options.hessian_approx = 'GAUSS_NEWTON'
        ocp.solver_options.hpipm_mode = 'BALANCE'
        ocp.solver_options.integrator_type = 'ERK'
        ocp.solver_options.nlp_solver_type = 'SQP_RTI'

        # set prediction horizon
        ocp.solver_options.tf = self.dt * self.horizon

        solver_json = 'acados_ocp_mpsf.json'
        ocp_solver = AcadosOcpSolver(ocp, json_file=solver_json, generate=True, build=True)

        # Decaying cost weights over the MPSC cost horizon; zero weight afterwards.
        for stage in range(self.mpsc_cost_horizon):
            ocp_solver.cost_set(stage, 'W', (self.cost_function.decay_factor**stage) * ocp.cost.W)

        for stage in range(self.mpsc_cost_horizon, self.horizon):
            ocp_solver.cost_set(stage, 'W', 0 * ocp.cost.W)

        # Precompute the tightened constraint bounds stage-by-stage (tube grows with s_var).
        s_var = np.zeros((self.horizon + 1))
        g = np.zeros((self.horizon, self.p))

        for i in range(self.horizon):
            s_var[i + 1] = self.rho * s_var[i] + self.max_w
            for j in range(self.p):
                tighten_by = self.c_js[j] * s_var[i + 1]
                g[i, j] = (self.l_xu[j] - tighten_by)
            g[i, :] += (self.L_x @ self.X_mid) + (self.L_u @ self.U_mid)
            ocp_solver.constraints_set(i, 'ug', g[i, :])

        self.ocp_solver = ocp_solver