MPC_ARPO_Project/src/trajectorySimulate.py at master · IsaacTroche1/MPC_ARPO_Project · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
"""
This function performs trajectory simulation using an MPC controller on the DISCRETE-TIME, LINEAR Clohessy-Wiltshire
equations of relative motion.

Further documentation describing these objects can be found in the module src.mpcsim

The function utilizes a small selection of helpers to aid readability/conciseness.
These can be found in the module src.simhelpers
"""

import sympy as sy
import osqp
from filterpy.kalman import UnscentedKalmanFilter, MerweScaledSigmaPoints

from src.simhelpers import *

def trajectorySimulate(sim_conditions:SimConditions, mpc_params:MPCParams, fail_params:FailsafeParams, debris:Debris):
    """
    Performs discrete-time linear simulation

    :param sim_conditions: A SimConditions object representing general simulation conditions (initial state, orbital parameters, etc.)
    :param mpc_params: An MPCParams object containing the tunable parameters of the MPC controller to be used during simulation
    :param fail_params: A FailsafeParams object containing the tunable parameters of the failsafe controllers to be during simulation
    :param debris: A Debris object containing information describing the debris to be avoided by the control algorithm during simulation
    :return: A SimRun object with the necessary telemetry for data reduction and visualization/animation
    """

    random.seed(123)  # Uncomment for repeatable behavior

    isDeltaV = sim_conditions.isDeltaV
    inTrack = sim_conditions.inTrack
    distTol = sim_conditions.suc_cond[0]
    angTol = sim_conditions.suc_cond[1]
    noise = sim_conditions.noise

    # Noise characteristics
    if noise is not None:
        sigMat = sim_conditions.noise.constructSigMat()
        noiseRepeat = sim_conditions.noise.noise_length
    else:
        sigMat = np.diag([0.,0.,0.,0.])
        noiseRepeat = 1


    # Simulation Constants
    gam = sim_conditions.los_ang
    rp = sim_conditions.r_p
    rtot = sim_conditions.r_tol
    phi = sim_conditions.hatch_ofst
    n = sim_conditions.mean_mtn
    T = sim_conditions.time_stp

    time_final = sim_conditions.T_final
    nsimD = int(time_final / T)

    # Initial and reference states
    x0 = sim_conditions.x0
    xr = sim_conditions.xr

    # Debris setup
    if debris is not None:
        #Debris bounding box
        sqVerts = debris.constructVertArr()
        center = debris.center
        sideLength = debris.side_length
        hasDebris = True
    else:
        center = (-np.inf,-np.inf)
        sideLength = 0
        hasDebris = False

    # Continuous-time linear CW equations
    Ap = np.array([
    [0.,      0.,     1., 0.],
    [0.,      0.,     0., 1.],
    [3*n**2,      0.,     0., 2*n],
    [0.,  0.,     -2*n, 0.],
    ])

    Adi = np.eye(2)
    ndi = Adi.shape[0]

    Bp = np.array([
    [0.,      0.],
    [0.,  0.],
    [1.,  0.],
    [0.,     1.],
    ])
    [nx, nu] = Bp.shape

    Cm = np.array([
    [1., 0., 0., 0.],
    [0., 1., 0., 0.],
    ])

    [nx, nu] = Bp.shape
    nym = Cm.shape[0]

    # Discretize
    Ad = sparse.csc_matrix(sp.linalg.expm(Ap*T))
    x = sy.symbols('x')
    Ax = sy.Matrix(Ap)*x
    eAx = Ax.exp()
    eAxInt = np.empty([Ap.shape[0],Ap.shape[0]])
    for (i,j), func_ij in np.ndenumerate(eAx):
        func = sy.lambdify((x),func_ij)
        eAxInt[i,j] = sp.integrate.quad(func,0.,T)[0]
    if not isDeltaV:
        Bd = sparse.csc_matrix(eAxInt@Bp)
    else:
        Bd = sparse.csc_matrix(Ad@np.vstack([np.zeros([2,2]),np.eye(2)]))

    # State observer system for disturbance estimation
    Ao = sp.linalg.block_diag(Ad.toarray(), Adi)
    Ao[0,4] = 1.
    Ao[1,5] = 1.
    Bou = np.vstack([Bd.toarray(), np.zeros([2, 2])])
    Co = np.hstack([Cm, np.zeros([2,2])])

    # Measurement and state transition model for unscented kalman filter
    def fx(x, u):
        return Ao@x + Bou@u

    def hx(x):
        ymeas = np.empty(nym)
        ymeas[0] = np.linalg.norm(x[:2])
        ymeas[1] = math.atan2(x[1],x[0])
        return ymeas

    sig_points = MerweScaledSigmaPoints(6, alpha=0.1, beta=2., kappa=-1)

    # Define initial state constraints
    C_11 = math.sin(phi+gam)/((rp-rtot)*math.sin(gam))
    C_12 = -math.cos(phi+gam)/((rp-rtot)*math.sin(gam))
    C_21 = -math.sin(phi-gam)/((rp-rtot)*math.sin(gam))
    C_22 = math.cos(phi-gam)/((rp-rtot)*math.sin(gam))
    if (x0[0] - (center[0] + sideLength / 2) < 0 and x0[0] - (center[0] - sideLength / 2) > 0):
        slope = (x0[1] - sqVerts[1, 1]) / (x0[0] - sqVerts[1, 0])
        inter = -slope * x0[0] + x0[1]
    elif (hasDebris):
        slope = (x0[1] - sqVerts[0, 1]) / (x0[0] - sqVerts[0, 0])
        inter = -slope * x0[0] + x0[1]
    else:
        slope = 0
    C = np.array([
            [C_11, C_12, 0., 0.],
            [C_21, C_22, 0., 0.],
            [1., 0., 0., 0.],
            [0., 0., 1., 1.],
            [-slope, 1., 0., 0.],
                ])

    if (inTrack):
        C[2,:] = np.array([0.,1.,0.,0.])

    ny = C.shape[0]


    # Define input constraints
    ulim = mpc_params.u_lim
    umin = np.hstack([-ulim[0], -ulim[1], np.zeros(ny)])
    umax = np.hstack([ulim[0], ulim[1], np.inf*np.ones(ny)])
    Vecr = mpc_params.V_ecr


    D = np.hstack([np.zeros([ny,nu]),np.diag(Vecr)])

    # State and input penalty matrices for MPC formulation
    Q = mpc_params.Q_state
    Ru = mpc_params.R_input
    Rs = mpc_params.R_slack
    R = sparse.block_diag([Ru,Rs])

    # Virtual LQR Controller for stabilization
    S = sp.linalg.solve_discrete_are(Ad.toarray(), Bd.toarray(), Q.toarray(), Ru.toarray())
    K = np.asarray(np.linalg.inv(Ru + np.transpose(Bd)@S@Bd)@(np.transpose(Bd)@S@Ad))
    QN = S

    # LQR Failsafe (homing controller)
    Qf = fail_params.Q_fail
    Rf = fail_params.R_fail
    Crefx = fail_params.C_int
    nr = Crefx.shape[0]

    Kf = ct.dlqr(Ad.toarray(),Bd.toarray(),Qf,Rf, integral_action=Crefx)[0]
    Kpf = Kf[:,:nx]
    Kif = Kf[:,nx:nx+nr]

    # Deadbeat debris avoidance maneuver
    Crefy = np.array([[0.,1.,0.,0.]])
    Bd_prune = np.reshape(Bd[:, 1], (nx, 1))[[1, 3],]
    Ad_prune = Ad[[1, 3], :][:, [1, 3]]
    C_prune = np.array([1, 0])

    A_aug = np.block([[Ad_prune.toarray(), np.zeros([2, 1])], [C_prune, np.eye(1)]])
    B_aug = np.block([[Bd_prune.toarray()], [np.zeros([1, 1])]])
    des_eig = np.array([0, 0, 0])
    K_prune = ct.acker(A_aug, B_aug, des_eig)

    K_total = np.zeros([nu, nx])
    K_total[1, 1] = K_prune[0, 0]
    K_total[1, 3] = K_prune[0, 1]
    K_i = np.vstack([0, K_prune[0, 2]])

    #For debugging
    if ~(np.all(np.linalg.eigvals(S) > 0)):
        raise Exception("Riccati solution not positive definite")


    # MPC horizons
    Nx = mpc_params.Nx
    Nc = mpc_params.Nc
    Nb = mpc_params.Nb

    # Quadratic objective for QP problem
    P = sparse.block_diag([sparse.kron(sparse.eye(Nx), Q), QN, sparse.kron(sparse.eye(Nc), R), 1*sparse.eye(ndi)], format='csc')
    # Linear objective for QP problem
    q = np.hstack([np.kron(np.ones(Nx), -Q@xr), -QN@xr, np.zeros(Nc*(nu+ny)), np.zeros(ndi)])
    # Linear dynamics constraint for QP problem
    Aeq = constructOsqpAeq(mpc_params, Ad, Bd, K, ny)   #Helper function
    leq = np.hstack([-x0, np.zeros(Nx*nx)])
    ueq = leq

    # Initialize state and input constraints for QP problem
    Aineq2 = sparse.kron(sparse.eye(Nc), sparse.eye(nu+ny))
    Block12 = sparse.vstack([np.kron(np.eye(Nc),D), np.kron(np.zeros([(Nx+1)-Nc,Nc]),np.zeros([ny,nu+ny]))])
    Block21 = sparse.coo_matrix((Nc*(nu+ny),(Nx+1)*nx))
    AextCol = sparse.vstack([np.zeros([nx, ndi]), np.kron(np.ones([Nx, 1]), np.vstack([np.eye(ndi), np.zeros([nx - ndi, ndi])])),np.kron(np.zeros([(Nx + 1), 1]), np.zeros([ny, ndi])), np.kron(np.zeros([(Nc), 1]), np.zeros([nu + ny, ndi]))])
    AextRow = sparse.csc_matrix(np.hstack([np.kron(np.ones([1, Nx + 1]), np.zeros([ndi, nx])), np.kron(np.ones([1, Nc]), np.zeros([ndi, nu + ny])),np.eye(ndi)]))

    block_mats = (Aeq, Aineq2, Block12, Block21, AextRow, AextCol, C)
    u_lim = (umin, umax)

    A, lineq, uineq = configureDynamicConstraints(sim_conditions, mpc_params, debris, np.hstack([np.copy(x0),0,0]), block_mats, u_lim)  #Helper function
    l = np.hstack([leq, lineq])
    u = np.hstack([ueq, uineq])

    block_mats = (Aeq,Aineq2,Block12,Block21,AextRow,AextCol,C)
    u_lim = (umin,umax)

    # Create an OSQP object
    prob = osqp.OSQP()

    #Setup workspace
    prob.setup(P, q, A, l, u, warm_start=True, verbose = False)

    # Initial conditions for simulation telemetry
    xtrue0 = x0
    xest0 = np.hstack([x0, 0., 0.]) #note this assumes we don't know the initial distrubance value (zeros)
    Pest = sp.linalg.block_diag(1e-20*np.eye(nx),np.eye(ndi))

    # This is a mess :( TODO refactor
    nsim = nsimD
    iterm = nsim
    ifailsd = []
    ifailsf = []
    impc = []
    xtrueP = np.empty([nx,nsim+1])
    xestO = np.empty([nx+ndi,nsim+1])
    xintf = 0
    noiseStored = np.empty([nx,nsim+1])
    ctrls = np.empty([nu,nsim+1])
    ctrls[:, 0] = np.array([0., 0.])
    xv1n = np.empty([1,nsim+1])
    xv1n[0,0] = xtrueP[2,0] + xtrueP[3,0]
    xtrueP[:,0] = xtrue0
    xestO[:,0] = xest0
    noiseVec = sigMat@random.normal(0, 1, 4)
    noiseStored[:,0] = noiseVec

    # Noise covariance setup
    Bnoise = np.vstack([np.zeros([nx,ndi]), (T)*np.eye(ndi)]) #try with T*eye
    Qw = np.diag([sigMat[0,0]**2, sigMat[1,1]**2])
    Qw = Bnoise@Qw@np.transpose(Bnoise)
    Qw[:4,:][:,:4] = 0.001*np.eye(nx)

    # Setup UKF
    kf = UnscentedKalmanFilter(dim_x=6, dim_z=2, dt=T, fx=fx, hx=hx, points=sig_points)
    kf.x = xest0
    kf.P = Pest
    kf.R = np.zeros([nym, nym])
    kf.Q = Qw

    # Closed-loop simuation
    for i in range(nsim):

        # Terminate simulation conditions
        if (not inTrack and (np.linalg.norm(xtrueP[0:2,i]) < rp or xtrueP[0,i] < rp - rtot)):
            iterm = i
            break
        elif (inTrack and (np.linalg.norm(xtrueP[0:2,i]) < rp or xtrueP[1,i] < rp - rtot)):
            iterm = i
            break

        # Attempt to solve QP problem
        res = prob.solve()

        # Check solver status to determine action
        if res.info.status != 'solved':
            if (xestO[0,i] - (center[0] + sideLength/2) < 0 and xestO[0,i] - (center[0] - sideLength/2) > 0 and xestO[1,i] < (center[1] + sideLength/2) and xestO[1,i] > (center[1] - sideLength/2)):
                # Use deadbeat collision avoidance
                ifailsd.append(i)
                xintf = xintf + Crefy@xestO[:4,i] - (center[1] + sideLength/2) #theres a potential bug here with the sign of the control, test in animation
                ctrl = -K_total@xestO[:4,i] - K_i@xintf
            else:
                # Use failsafe (homing) controller
                ifailsf.append(i)
                xintf = xintf + Crefx@xestO[:4,i] - xr[0]
                ctrl = -Kpf@xestO[:4,i] - Kif@xintf
        else:
            # Use MPC controller
            impc.append(i)
            xintf = 0
            ctrl = res.x[(Nx+1)*nx:(Nx+1)*nx+nu]

        # Scale input if desired exceeds max/min
        if (np.linalg.norm(ctrl) > umax[0]):
            ctrl[0] = ctrl[0]*(umax[0]/np.linalg.norm(ctrl))
            ctrl[1] = ctrl[1]*(umax[0]/np.linalg.norm(ctrl))


        # Apply chosen control input to the plant
        ctrls[:,i+1] = ctrl
        xtrueP[:,i+1] = Ad@xtrueP[:,i] + Bd@ctrls[:,i] + noiseVec
        xv1n[0,i+1] = np.absolute(xtrueP[2,i+1]) + np.absolute(xtrueP[3,i+1])


        # Measurement and state estimation
        if (noise is not None):
            ymeas = np.empty(nym)
            ymeas[0] = np.linalg.norm(xtrueP[:2,i+1])
            ymeas[1] = math.atan2(xtrueP[1,i+1], xtrueP[0,i+1])
            kf.predict(ctrls[:,i])
            kf.update(z=ymeas)
            xestO[:, i+1] = kf.x
        else:
            xestO[:,i+1] = np.hstack([xtrueP[:,i+1], [0.,0.]])

        # Update initial state in QP problem
        l[:nx] = -xestO[:4,i+1]
        u[:nx] = -xestO[:4,i+1]
        prob.update(l=l, u=u)

        # Reconfigure constraints
        A, lineq, uineq = configureDynamicConstraints(sim_conditions, mpc_params, debris, xestO[:,i+1], block_mats, u_lim)
        l[(Nx+1)*nx:] = lineq
        u[(Nx+1)*nx:] = uineq
        prob.update(Ax = A.data, l=l, u=u)

        # Inject noise into plant based on noise interval
        if ((i+1) % noiseRepeat == 0):
            noiseVec = sigMat@random.normal(0, 1, 4)
            noiseStored[:,i+1] = noiseVec
        else:
            noiseVec = noiseVec
            noiseStored[:,i+1] = noiseVec

    # Construct piecewise trajectory (based on controller used)
    xtruePiece = np.empty([nx,iterm])
    xtruePiece[:,impc] = xtrueP[:,impc]
    xtruePiece[:,ifailsf] = xtrueP[:,ifailsf]
    xtruePiece[:,ifailsd] = xtrueP[:,ifailsd]

    # Construct velocity 1-norms
    xv1n_test = np.empty(xtruePiece.shape[1])
    for i in range(xtruePiece.shape[1]):
        xv1n_test[i] = np.absolute(xtruePiece[2,i]) + np.absolute(xtruePiece[3,i])

    # Decide if trajectory was successful
    succTraj = False
    for i in range(iterm-1,0,-1):
        dist = np.linalg.norm(xtruePiece[0:2,i] - xr[0:2])
        ang = abs(math.atan(xtruePiece[3,i]/xtruePiece[2,i]))*(180/np.pi)
        if (dist <= distTol and ang <= angTol):
            succTraj = True
            break

    # Catalogue controller used at each point
    controllerSeq = np.empty(iterm)
    for i in impc:
        controllerSeq[i] = 1    # A value of 1 means the MPC controller was used at this time step
    for i in ifailsf:
        controllerSeq[i] = 2    # A value of 2 means the LQR failsafe (homing) controller was used at this time step
    for i in ifailsd:
        controllerSeq[i] = 3    # A value of 3 means the deadbeat debris avoidance controller was used at this time step

    sim_run = SimRun(iterm, succTraj, xtruePiece, xestO, ctrls, controllerSeq, noiseStored)
    return sim_run