Machine Learning for Engineering¶

Dynamical System: Regression models¶

Instructor: Daning Huang¶

$$ \newcommand\norm[1]{{\left\lVert #1 \right\rVert}} \newcommand{\bR}{\mathbb{R}} \newcommand{\vf}{\mathbf{f}} \newcommand{\vg}{\mathbf{g}} \newcommand{\vv}{\mathbf{v}} \newcommand{\vw}{\mathbf{w}} \newcommand{\vx}{\mathbf{x}} \newcommand{\vy}{\mathbf{y}} \newcommand{\vA}{\mathbf{A}} \newcommand{\vB}{\mathbf{B}} \newcommand{\vU}{\mathbf{U}} \newcommand{\vV}{\mathbf{V}} \newcommand{\vW}{\mathbf{W}} \newcommand{\vX}{\mathbf{X}} \newcommand{\vtf}{\boldsymbol{\phi}} \newcommand{\vty}{\boldsymbol{\psi}} \newcommand{\vtF}{\boldsymbol{\Phi}} \newcommand{\vtS}{\boldsymbol{\Sigma}} \newcommand{\vtL}{\boldsymbol{\Lambda}} \newcommand{\cF}{\mathcal{F}} \newcommand{\cK}{\mathcal{K}} $$

TODAY: Dynamical System¶

  • Simple linear regression
    • The issues
  • Sparse identification of nonlinear dynamics (SINDy)
    • Sparsity-promotion
    • Tackling noise
    • Handling parameters

References¶

  • [DMSC] Part 3
  • [sindy2016] DOI: pnas.1517384113
  • [PySINDy] DOI: 10.21105/joss.03994 and PySINDy@github
  • See text for more references

Previously...¶

We have identified the basic problem to solve $$ \dot{x} = F(x) $$ where $x\in\bR^N$ consists of the full or partial state measurements, or reduced-order coordinates (e.g. after linear projection or autoencoder).

The nonlinear system function $F$ needs to be identified from $K$ trajectories $D=\{D_i\}_{i=1}^K$, where the $i$th trajectory, containing $L_i+1$ samples, is denoted $$ D_i=\left\{\left( t_j^{(i)},x_j^{(i)} \right)\right\}_{j=0}^{L_i} $$

Simple Linear Regression¶

Intuitively, we would like to have $$ \dot{x}_j^{(i)} = F(x_j^{(i)}) $$ for all data points.

If the time derivative is known, then this looks exactly like a linear regression problem.

Let's

  • Assume $$ \begin{bmatrix} F_1(x) \\ F_2(x) \\ \vdots \\ F_N(x) \end{bmatrix} = \begin{bmatrix} \xi_{11} & \xi_{12} & \cdots & \xi_{1M} \\ \xi_{21} & \xi_{22} & \cdots & \xi_{2M} \\ \vdots & \vdots & \ddots & \vdots \\ \xi_{N1} & \xi_{N2} & \cdots & \xi_{NM} \end{bmatrix} \begin{bmatrix} \theta_1(x) \\ \theta_2(x) \\ \vdots \\ \theta_M(x) \end{bmatrix} \quad\mbox{or}\quad F(x)=\Xi^T\theta(x) $$ where $\Xi\in\bR^{M\times N}$ is the weight matrix to be fitted from data and $\theta(x) \in \bR^M$ is our familiar feature vector, such as polynomials $\theta_i(x)=x^{i-1}$.
  • Approximate the time derivative by, e.g., finite difference, $$ \dot{x}_j^{(i)} \approx \frac{x_j^{(i)}-x_{j-1}^{(i)}}{t_j^{(i)}-t_{j-1}^{(i)}} $$
  • For conciseness, consider just one trajectory - so we drop the $(i)$ in the following.

Then, given the sampled trajectory, one can form the linear regression problem $$ \min_{\Xi} \norm{\dot X - \Theta(X)\Xi} $$ where $X$ and $\dot{X}$ contain the data row-wise, i.e., $$ X^T = [x_0,x_1,\cdots,x_{L}],\quad \dot{X}^T = [\dot{x}_0,\dot{x}_1,\cdots,\dot{x}_{L}] $$ and $$ \Theta(X)^T = [\theta(x_0),\theta(x_1),\cdots,\theta(x_{L})] $$

We should know very well by now how to solve this minimization problem, $$ \Xi = \Theta^+\dot{X} $$ where $\Theta^+$ is the pseudo-inverse of $\Theta(X)$.
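Before turning to PySINDy, here is a minimal NumPy sketch of this plain least-squares fit for a single trajectory, with an illustrative polynomial feature map (the names fit_linear_sindy and theta_poly are hypothetical, not part of the notebook's helpers):

import numpy as np

def fit_linear_sindy(x, t, theta):
    # x: (L+1, N) states sampled at times t: (L+1,); theta maps states to an (L+1, M) feature matrix
    dxdt = np.diff(x, axis=0) / np.diff(t)[:, None]    # first-order finite difference, shape (L, N)
    Theta = theta(x[:-1])                              # features at the same samples, shape (L, M)
    Xi, *_ = np.linalg.lstsq(Theta, dxdt, rcond=None)  # Xi = Theta^+ dX, shape (M, N)
    return Xi

# Illustrative quadratic feature map for a 2-state system: [x, y, x^2, xy, y^2]
theta_poly = lambda X: np.column_stack(
    [X[:, 0], X[:, 1], X[:, 0]**2, X[:, 0]*X[:, 1], X[:, 1]**2])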

Let's see whether this formulation works

Model problem¶

A problem similar to what we encountered in resolvent analysis $$ \begin{bmatrix} \dot{x} \\ \dot{y} \end{bmatrix} = \begin{bmatrix} -\omega y - x r^2(r^2-\mu) \\ \omega x - y r^2(r^2-\mu)\end{bmatrix} $$ where $r^2=x^2+y^2$.

  • When $\mu<0$, there is a stable equilibrium point at the origin
  • When $\mu\geq 0$, there is a stable limit cycle of radius $\sqrt{\mu}$, but an unstable equilibrium point at the origin
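For reference, a minimal sketch of the right-hand side above; the notebook's pre-defined helper fSysNLn is assumed to implement something equivalent (the name limit_cycle_rhs is illustrative):

import numpy as np

def limit_cycle_rhs(t, state, om=10.0, mu=4.0):
    # dx/dt = -om*y - x*r^2*(r^2 - mu),  dy/dt = om*x - y*r^2*(r^2 - mu)
    x, y = state
    r2 = x**2 + y**2
    return np.array([-om*y - x*r2*(r2 - mu),
                      om*x - y*r2*(r2 - mu)])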
In [2]:
OM, MU = 10, 4    # Picking omega=10, mu=4
func = lambda x: fSysNLn(0, x, om=OM, rr=MU)
pltQuiver([-3,3], 25, func, rr=2)
In [3]:
# Suppose now we generate the following two sample trajectories for training
dt = 0.0001    # Step size
Tf = 1.0       # Total time period
eps = 0.0      # Noise
x0s = [[1,0], [3,3]]  # Two initial conditions
t_train, x_train = genDataFixPar(dt, Tf, eps, x0s, (OM, MU))

# And we also generate two test trajectories
x0t = [[-0.5,-0.5], [-2,3]]  # Two initial conditions
t_test, x_test = genDataFixPar(dt, Tf, eps, x0t, (OM, MU))
In [4]:
# As expected, all trajectories converge to the limit cycle
# But the test trajectories cover a different region in state space.
cmpTrajPhase(x_train, x_test, ['Train', 'Test'])

Let's pick the following linear regression form $$ \begin{bmatrix} \dot{x} \\ \dot{y} \end{bmatrix} = \Xi^T\theta(x) = \begin{bmatrix} 0 & -\omega & \mu & 0 & -1 & 0 \\ \omega & 0 & 0 & \mu & 0 & -1 \end{bmatrix} \begin{bmatrix} x \\ y \\ xr^2 \\ yr^2 \\ xr^4 \\ yr^4 \end{bmatrix} $$

  • $\Xi$ is what we need to find from data. The exact solution should be $$ \begin{bmatrix} 0 & -10 & 4 & 0 & -1 & 0 \\ 10 & 0 & 0 & 4 & 0 & -1 \end{bmatrix} $$
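The custom feature library clib_lco used below is pre-defined in the notebook's helper code. A plausible construction with PySINDy's CustomLibrary might look like the following sketch (an assumption about the helper, not its actual definition):

import pysindy as ps

clib_func = [
    lambda x: x,                           # applied to each state: gives x and y
    lambda x, y: x * (x**2 + y**2),        # x r^2
    lambda x, y: y * (x**2 + y**2),        # y r^2
    lambda x, y: x * (x**2 + y**2)**2,     # x r^4
    lambda x, y: y * (x**2 + y**2)**2,     # y r^4
]
clib_name = [
    lambda x: x,
    lambda x, y: x + "r^2",
    lambda x, y: y + "r^2",
    lambda x, y: x + "r^4",
    lambda x, y: y + "r^4",
]
clib_lco = ps.CustomLibrary(library_functions=clib_func, function_names=clib_name)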
In [5]:
# Now we use the PySINDy implementation to do the fit
model = ps.SINDy(
    differentiation_method=ps.FiniteDifference(order=2),
    feature_library=clib_lco,             # We have pre-defined the feature vectors
    optimizer=ps.STLSQ(threshold=1e-4),   # This is almost like simple linear regression
    feature_names=["x", "y"])
model.fit(x_train, t=t_train, multiple_trajectories=True)
model.print()
print('\nFitted coefficients - not bad!')
model.coefficients()
(x)' = -0.007 x + -9.963 y + 4.011 xr^2 + -0.019 yr^2 + -1.002 xr^4 + 0.002 yr^4
(y)' = 9.994 x + 0.036 y + 0.011 xr^2 + 3.982 yr^2 + -0.002 xr^4 + -0.998 yr^4

Fitted coefficients - not bad!
Out[5]:
array([[-0.0066, -9.9631,  4.0110, -0.0189, -1.0024,  0.0024],
       [ 9.9936,  0.0360,  0.0107,  3.9816, -0.0023, -0.9977]])
In [6]:
# The learned model performs very well on unseen data
x_pred = predTrajFixPar(model, x0t, t_train)
cmpTraj2D(x_test, x_pred, t_train, 2)
Solving [-0.5, -0.5]
Solving [-2, 3]
In [7]:
# Another comparison on the phase plane
cmpPhasePlane((OM,MU), [model], ['Learned'])

However ...¶

Here we have cheated to some degree

  • We have chosen the features to be exactly those nonlinear terms in the exact model
    • What if we do not know these features beforehand?
    • If we just try as many features as we could think of, would the model overfit?
  • We have deliberately used noise-free data with a tiny time step size
    • With a larger time step size $\dot{X}$ would be less accurate
    • Noise would make $\dot{X}$ even less accurate
    • Perhaps we could try some filtering first on the data?

Next let's take a closer look at the feature selection and the denoising problem.

Feature selection: Sparse identification¶

If we do not know the model form beforehand, then it makes sense to try many different candidate features.

Back to the example¶

Say we only know that the model problem consists of polynomial terms, and we assume a feature vector of monomials up to 5th order, $$ \theta([x,y])^T = [x,y,x^2,xy,y^2,x^3,x^2y,xy^2,y^3,\cdots,xy^4,y^5] $$

The actual model, expanded in monomials, only consists of a tiny subset of the features, $$ \begin{bmatrix} \dot{x} \\ \dot{y} \end{bmatrix} = \begin{bmatrix} -\omega y - x r^2(r^2-\mu) \\ \omega x - y r^2(r^2-\mu)\end{bmatrix} = \begin{bmatrix} -\omega y + \mu x^3 + \mu xy^2 - x^5-2x^3y^2-xy^4 \\ \omega x + \mu x^2y + \mu y^3 - x^4y-2x^2y^3-y^5 \end{bmatrix} $$

But let's fit the model anyway.

In [8]:
model_overfit = ps.SINDy(
    differentiation_method=ps.FiniteDifference(order=2),
    feature_library=ps.PolynomialLibrary(degree=5),     # Now we use monomials up to 5th order
    # feature_library=ps.FourierLibrary(),
    optimizer=ps.STLSQ(threshold=1e-4),
    feature_names=["x", "y"])
model_overfit.fit(x_train, t=t_train, multiple_trajectories=True)
model_overfit.print()
print('\nFitted coefficients - cannot be true as they are all non-zero!')
(x)' = 6.983 1 + -6.383 x + -16.805 y + -2.350 x^2 + 7.366 x y + -1.197 y^2 + 5.719 x^3 + 1.852 x^2 y + 3.463 x y^2 + 2.317 y^3 + 0.151 x^4 + -1.841 x^3 y + 0.014 x^2 y^2 + -1.842 x y^3 + -0.137 y^4 + -1.031 x^5 + -0.038 x^4 y + -1.498 x^3 y^2 + -0.192 x^2 y^3 + -0.467 x y^4 + -0.154 y^5
(y)' = 6.807 1 + 3.779 x + -6.633 y + -2.291 x^2 + 7.180 x y + -1.167 y^2 + 1.675 x^3 + 5.805 x^2 y + -0.524 x y^2 + 6.259 y^3 + 0.147 x^4 + -1.795 x^3 y + 0.014 x^2 y^2 + -1.795 x y^3 + -0.133 y^4 + -0.030 x^5 + -1.037 x^4 y + 0.490 x^3 y^2 + -2.187 x^2 y^3 + 0.520 x y^4 + -1.150 y^5

Fitted coefficients - cannot be true as they are all non-zero!
In [9]:
# Prediction for train trajectories works well
x_pred = predTrajFixPar(model_overfit, x0s, t_train)
cmpTraj2D(x_train, x_pred, t_train, 2)
Solving [1, 0]
Solving [3, 3]
In [10]:
# Test prediction is totally off - clearly the model is overfitting
x_pred = predTrajFixPar(model_overfit, x0t, t_train)
cmpTraj2D(x_test, x_pred, t_train, 2)
Solving [-0.5, -0.5]
Solving [-2, 3]

Solution: Regularization¶

Recall the figure below

[Figure: Norms]

Given the regression problem above, if one faces the issue of having too many features, the immediate thought is to add a regularization term $R(\Xi)$, $$ \min_{\Xi} \norm{\dot X - \Theta(X)\Xi} + \color{red}{\lambda R(\Xi)} $$ where $\lambda$ is a penalty factor and $R(\Xi)$ could be,

  • Frobenius norm $\norm{\Xi}_F$: then we get ridge regression - many coefficients will be small, but non-zero
  • L1 norm $\norm{\Xi}_1$: then we get Lasso regression - more coefficients will be exactly zero.
  • L0 norm $\norm{\Xi}_0$: then we get the most zeros - but this is a non-convex term and hard to solve.
  • In vanilla SINDy, a relatively simple STLSQ (Sequentially Thresholded Least SQuares) algorithm was used.
    • STLSQ essentially alternates least-squares fits with hard thresholding, removing small coefficients iteratively; a minimal sketch is given after the reference below.
  • In the following, we present a more recent algorithm, Sparse Relaxed Regularized Regression (SR3) [1]

[1] Champion, K., et al., A unified sparse optimization framework to learn parsimonious physics-informed models from data, 2020.
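For concreteness, a minimal NumPy sketch of the STLSQ idea (illustrative only; ps.STLSQ is the actual implementation used above):

import numpy as np

def stlsq(Theta, dXdt, threshold=1e-4, n_iter=10):
    # Alternate least-squares fits with hard thresholding of small coefficients
    Xi, *_ = np.linalg.lstsq(Theta, dXdt, rcond=None)
    for _ in range(n_iter):
        small = np.abs(Xi) < threshold
        Xi[small] = 0.0
        for j in range(dXdt.shape[1]):          # refit each state equation on the surviving features
            big = ~small[:, j]
            if big.any():
                Xi[big, j], *_ = np.linalg.lstsq(Theta[:, big], dXdt[:, j], rcond=None)
    return Xi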

Consider a "relaxed" optimization formulation with an auxiliary variable $W$ $$ \min_{\Xi,W} \frac{1}{2}\norm{\dot X - \Theta(X)\Xi}^2 + \lambda R(W) + \frac{1}{2\nu}\norm{\Xi-W}^2 $$ As $\nu\rightarrow 0$, the last term forces $\Xi=W$ and the formulation reduces to the original one, $$ \min_{\Xi} \norm{\dot X - \Theta(X)\Xi} + \lambda R(\Xi) $$

But now,

  • The two quadratic parts can be solved in closed-form if $W$ is given
  • The regularization term $R(W)$ can be implemented using a technique called the proximal method.
    • The idea is that enforcing the regularization on $W$ is equivalent to applying the proximal operator to $W$
  • This formulation allows for the addition of constraints, if needed
    • One could add physics-informed priors on the model, e.g. identical coefficients due to symmetry, zero coefficients due to skew-symmetry, etc.

Examples of proximal operators: for the L0 penalty, the proximal operator is hard thresholding (entries with small magnitude are set to zero); for the L1 penalty, it is soft thresholding (every entry is shrunk toward zero by a fixed amount).
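A sketch of these two proximal operators in NumPy (the threshold conventions shown are the standard ones; the scaling may differ across implementations):

import numpy as np

# prox of a*||W||_0: hard thresholding at sqrt(2a)
prox_l0 = lambda W, a: np.where(np.abs(W) < np.sqrt(2*a), 0.0, W)
# prox of a*||W||_1: soft thresholding by a
prox_l1 = lambda W, a: np.sign(W) * np.maximum(np.abs(W) - a, 0.0)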

The algorithm goes as follows

  • Pick a penalty parameter $\lambda$, relaxation parameter $\nu$, and number of iterations $N_{itr}$
  • Start with a regular least squares solution $$ W^0 = \Theta(X)^+\dot{X} $$
  • For $k=1,2,\cdots,N_{itr}$:
    • Solve the quadratic part of the problem, for which a closed-form solution is available $$ \Xi^k = \arg\min_{\Xi} \frac{1}{2}\norm{\dot X - \Theta(X)\Xi}^2 + \frac{1}{2\nu}\norm{\Xi-W^{k-1}}^2 $$
    • Apply the proximal operator. For the L0 penalty, this simply zeros out small coefficients (with the threshold determined by $\lambda\nu$) $$ W^k = \mathrm{prox}_{\lambda\nu R}(\Xi^k) $$
    • Compute the change in the truncated coefficients $$ \epsilon = \norm{W^k-W^{k-1}} / \nu $$
    • Stop if $\epsilon$ is lower than a user-supplied threshold; otherwise continue
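Putting the pieces together, a minimal NumPy sketch of the SR3 iteration with an L0 penalty (illustrative only; ps.SR3 is the implementation used below, and its threshold convention may differ):

import numpy as np

def sr3_l0(Theta, dXdt, lam=0.1, nu=1.0, max_iter=1000, tol=1e-10):
    M = Theta.shape[1]
    W = np.linalg.lstsq(Theta, dXdt, rcond=None)[0]          # W^0: plain least-squares solution
    H = Theta.T @ Theta + np.eye(M) / nu                     # Hessian of the quadratic subproblem
    for _ in range(max_iter):
        Xi = np.linalg.solve(H, Theta.T @ dXdt + W / nu)     # closed-form Xi-update
        W_new = np.where(np.abs(Xi) < np.sqrt(2*lam*nu), 0.0, Xi)  # prox: hard thresholding
        eps = np.linalg.norm(W_new - W) / nu                 # change in the truncated coefficients
        W = W_new
        if eps < tol:
            break
    return W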

Side note¶

  • More information on the proximal gradient method: wiki and an introductory text
  • There are certainly more methods for sparsity enforcement, such as in [1]

[1] Gueho, D., et al., Filtered Integral Formulation of the Sparse Model Identification Problem, 2021.

Try the new optimizer out¶

In [11]:
# Using the same data
dt, Tf, eps = 0.0001, 1.0, 0.0
x0s = [[1,0], [3,3]]
t_train, x_train = genDataFixPar(dt, Tf, eps, x0s, (OM, MU))
x0t = [[-0.5,-0.5], [-2,3]]
t_test, x_test = genDataFixPar(dt, Tf, eps, x0t, (OM, MU))
In [12]:
opt = ps.SR3(
    threshold=0.8,
    thresholder="l0",
    max_iter=10000,
    tol=1e-10)       # The new optimizer

model_sr3 = ps.SINDy(
    differentiation_method=ps.FiniteDifference(order=2),
    feature_library=ps.PolynomialLibrary(degree=5, include_bias=False),
    optimizer=opt,
    feature_names=["x", "y"])
model_sr3.fit(x_train, t=t_train, multiple_trajectories=True)
print('Fitted coefficients - It is picking out the correct terms!')
model_sr3.print()
Fitted coefficients - It is picking out the correct terms!
(x)' = -10.000 y + 3.992 x^3 + 4.011 x y^2 + -0.998 x^5 + -2.001 x^3 y^2 + -1.003 x y^4
(y)' = 10.000 x + 4.001 x^2 y + 4.002 y^3 + -1.000 x^4 y + -2.001 x^2 y^3 + -1.001 y^5
In [13]:
# Now the test prediction is almost perfect
x_pred = predTrajFixPar(model_sr3, x0t, t_train)
cmpTraj2D(x_test, x_pred, t_train, 2)
Solving [-0.5, -0.5]
Solving [-2, 3]

Denoising the data¶

The success of the regression relies on the accuracy of the time derivative.

Effect of noise in sample data¶

In [14]:
# Using the same set up, but now with noise
dt, Tf, eps = 0.0001, 1.0, 0.1
x0s = [[-1.5,1], [2,2], [1,0], [3,3]]
t_train, x_train = genDataFixPar(dt, Tf, eps, x0s, (OM, MU))
# Set zero noise in test data
x0t = [[-2,2], [1,2.5]]
t_test, x_test = genDataFixPar(dt, Tf, 0.0, x0t, (OM, MU))
In [15]:
# Fit the model with customized features
model_noise = ps.SINDy(
    differentiation_method=ps.FiniteDifference(order=2),
    feature_library=clib_lco,
    optimizer=ps.SR3(threshold=0.8, thresholder="l0",
                     max_iter=10000, tol=1e-10),
    feature_names=["x", "y"])
model_noise.fit(x_train, t=t_train, multiple_trajectories=True)
model_noise.print()
print('\nFitted coefficients - even with cheating the fitting fails!')
model_noise.coefficients()
(x)' = 21.635 y + -0.067 xr^2 + -7.913 yr^2
(y)' = 10.791 x + -18.559 y + -0.163 xr^2 + 10.486 yr^2 + -1.451 yr^4

Fitted coefficients - even with cheating the fitting fails!
Out[15]:
array([[ 0.0000,  21.6354, -0.0667, -7.9125,  0.0000,  0.0000],
       [ 10.7908, -18.5590, -0.1632,  10.4856,  0.0000, -1.4508]])
In [16]:
# Even the prediction for train trajectories does not work well
x_pred = predTrajFixPar(model_noise, x0s, t_train)
cmpTraj2D(x_train, x_pred, t_train, 2)
Solving [-1.5, 1]
Solving [2, 2]
Solving [1, 0]
Solving [3, 3]
In [17]:
# Another comparison, in quiver plot - clearly the noise creates a problem
cmpPhasePlane((OM,MU), [model_noise], ['Model with noisy data'])

To start with...¶

There are some simple techniques to tackle the data noise. For example,

  • Apply classical signal filters, such as Savitzky-Golay, to data before computing the derivative
  • Use a Fourier method to compute the time derivative (see the sketch below):
    • Consider the Fourier transform $\hat{X}=\cF(X)$
    • Zero out the high-frequency components in $\hat{X}$, which are likely to be noise
    • Compute the time derivative as $$ \dot{X} = \cF^{-1}(\mathrm{i}\omega \hat{X}) $$
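A minimal sketch of the Fourier-derivative idea for a uniformly sampled scalar signal (illustrative names; note that the FFT implicitly assumes periodicity):

import numpy as np

def fourier_derivative(x, dt, keep_frac=0.1):
    # Differentiate in Fourier space, zeroing out the highest frequencies as likely noise
    n = len(x)
    xhat = np.fft.fft(x)
    omega = 2*np.pi * np.fft.fftfreq(n, d=dt)                      # angular frequencies
    xhat[np.abs(omega) > keep_frac * np.abs(omega).max()] = 0.0    # crude low-pass cutoff
    return np.real(np.fft.ifft(1j * omega * xhat))                 # F^{-1}(i*omega*xhat)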

But there is certainly a lot of tuning work to do - see the complaints in [1]

[1] Rudy, S., et al., Data-driven discovery of partial differential equations, 2017.

In [18]:
# Still fitting the model with customized features
# But now with smoothed finite difference for time derivatives
model_smooth = ps.SINDy(
    differentiation_method=ps.SmoothedFiniteDifference(order=2),
    feature_library=clib_lco,
    optimizer=ps.SR3(threshold=0.4, thresholder="l0",
                     max_iter=20000, tol=1e-12),
    feature_names=["x", "y"])
model_smooth.fit(x_train, t=t_train, multiple_trajectories=True)
model_smooth.print()
print('\nFitted coefficients - does not seem to work well!')
model_smooth.coefficients()
(x)' = 4.861 x + -27.096 y + -1.202 xr^2 + 9.029 yr^2 + -1.177 yr^4
(y)' = 7.639 x + 2.659 xr^2 + 1.843 yr^2 + -0.516 xr^4 + -0.458 yr^4

Fitted coefficients - does not seem to work well!
Out[18]:
array([[ 4.8613, -27.0956, -1.2017,  9.0287,  0.0000, -1.1770],
       [ 7.6390,  0.0000,  2.6589,  1.8431, -0.5161, -0.4575]])
In [19]:
# Somewhat improved
x_pred = predTrajFixPar(model_smooth, x0s, t_train)
cmpTraj2D(x_train, x_pred, t_train, 2)
Solving [-1.5, 1]
Solving [2, 2]
Solving [1, 0]
Solving [3, 3]
In [20]:
# # But DIVERGES in the second test case
# x_pred = predTrajFixPar(model_smooth, x0t, t_train)
# cmpTraj2D(x_test, x_pred, t_train, 2)

The weak form formulation¶

Next let's introduce a fancier technique with the understanding that

Differentiating noisy data amplifies the noise, but integrating it smooths the noise out

First recall that if one has a series of data points $x_i=x(t_i)$ on grid points $t_I < t_{I+1} < \cdots < t_J$, then the integral of $x(t)$ over $\Omega_t=[t_I,t_J]$ can be approximated as $$ \int_{\Omega_t} x(t) dt \approx \sum_{i=I}^J w_i x_i $$ where the weights $w_i$ depend on the grid points. A typical choice is the trapezoidal rule.
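For example, the trapezoidal-rule weights on a (possibly non-uniform) grid can be built as in this small illustrative sketch:

import numpy as np

def trapezoid_weights(t):
    # Weights w such that w @ x approximates the integral of x(t) over [t[0], t[-1]]
    w = np.zeros_like(t)
    dt = np.diff(t)
    w[:-1] += 0.5 * dt
    w[1:]  += 0.5 * dt
    return w

t = np.linspace(0.0, np.pi, 201)
print(trapezoid_weights(t) @ np.sin(t))   # ~2.0, the exact integral of sin over [0, pi]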

Consider noisy data $x_i$ over a time interval $\Omega_t=[t_I,t_J]$, as well as another known smooth function $\phi(t)$ that vanishes at $t=t_I$ and $t=t_J$. Then $$ \int_{\Omega_t} \dot{x} \phi dt = x\phi|_{t_I}^{t_J} - \int_{\Omega_t} x\dot{\phi} dt = - \int_{\Omega_t} x\dot{\phi} dt $$

The last equation is the so-called weak form, which is rooted in functional analysis for PDEs

Then we are able to transfer the difficult derivative on noisy data to a much easier derivative on a known smooth function. Furthermore,

$$ \int_{\Omega_t} x\dot{\phi} dt \approx \sum_{i=I}^J w_i x_i \dot{\phi}(t_i) \equiv -q^T x $$

We can apply the integral and the weak form to the entire system equation, $$ \int_{\Omega_t} \begin{bmatrix} \dot{x}_1 \\ \dot{x}_2 \\ \vdots \\ \dot{x}_N \end{bmatrix} \phi dt = \int_{\Omega_t} \begin{bmatrix} \xi_{11} & \xi_{12} & \cdots & \xi_{1M} \\ \xi_{21} & \xi_{22} & \cdots & \xi_{2M} \\ \vdots & \vdots & \ddots & \vdots \\ \xi_{N1} & \xi_{N2} & \cdots & \xi_{NM} \end{bmatrix} \begin{bmatrix} \theta_1(x) \\ \theta_2(x) \\ \vdots \\ \theta_M(x) \end{bmatrix} \phi dt $$

$$ - \begin{bmatrix} \int_{\Omega_t} x_1 \dot{\phi} dt \\ \int_{\Omega_t} x_2 \dot{\phi} dt \\ \vdots \\ \int_{\Omega_t} x_N \dot{\phi} dt \end{bmatrix} = \begin{bmatrix} \xi_{11} & \xi_{12} & \cdots & \xi_{1M} \\ \xi_{21} & \xi_{22} & \cdots & \xi_{2M} \\ \vdots & \vdots & \ddots & \vdots \\ \xi_{N1} & \xi_{N2} & \cdots & \xi_{NM} \end{bmatrix} \begin{bmatrix} \int_{\Omega_t} \theta_1(x) \phi dt \\ \int_{\Omega_t} \theta_2(x) \phi dt \\ \vdots \\ \int_{\Omega_t} \theta_M(x) \phi dt \end{bmatrix} $$

where each of the integrals can be evaluated numerically, without much impact from noise.

Considering a series of $N_\Omega$ intervals $\Omega_i$ and $N_\phi$ test functions $\phi_j$, a linear system of equations is formed and denoted $$ \dot{q}_{i,j}=\Xi^Tq_{i,j} $$ These equations can be assembled into the familiar least-squares form $$ \min_{\Xi} \norm{\dot{Q} - Q\Xi} $$ where $Q^T=[q_{1,1},q_{1,2},\cdots,q_{1,N_\phi},\cdots,q_{N_\Omega,N_\phi}]$, and similarly for $\dot{Q}^T$.
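A minimal sketch of assembling one weak-form "row" for a single interval and a single polynomial test function (illustrative; PySINDy's WeakPDELibrary, used below, automates this):

import numpy as np

def weak_form_row(t, x, theta, t_a, t_b):
    # One interval Omega_t = [t_a, t_b] and one test function phi = [(t - t_a)(t_b - t)]^2
    mask = (t >= t_a) & (t <= t_b)
    ts, xs = t[mask], x[mask]                            # samples inside the interval
    s = (ts - t_a) * (t_b - ts)
    phi = s**2                                           # vanishes at both endpoints
    dphi = 2.0 * s * ((t_b - ts) - (ts - t_a))           # d(phi)/dt
    dq = -np.trapz(dphi[:, None] * xs, ts, axis=0)       # -int x dphi dt,        length N
    q = np.trapz(phi[:, None] * theta(xs), ts, axis=0)   # int theta(x) phi dt,   length M
    return dq, q

# Stacking (dq, q) over many intervals and test functions gives Qdot and Q,
# and Xi then follows from the least-squares problem min ||Qdot - Q Xi||.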

Side note¶

  • Nothing prevents the weak formulation from being applied to partial differential equations (PDEs). In fact, this method was originally developed for the discovery of PDEs from noisy data. See [1] for more details.
  • Another approach recommended for tackling noise, alongside the weak form, is ensembling. For example, one can subsample a noisy trajectory to create multiple, sparser trajectories and train a SINDy model on each, obtaining an ensemble of models; one then uses, e.g., the average or the median of the models for prediction. Similarly, one can ensemble over the features, or do both. See [2] for more details, and a rough sketch after the references below.

[1] Reinbold, P., et al., Using noisy or incomplete data to discover models of spatiotemporal dynamics, 2020.

[2] PySINDy Documentation: Ensembling Feature Overview
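A rough sketch of the trajectory-subsampling ensemble idea, reusing the objects from this notebook; it assumes t_train is a single time array shared by all trajectories (newer PySINDy versions also provide built-in ensembling options):

import numpy as np

rng = np.random.default_rng(0)
coef_list = []
for _ in range(20):
    # Randomly subsample the time grid to create a sparser copy of each noisy trajectory
    # (assumes t_train is one shared 1-D time array)
    idx = np.sort(rng.choice(len(t_train), size=len(t_train) // 2, replace=False))
    x_sub = [x[idx] for x in x_train]
    m = ps.SINDy(feature_library=clib_lco,
                 optimizer=ps.SR3(threshold=0.4, thresholder="l0"),
                 feature_names=["x", "y"])
    m.fit(x_sub, t=t_train[idx], multiple_trajectories=True)
    coef_list.append(m.coefficients())
coef_median = np.median(np.stack(coef_list), axis=0)   # robust ensemble estimate of Xi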

Try the weak form out¶

In [21]:
# Again we use PySINDy implementation
pts, K = 400, 400
ode_lib = ps.WeakPDELibrary(
    library_functions=clib_func, function_names=clib_name, spatiotemporal_grid=t_train,
    include_bias=False, is_uniform=True, num_pts_per_domain=pts, K=K)
opt = ps.SR3(threshold=0.4, thresholder="l0", max_iter=60000, tol=1e-12)

model = ps.SINDy(feature_library=ode_lib, optimizer=opt, feature_names=["x", "y"])
model.fit(x_train, multiple_trajectories=True)
model_weak = wsWrapper(model, clib_lco, opt, x_train, t_train)
model_weak.print()
print('\nFitted coefficients - cannot say the coefficients are the most accurate')
model_weak.coefficients()
(x)' = -21.735 y + 2.238 xr^2 + 5.490 yr^2 + -0.559 xr^4 + -0.630 yr^4
(y)' = 10.791 x + -18.559 y + -0.163 xr^2 + 10.486 yr^2 + -1.451 yr^4

Fitted coefficients - cannot say the coefficients are the most accurate
/Users/daninghuang/Library/Python/3.8/lib/python/site-packages/pysindy/optimizers/sr3.py:388: ConvergenceWarning: SR3._reduce did not converge after 60000 iterations.
  warnings.warn(
Out[21]:
array([[ 0.0000, -21.7348,  2.2385,  5.4900, -0.5588, -0.6299],
       [ 10.7908, -18.5590, -0.1632,  10.4856,  0.0000, -1.4508]])
In [22]:
# We lost one training case...
x_pred = predTrajFixPar(model_weak, x0s, t_train)
cmpTraj2D(x_train, x_pred, t_train, 2)
Solving [-1.5, 1]
Solving [2, 2]
Solving [1, 0]
Solving [3, 3]
In [23]:
# But the test cases seem to work really well
x_pred = predTrajFixPar(model_weak, x0t, t_train)
cmpTraj2D(x_test, x_pred, t_train, 2)
Solving [-2, 2]
Solving [1, 2.5]
In [24]:
# A closer look at the phase plane - note the catastrophic diverging region in the model with smoothed FD
cmpPhasePlane((OM,MU), [model_smooth, model_weak], ['Smoothed FD', 'Weak form'])

Handling parameters¶

Finally, we look at an extended problem with system parameters $$ \dot{x}=F(x,\mu) $$ We have been keeping $\mu$ fixed in previous examples.

How about finding a model that works for a range of $\mu$'s?

It is easy¶

Using the previous example, we can simply modify the model to be learned as $$ \begin{bmatrix} \dot{x} \\ \dot{y} \\ \color{red}{\dot{\mu}} \end{bmatrix} = \begin{bmatrix} -\omega y - x r^2(r^2-\mu) \\ \omega x - y r^2(r^2-\mu) \\ \color{red}{0}\end{bmatrix} $$ so that $\mu$ behaves as if it were a state and can appear in the system function as a variable, just like $x$ and $y$.

The rest is then just like regular SINDy

However, be careful: since $\mu$ now enters the feature library as an extra variable, the polynomial order of the features has to increase (e.g., the $\mu x r^2$ terms become 4th-order monomials in $(x,y,\mu)$).
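A minimal sketch of the state augmentation; the notebook's genDataMultiPar helper is assumed to do something equivalent (the function name here is illustrative):

import numpy as np

def augment_with_parameter(x, mu):
    # x: (L, 2) trajectory of [x, y]; returns an (L, 3) trajectory [x, y, mu] with mu constant
    return np.hstack([x, np.full((x.shape[0], 1), float(mu))])

# SINDy is then fit on the augmented trajectories; since mu never changes along a
# trajectory, the fitted equation for the third state should come out as (u)' = 0.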

In [25]:
# Now we generate a new dataset
dt, Tf, eps = 0.0001, 2.0, 0.0
# Training: mu = -2, -1, 0, 1, 2
x0s = [[-1.5,1], [2,2], [1,0], [3,3]]
args = [(OM,-2), (OM,-1), (OM,0), (OM,1), (OM,2)]
inps = [(_a[1],) for _a in args]
t_train, x_train = genDataMultiPar(dt, Tf, eps, x0s, args, 1)
# Test: mu = -2.5, -1.5, -0.5, 0.5, 1.5, 2.5
x0t = [[-2,2], [1,2.5]]
argt = [(OM,-2.5), (OM,-1.5), (OM,-0.5), (OM,0.5), (OM,1.5), (OM,2.5)]
inpt = [(_a[1],) for _a in argt]
t_test, x_test = genDataMultiPar(dt, Tf, eps, x0t, argt, 1)
In [26]:
optimizer = ps.SR3(
    threshold=1.0,
    thresholder="l0",
    max_iter=1000,
    tol=1e-10)
library = ps.PolynomialLibrary(degree=6, include_bias=False)
model = ps.SINDy(optimizer=optimizer, feature_library=library, feature_names=['x', 'y', 'u'])
model.fit(x_train, t=t_train, multiple_trajectories=True, quiet=True)
model.print()
# Numbers are looking familiar and the last term is correctly zero.
(x)' = -10.086 y + 1.686 x^3 u + -1.560 x^5 + -1.986 x^3 y^2 + -0.476 x y^4
(y)' = 10.064 x + 0.752 x^2 y u + 1.103 y^3 u + -2.980 x^2 y^3 + -0.972 y^5
(u)' = 0.000
In [28]:
# Comparing the trajectories in 3D - they look identical!
# Also note that some of the test cases are BEYOND the training cases
cmpTraj3D(x_test, x_pred, 2)

Side note¶

There are many more variants and applications of the SINDy algorithm. Just naming a few:

  • To handle implicit ODEs - see [1]
  • To handle control inputs - see [2]
  • See [3] for a recent summary of extensions and watch PySINDy@github for updates.

[1] Kaheman, K., et al., SINDy-PI: a robust algorithm for parallel implicit sparse identification of nonlinear dynamics, 2020.

[2] Brunton, S., et al., Sparse Identification of Nonlinear Dynamics with Control (SINDYc), 2016.

[3] Kaptanoglu, A., et al., PySINDy: A comprehensive Python package for robust sparse system identification, 2022.