├── images
├── BOPINNalgo.PNG
└── BOPINN_methodolody.png
├── data
├── u_analytic_c=0.2t=0.25snr=39.36.mat
├── u_analytic_c=0.55t=0.25snr=38.91.mat
└── u_analytic_c=0.85t=0.25snr=37.5.mat
├── LICENSE
├── lib
├── network.py
├── layer.py
├── pinn_wave.py
└── optimizer.py
├── README.md
├── analytical.py
├── PINN.py
├── BOPINN.py
└── BOPINN.ipynb
/images/BOPINNalgo.PNG:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/mahindrautela/BOPINN/HEAD/images/BOPINNalgo.PNG
--------------------------------------------------------------------------------
/images/BOPINN_methodolody.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/mahindrautela/BOPINN/HEAD/images/BOPINN_methodolody.png
--------------------------------------------------------------------------------
/data/u_analytic_c=0.2t=0.25snr=39.36.mat:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/mahindrautela/BOPINN/HEAD/data/u_analytic_c=0.2t=0.25snr=39.36.mat
--------------------------------------------------------------------------------
/data/u_analytic_c=0.55t=0.25snr=38.91.mat:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/mahindrautela/BOPINN/HEAD/data/u_analytic_c=0.55t=0.25snr=38.91.mat
--------------------------------------------------------------------------------
/data/u_analytic_c=0.85t=0.25snr=37.5.mat:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/mahindrautela/BOPINN/HEAD/data/u_analytic_c=0.85t=0.25snr=37.5.mat
--------------------------------------------------------------------------------
/LICENSE:
--------------------------------------------------------------------------------
1 | MIT License
2 |
3 | Copyright (c) 2024 Mahindra Rautela
4 |
5 | Permission is hereby granted, free of charge, to any person obtaining a copy
6 | of this software and associated documentation files (the "Software"), to deal
7 | in the Software without restriction, including without limitation the rights
8 | to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
9 | copies of the Software, and to permit persons to whom the Software is
10 | furnished to do so, subject to the following conditions:
11 |
12 | The above copyright notice and this permission notice shall be included in all
13 | copies or substantial portions of the Software.
14 |
15 | THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 | IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 | FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
18 | AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19 | LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
20 | OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
21 | SOFTWARE.
22 |
--------------------------------------------------------------------------------
/lib/network.py:
--------------------------------------------------------------------------------
1 | import tensorflow as tf
2 |
class Network:
    """
    Build a physics informed neural network (PINN) model for the wave equation.
    """

    @classmethod
    def build(cls, num_inputs=2, layers=(64, 128, 128, 128, 128, 64), activation='tanh', num_outputs=1):
        """
        Build a PINN model for the wave equation with input shape (t, x) and output shape u(t, x).

        Args:
            num_inputs: number of input variables. Default is 2 for (t, x).
            layers: iterable with the number of units of each hidden layer, in order.
                The default is an immutable tuple so it cannot be altered between calls.
            activation: activation function in hidden layers.
            num_outputs: number of output variables. Default is 1 for u(t, x).

        Returns:
            keras network model.
        """

        # input layer
        inputs = tf.keras.layers.Input(shape=(num_inputs,))
        # hidden layers: each dense layer is followed by a dropout layer
        # NOTE(review): dropout presumably only acts when the model is called
        # with training=True - confirm this is the intended regularisation.
        x = inputs
        for units in layers:
            x = tf.keras.layers.Dense(units, activation=activation,
                kernel_initializer='he_normal')(x)
            x = tf.keras.layers.Dropout(0.1)(x)
        # output layer (linear activation)
        outputs = tf.keras.layers.Dense(num_outputs,
            kernel_initializer='he_normal')(x)

        return tf.keras.models.Model(inputs=inputs, outputs=outputs)
36 |
--------------------------------------------------------------------------------
/lib/layer.py:
--------------------------------------------------------------------------------
1 | import tensorflow as tf
2 |
class GradientLayer(tf.keras.layers.Layer):
    """
    Keras layer that evaluates a wrapped model together with its 1st and 2nd
    derivatives with respect to the inputs (t, x).

    Attributes:
        model: keras network model.
    """

    def __init__(self, model, **kwargs):
        """
        Args:
            model: keras network model.
            **kwargs: forwarded to the keras Layer constructor.
        """

        self.model = model
        super().__init__(**kwargs)

    def call(self, tx):
        """
        Evaluate the model and differentiate its output twice.

        Args:
            tx: input variables (t, x).

        Returns:
            u: network output.
            du_dt: 1st derivative of t.
            du_dx: 1st derivative of x.
            d2u_dt2: 2nd derivative of t.
            d2u_dx2: 2nd derivative of x.
        """

        # The first-order jacobian is computed inside the outer tape so that
        # the outer tape can differentiate it a second time.
        with tf.GradientTape() as outer_tape:
            outer_tape.watch(tx)
            with tf.GradientTape() as inner_tape:
                inner_tape.watch(tx)
                u = self.model(tx)
            first_order = inner_tape.batch_jacobian(u, tx)
            du_dt = first_order[..., 0]
            du_dx = first_order[..., 1]
        second_order = outer_tape.batch_jacobian(first_order, tx)
        # only the pure second derivatives are returned
        d2u_dt2 = second_order[..., 0, 0]
        d2u_dx2 = second_order[..., 1, 1]

        return u, du_dt, du_dx, d2u_dt2, d2u_dx2
48 |
--------------------------------------------------------------------------------
/README.md:
--------------------------------------------------------------------------------
1 | # BOPINN (Bayesian optimized physics-informed neural network)
2 | BOPINN presents a new paradigm to solve inverse problems through an amalgamation of PINNs and BO. It uses BO (a gradient-free and global optimization scheme) and PINNs (a fast neural surrogate solver for PDEs). In BOPINN, a PINN utilizes a neural surrogate to solve the partial differential equation (wave propagation here). Bayesian optimization runs over the PINN model and estimates the optimum parameters (wave velocity in the medium here) using a single snapshot observation of the field. BOPINN queries the black-box PINN model at different wave velocities until it converges to the true wave velocity. The proposed method is simpler (uses a single neural network), robust (captures uncertainty) and flexible (useful in real-time and online settings) as compared to its counterparts.
3 |
4 |
5 |
6 |
7 |
8 |
9 |
10 |
11 |
12 | ## About the repository:
13 | 1. Written in tensorflow 2.10 with cuda 11.8 and cudnn 8.x
14 | 2. The code uses BO repository from [bayesian-optimization](https://github.com/bayesian-optimization/BayesianOptimization).
15 | 3. "BOPINN.py" is the python file (run in spyder) and "BOPINN.ipynb" is a notebook (use colab or jupyter)
16 | 4. "PINN.py" is a PINN based solver for the forward wave propagation problem. It's an auxiliary code to understand the forward problem
17 | 5. "analytical.py" gives the exact solution of the wave equation with Dirichlet BC and it is used to collect data (added white noise)
18 | 6. data folder contains the snapshot observation collected from "analytical.py"
19 | 7. lib folder has .py files required to run "PINN.py" and "BOPINN.py"
20 |
21 | For more information:
22 | 1. [Link](https://doi.org/10.48550/arXiv.2312.14064) of the paper: Bayesian optimized physics-informed neural network for estimating wave propagation velocities.
23 | 2. Please cite the paper if you are using code, paper or data.
24 | ```
25 | @article{rautela2023bayesian,
26 | title={Bayesian optimized physics-informed neural network for estimating wave propagation velocities},
27 | author={Rautela, Mahindra and Gopalakrishnan, S and Senthilnath, J},
28 | journal={arXiv preprint arXiv:2312.14064},
29 | year={2023}
30 | }
31 | ```
32 |
33 |
--------------------------------------------------------------------------------
/lib/pinn_wave.py:
--------------------------------------------------------------------------------
1 | import tensorflow as tf
2 | from .layer import GradientLayer
3 |
class PINN:
    """
    Physics informed neural network (PINN) wrapper for the wave equation.

    Attributes:
        network: keras network model with input (t, x) and output u(t, x).
        c: wave velocity.
        grads: gradient layer built around `network`.
    """

    def __init__(self, network, c):
        """
        Args:
            network: keras network model with input (t, x) and output u(t, x).
            c: wave velocity.
        """

        self.network = network
        self.c = c
        self.grads = GradientLayer(self.network)

    def build(self):
        """
        Assemble the multi-input / multi-output keras model used for training.

        Returns:
            PINN model for the wave equation with
                input: [ (t, x) relative to equation,
                         (t=0, x) relative to initial condition,
                         (t, x=bounds) relative to boundary condition ],
                output: [ wave-equation residual at the equation points,
                          u(t=0, x) relative to initial condition,
                          du_dt(t=0, x) relative to initial derivative of t,
                          u(t, x=bounds) relative to boundary condition ]
        """

        # one symbolic (t, x) input per group of training points
        tx_eqn = tf.keras.layers.Input(shape=(2,))   # equation points
        tx_ini = tf.keras.layers.Input(shape=(2,))   # initial condition points
        tx_bnd = tf.keras.layers.Input(shape=(2,))   # boundary condition points

        # residual of the wave equation, trained towards zero
        *_, d2u_dt2, d2u_dx2 = self.grads(tx_eqn)
        c_squared = self.c*self.c
        u_eqn = d2u_dt2 - c_squared * d2u_dx2

        # value and time derivative at the initial condition points
        ini_terms = self.grads(tx_ini)
        u_ini = ini_terms[0]
        du_dt_ini = ini_terms[1]

        # dirichlet boundary: the network value itself
        # (a neumann boundary would use du_dx from self.grads(tx_bnd) instead)
        u_bnd = self.network(tx_bnd)

        model_inputs = [tx_eqn, tx_ini, tx_bnd]
        model_outputs = [u_eqn, u_ini, du_dt_ini, u_bnd]
        return tf.keras.models.Model(inputs=model_inputs, outputs=model_outputs)
62 |
63 |
--------------------------------------------------------------------------------
/analytical.py:
--------------------------------------------------------------------------------
1 | import numpy as np
2 | import math
3 | import matplotlib.pyplot as plt
4 | from matplotlib.colors import Normalize
5 | from matplotlib.gridspec import GridSpec
6 | import os
7 |
# Problem set-up: L and T bound the x and t grids built below;
# n is kept equal to L
L = n = 10
T = 1

# candidate wave speeds; the first one is used for the full-field plot
C = [0.20, 0.55, 0.85]
c = C[0]

# snapshot times, given as fractions of T
tfrac = np.array([0.25, 0.50, 0.75])
tilde_t = T*tfrac

# number of scan points
num_points = 5000
24 | # RMS function
def RMS(S):
    """Return the root-mean-square value of the array S."""
    mean_square = np.mean(S**2)
    return np.sqrt(mean_square)
28 |
def u_analytic(t,x,c,L,n):
    """
    Evaluate -sin(pi*x) * cos(n*pi*c*t/L), the closed-form field used as the
    analytical solution in this script.

    t and x may be scalars or arrays of matching shape (e.g. mesh form).
    """
    spatial_part = np.sin(math.pi*x)
    temporal_part = np.cos(n*math.pi*c*t/L)
    return -spatial_part*temporal_part
33 |
# Full analytical solution on the domain [0,L] x [0,T]
t = np.linspace(0, T, num_points)
x = np.linspace(0, L, num_points)
# meshgrid(x, t): rows run along t, columns along x
x_mesh, t_mesh = np.meshgrid(x, t)
usol_full = u_analytic(t_mesh, x_mesh, c, L, n)

# row index of every snapshot time (fraction of the grid length, truncated)
idx = (num_points*tfrac).astype(int).tolist()

# upper panel: u(t,x) as a color-map
fig = plt.figure(figsize=(7,4))
gs = GridSpec(2, 3) # two rows, three columns of subplot slots
plt.subplot(gs[0, :])
vmin, vmax = -1.0, +1.0
color_norm = Normalize(vmin=vmin, vmax=vmax)
plt.pcolormesh(t_mesh, x_mesh, usol_full, cmap='rainbow', shading = 'auto', norm=color_norm)
plt.xlabel('t')
plt.ylabel('x')
cbar = plt.colorbar(pad=0.05, aspect=10)
cbar.set_label('u(t,x)')
cbar.mappable.set_clim(vmin, vmax)

# lower panels: u(t=const, x) cross-sections, one per snapshot time
for panel, (row, t_cs) in enumerate(zip(idx, tilde_t)):
    plt.subplot(gs[1, panel])
    plt.plot(x, usol_full[row,:], 'b', linewidth = 2)
    plt.title('t={}'.format(t_cs))
    plt.xlabel('x')
    plt.ylabel('u(t,x)')
    plt.ylim(-1,1)
plt.tight_layout()
plt.show()
65 |
#%% usol at particular snapshot time
from scipy.io import savemat

# data storing
# Raw string: the backslashes of this Windows path are literal characters.
# In a plain string literal "\M", "\d" and "\P" are unrecognized escape
# sequences, which Python reports with a warning.
path = r"C:\MSR\data\PINNBO\data"

# amplitude of noise
beta_range = [0.0075] #[0.0075, 0.01, 0.025, 0.05]

# spatial grid shared by every snapshot
xx = np.linspace(0, L, num_points)

# parameters of the white noise (mean and standard deviation before scaling)
mu = 0
sigma = 1

# one entry per (speed, snapshot time, noise amplitude) combination
usol_app = []
usol_n_app = []
for c in C:
    for t_obs in tilde_t:
        for beta in beta_range:
            # without noise: evaluate the solution directly on the 1-D grid
            # at the fixed observation time (no 2-D mesh is needed because
            # every time row would be identical)
            tt = np.full(xx.shape, t_obs)
            usol = u_analytic(tt, xx, c, L, n)
            usol_app.append(usol)

            # Add white noise to the data
            noise = beta*(sigma*np.random.randn(num_points,1) + mu)

            # noisy data, stored as a column vector
            usol_n = usol[:,np.newaxis] + noise
            usol_n_app.append(usol_n)

            # signal to noise ratio (in dB and as a percentage)
            snr = 20*np.log10(RMS(usol)/RMS(noise))
            snr_percent = RMS(noise)/RMS(usol)*100

            f1 = "c="+str(c)
            f2 = "t="+str(t_obs)
            f3 = "snr="+str(np.round(snr,2))

            # clean vs. noisy snapshot, side by side
            fig, (ax1, ax2) = plt.subplots(1, 2,figsize=(10,4))
            ax1.plot(xx,usol)
            ax1.set_title('Without noise', fontsize = 15)
            ax1.set(xlabel='x', ylabel='Normalized u(x,t)')
            ax1.set_ylim(-1.2,1.2)

            ax2.plot(xx,usol_n)
            ax2.set_title(f1+f2+f3, fontsize = 15)
            ax2.set(xlabel='x')
            ax2.set_ylim(-1.2,1.2)

            plt.show()

            # save data
            filename = "u_analytic_"+f1+f2+f3
            filepath = os.path.join(path, filename)
            mdic = {"a1": usol_n, "label": "experiment"}
            savemat(filepath+".mat", mdic)
129 |
#%% analysis of experimental data
usol_app = np.array(usol_app)
usol_n_app = np.array(usol_n_app)
color = ['k','tab:blue','tab:orange',
         'tab:green','tab:red','tab:purple',
         'tab:brown','tab:pink','tab:gray','tab:cyan']

# one legend label per stored snapshot ('1', '2', ...), so the legend stays
# in step with the number of curves actually generated
labels = [str(k + 1) for k in range(usol_app.shape[0])]

# noise-free snapshots
plt.figure(figsize=(10,4))
for i, clean in enumerate(usol_app):
    # cycle through the palette if there are more curves than colors
    plt.plot(xx, clean, color[i % len(color)])
plt.legend(labels)
#plt.savefig('analytical_9_withoutnoise', dpi = 300)

# noisy snapshots
plt.figure(figsize=(10,4))
for i, noisy in enumerate(usol_n_app):
    plt.plot(xx, noisy, color[i % len(color)])
plt.legend(labels)
#plt.savefig('analytical_9_withnoise', dpi = 300)
148 |
--------------------------------------------------------------------------------
/PINN.py:
--------------------------------------------------------------------------------
1 | #import lib.tf_silent
2 | import numpy as np
3 | import tensorflow as tf
4 | import matplotlib.pyplot as plt
5 | from matplotlib.colors import Normalize
6 | from matplotlib.gridspec import GridSpec
7 | from lib.pinn_wave import PINN
8 | from lib.network import Network
9 | from lib.optimizer import L_BFGS_B
10 | import math
11 | import time
12 |
# sample counts: training (collocation) points and test grid points
num_train_samples = 25000
num_test_samples = 5000

# physical set-up
c = 0.2 # scaled speed
L = n = 10 # L bounds the x range; n is kept equal to L
T = 1 # upper bound of the t range
23 |
24 | # Initial conditions
def u0(t):
    """Return -sin(pi * t), the profile used as the initial condition."""
    return -np.sin(1*math.pi*t)
28 |
def du0_dt(tx):
    """
    Differentiate u0 with respect to the first input column via a gradient tape.

    NOTE(review): u0 is written with NumPy, so the tape presumably cannot
    trace it; this helper is not called in the visible script - confirm
    before relying on it.
    """
    with tf.GradientTape() as tape:
        tape.watch(tx)
        u = u0(tx)
    jacobian = tape.batch_jacobian(u, tx)
    # keep only the derivative with respect to the first input column
    du_dt = jacobian[..., 0]
    return du_dt
35 |
# Analytical solution
xx = np.linspace(0,L,num_test_samples)
tt = np.linspace(0,T,num_test_samples)
# usol[i, j] = -sin(pi*xx[i]) * cos(n*pi*c*tt[j]/L), built as an outer product
# of the spatial and temporal factors instead of a Python double loop over
# num_test_samples**2 entries
usol = np.outer(-np.sin(math.pi*xx), np.cos(n*math.pi*c*tt/L))
43 |
44 |
########################################################################
######################## collocation points ############################
########################################################################

# equation points: uniform samples scaled to t in [0, T], x in [0, L]
tx_eqn = np.random.rand(num_train_samples, 2)
tx_eqn[:, 0] *= T
tx_eqn[:, 1] *= L

# initial-condition points: t fixed at 0, x in [0, L]
tx_ini = np.random.rand(num_train_samples, 2)
tx_ini[:, 0] = 0
tx_ini[:, 1] *= L

# boundary points: t in [0, T], x snapped to either 0 or L
tx_bnd = np.random.rand(num_train_samples, 2)
tx_bnd[:, 0] *= T
tx_bnd[:, 1] = L*np.round(tx_bnd[:, 1])

# training targets
u_zero = np.zeros((num_train_samples, 1))     # equation residual and boundary value
u_ini = u0(tx_ini[:, 1:2])                    # initial profile at the sampled x
du_dt_ini = np.zeros((num_train_samples, 1))  # zero initial time derivative
68 |
#########################################################################
########################### TRAINING PINNs ##############################
#########################################################################

# core network u(t, x) and the PINN model wrapped around it
network = Network.build()
#network.summary()
pinn = PINN(network,c).build()

# time the L-BFGS-B optimisation
begin = time.time()
# inputs and targets are listed in the order of the PINN model inputs/outputs
x_train = [tx_eqn, tx_ini, tx_bnd]
y_train = [u_zero, u_ini, du_dt_ini, u_zero]
lbfgs = L_BFGS_B(model=pinn, x_train=x_train, y_train=y_train)
lbfgs.fit()
end = time.time()
totaltime = end-begin
print("\n Total runtime of the program is (min.)",totaltime/60)
89 |
#########################################################################
######################## PREDICTION #####################################
#########################################################################

# evaluate the trained network on the full (t, x) test grid
t_flat = np.linspace(0, T, num_test_samples)
x_flat = np.linspace(0, L, num_test_samples)
t, x = np.meshgrid(t_flat, x_flat)
tx = np.stack([t.flatten(), x.flatten()], axis=-1)
u = network.predict(tx, batch_size=num_test_samples).reshape(t.shape)

# upper panel: u(t,x) as a color-map
fig = plt.figure(figsize=(12,8))
gs = GridSpec(2, 3) # two rows, three columns of subplot slots
plt.subplot(gs[0, :])
vmin, vmax = -1.0, +1.0
color_norm = Normalize(vmin=vmin, vmax=vmax)
plt.pcolormesh(t, x, u, cmap='rainbow', shading = 'auto', norm=color_norm)
plt.xlabel('t',fontsize=20)
plt.ylabel('x',fontsize=20)
plt.xticks(fontsize=20)
plt.yticks(fontsize=20)
cbar = plt.colorbar(pad=0.05, aspect=10)
cbar.set_label('u(t,x)', fontsize=20)
cbar.ax.tick_params(labelsize=20)
cbar.mappable.set_clim(vmin, vmax)

# lower panels: prediction vs. exact solution at fixed times
tfrac = np.array([0.25,0.5,0.75])
t_cross_sections = (T*tfrac).tolist()
# column of `usol` matching each cross-section time
idx = [int(k) for k in (num_test_samples*tfrac)]

for i, t_cs in enumerate(t_cross_sections):
    plt.subplot(gs[1, i])
    # constant-time column paired with the x grid
    full = np.full(t_flat.shape, t_cs)
    tx = np.stack([full, x_flat], axis=-1)
    u = network.predict(tx, batch_size=num_test_samples)
    #print(u.shape)
    plt.plot(x_flat, u, '.b')
    plt.plot(x_flat, usol[:,idx[i]], 'r--', linewidth = 2)
    plt.title('t = {}'.format(t_cs),fontsize=20)
    plt.xlabel('x',fontsize=20)
    plt.ylabel('u(t,x)',fontsize=20)
    plt.xticks(fontsize=20)
    plt.yticks(fontsize=20)
    plt.ylim(-1,1)
    plt.legend(['Prediction','Exact'], loc = 'upper right',fontsize=8)
plt.tight_layout()
plt.savefig('PINNs_at_'+str(c)+'.png', transparent=True, dpi = 900)
plt.show()
140 |
141 |
--------------------------------------------------------------------------------
/lib/optimizer.py:
--------------------------------------------------------------------------------
1 | import scipy.optimize
2 | import numpy as np
3 | import tensorflow as tf
4 |
class L_BFGS_B:
    """
    Optimize the keras network model using L-BFGS-B algorithm.

    Attributes:
        model: optimization target model.
        x_train: training inputs, stored as a list of float32 tensors.
        y_train: training targets, stored as a list of float32 tensors.
        factr: convergence condition. typical values for factr are: 1e12 for low accuracy;
               1e7 for moderate accuracy; 10 for extremely high accuracy.
        m: maximum number of variable metric corrections used to define the limited memory matrix.
        pgtol: forwarded unchanged to scipy.optimize.fmin_l_bfgs_b.
        epsilon: forwarded unchanged to scipy.optimize.fmin_l_bfgs_b.
        maxls: maximum number of line search steps (per iteration).
        maxiter: maximum number of iterations.
        metrics: logging metrics.
        progbar: progress bar.
    """

    def __init__(self, model, x_train, y_train, m=10, factr=1e7, pgtol=1e-5,
                 epsilon=1e-8, maxiter=5000, maxls=50):
        """
        Args:
            model: optimization target model.
            x_train: list of training inputs, one array per model input.
            y_train: list of training targets, one array per model output.
            m: maximum number of variable metric corrections used to define the limited memory matrix.
            factr: convergence condition. typical values for factr are: 1e12 for low accuracy;
                   1e7 for moderate accuracy; 10.0 for extremely high accuracy.
            pgtol: forwarded unchanged to scipy.optimize.fmin_l_bfgs_b.
            epsilon: forwarded unchanged to scipy.optimize.fmin_l_bfgs_b.
            maxiter: maximum number of iterations.
            maxls: maximum number of line search steps (per iteration).
        """

        # set attributes
        self.model = model
        self.x_train = [ tf.constant(x, dtype=tf.float32) for x in x_train ]
        self.y_train = [ tf.constant(y, dtype=tf.float32) for y in y_train ]
        self.factr = factr
        self.m = m
        self.pgtol = pgtol
        self.epsilon = epsilon
        self.maxls = maxls
        self.maxiter = maxiter
        self.metrics = ['loss']
        # initialize the progress bar
        self.progbar = tf.keras.callbacks.ProgbarLogger(
            count_mode='steps', stateful_metrics=self.metrics)
        self.progbar.set_params( {
            'verbose':1, 'epochs':1, 'steps':self.maxiter, 'metrics':self.metrics})

    def set_weights(self, flat_weights):
        """
        Set weights to the model.

        Args:
            flat_weights: flatten weights.
        """

        # shapes of the model weights, in the order keras reports them
        shapes = [ w.shape for w in self.model.get_weights() ]
        # number of entries per weight; an integer dtype is forced because
        # np.prod of an empty shape (a scalar weight) is otherwise a float,
        # which would turn the slice indices below into floats
        sizes = [ int(np.prod(shape, dtype=np.int64)) for shape in shapes ]
        # compute splitting indices
        split_ids = np.cumsum([0] + sizes)
        # reshape weights
        weights = [ flat_weights[from_id:to_id].reshape(shape)
            for from_id, to_id, shape in zip(split_ids[:-1], split_ids[1:], shapes) ]
        # set weights to the model
        self.model.set_weights(weights)

    @tf.function
    def tf_evaluate(self, x, y):
        """
        Evaluate loss and gradients for weights as tf.Tensor.

        Args:
            x: input data.
            y: target data.

        Returns:
            loss and gradients for weights as tf.Tensor.
        """

        with tf.GradientTape() as g:
            loss = tf.reduce_mean(tf.keras.losses.mse(self.model(x), y))
        grads = g.gradient(loss, self.model.trainable_variables)
        return loss, grads

    def evaluate(self, weights):
        """
        Evaluate loss and gradients for weights as ndarray.

        Args:
            weights: flatten weights.

        Returns:
            loss and gradients for weights as ndarray.
        """

        # update weights
        self.set_weights(weights)
        # compute loss and gradients for weights
        loss, grads = self.tf_evaluate(self.x_train, self.y_train)
        # convert tf.Tensor to flatten ndarray (float64, as handed back to scipy)
        loss = loss.numpy().astype('float64')
        grads = np.concatenate([ g.numpy().flatten() for g in grads ]).astype('float64')

        return loss, grads

    def callback(self, weights):
        """
        Callback that prints the progress to stdout.

        Args:
            weights: flatten weights.
        """
        self.progbar.on_batch_begin(0)
        loss, _ = self.evaluate(weights)
        self.progbar.on_batch_end(0, logs=dict(zip(self.metrics, [loss])))

    def fit(self):
        """
        Train the model using L-BFGS-B algorithm.

        After the optimizer returns, the model is left holding the weight
        vector scipy reports as the optimum.
        """

        # get initial weights as a flat vector
        initial_weights = np.concatenate(
            [ w.flatten() for w in self.model.get_weights() ])
        # optimize the weight vector
        print('Optimizer: L-BFGS-B (maxiter={})'.format(self.maxiter))
        self.progbar.on_train_begin()
        self.progbar.on_epoch_begin(1)

        # self.evaluate returns (loss, gradient), so no numerical
        # approximation of the gradient is requested
        optimum, _, _ = scipy.optimize.fmin_l_bfgs_b(func=self.evaluate,
                                                     x0=initial_weights,
                                                     factr=self.factr,
                                                     pgtol=self.pgtol,
                                                     epsilon=self.epsilon,
                                                     m=self.m,
                                                     maxls=self.maxls,
                                                     maxiter=self.maxiter,
                                                     callback=self.callback)

        # the model otherwise keeps whatever weights were evaluated last;
        # store the returned optimum explicitly
        self.set_weights(optimum)

        self.progbar.on_epoch_end(1)
        self.progbar.on_train_end()
183 |
--------------------------------------------------------------------------------
/BOPINN.py:
--------------------------------------------------------------------------------
1 | import numpy as np
2 | import tensorflow as tf
3 | import matplotlib.pyplot as plt
4 | from lib.pinn_wave import PINN
5 | from lib.network import Network
6 | from lib.optimizer import L_BFGS_B
7 | import math
8 | from bayes_opt import BayesianOptimization, UtilityFunction
9 | import scipy.io
10 | import os
11 | from os.path import join
12 | import time
13 |
# number of training samples
num_train_samples = 25000

# number of test samples
num_test_samples = 5000

# Other variables
L = 10
n = L
T = 1

# define x,t for PINNs prediction
x_test = np.linspace(0,L,num_test_samples)
t_test = np.linspace(0,T,num_test_samples)

# upload the snapshot observation
# Raw string: the backslashes of this Windows path are literal characters;
# in a plain literal "\M", "\d" and "\B" are unrecognized escape sequences.
path = r"E:\MSR\data\BOPINN\data"
# os.listdir returns entries in arbitrary order; sort them so that the index
# below always selects the same file
dir_list = sorted(os.listdir(path))
print("Files in directory",dir_list)

idx_data = 3 # 0,3,6
data = dir_list[idx_data]
print("Imported file", data)

file = join(path, data)
u_analy = scipy.io.loadmat(file)
# the snapshot is stored under the key 'a1'
u_analy = u_analy['a1']

# plot the snapshot observation
fig = plt.figure(figsize=(7,4))
plt.plot(x_test,u_analy, '-', linewidth = 2)
plt.xlabel('$x$', fontsize = 15)
plt.ylabel('Normalized u(x,t)', fontsize = 15)
plt.xticks(fontsize = 12)
plt.yticks(fontsize = 12)

# time of observation
tilde_t = 0.25
52 |
53 | #%% Initial conditions
def u0(t):
    """Return -sin(pi * t), the profile used as the initial condition."""
    return -np.sin(1*math.pi*t)
57 |
def du0_dt(tx):
    """
    Differentiate u0 with respect to the first input column via a gradient tape.

    NOTE(review): u0 is written with NumPy, so the tape presumably cannot
    trace it; this helper is not called in the visible script - confirm
    before relying on it.
    """
    with tf.GradientTape() as tape:
        tape.watch(tx)
        u = u0(tx)
    jacobian = tape.batch_jacobian(u, tx)
    # keep only the derivative with respect to the first input column
    du_dt = jacobian[..., 0]
    return du_dt
64 |
def RMS(S):
    """Return the root-mean-square value of the array S."""
    mean_square = np.mean(S**2)
    return np.sqrt(mean_square)
68 |
#%% collocation points
# equation points: uniform samples scaled to t in [0, T], x in [0, L]
tx_eqn = np.random.rand(num_train_samples, 2)
tx_eqn[:, 0] *= T
tx_eqn[:, 1] *= L

# initial-condition points: t fixed at 0, x in [0, L]
tx_ini = np.random.rand(num_train_samples, 2)
tx_ini[:, 0] = 0
tx_ini[:, 1] *= L

# boundary points: t in [0, T], x snapped to either 0 or L
tx_bnd = np.random.rand(num_train_samples, 2)
tx_bnd[:, 0] *= T
tx_bnd[:, 1] = L*np.round(tx_bnd[:, 1])

# initial and boundary conditions (training targets)
u_zero = np.zeros((num_train_samples, 1))     # equation residual and boundary value
u_ini = u0(tx_ini[:, 1:2])                    # initial profile at the sampled x
du_dt_ini = np.zeros((num_train_samples, 1))  # zero initial time derivative
90 |
91 | #%% g(c) = (u_pred - u_true)^2; u_pred via PINNs
92 |
def model_builder(ic):
    """
    Objective function for Bayesian optimization: train a fresh PINN at wave
    speed `ic` and score it against the snapshot observation.

    Args:
        ic: candidate wave speed.

    Returns:
        negative mean squared error between the PINN prediction at the
        observation time and the snapshot (negated because the optimizer
        maximizes its target).
    """
    print('\n ## ->>>> PINNs simulation at speed = ' + str(ic))

    # This function is called many times in one process; release the Keras
    # global state left behind by models of earlier calls so memory use does
    # not keep growing.
    tf.keras.backend.clear_session()

    # build a PINN model
    network = Network.build()
    pinn = PINN(network,ic).build()

    # train the model using L-BFGS-B algorithm
    begin = time.time()
    x_train = [tx_eqn, tx_ini, tx_bnd]
    y_train = [u_zero, u_ini, du_dt_ini, u_zero]
    lbfgs = L_BFGS_B(model=pinn, x_train=x_train, y_train=y_train)
    lbfgs.fit()
    end = time.time()
    totaltime = end-begin
    print("\n Total runtime is (min.)",totaltime/60)

    # test the model on the x grid at the observation time
    tx = np.stack([np.full(t_test.shape, tilde_t), x_test], axis=-1)
    u_pred = network.predict(tx, batch_size=num_test_samples)

    # negative mse between u_pred via PINN and snapshot observation
    mse = -np.mean(np.square(u_analy - u_pred))

    return mse
121 |
#%% Bayesian Optimization
# Attributes of BO
itt_explore = 5                 # random exploration points per run
itt = 45                        # guided iterations per run
itt_all = itt_explore + itt
n_runs = 10                     # independent repetitions of the optimization

# bounds of BO
pbounds = {'ic': (0.1, 1)}

# Start BO
mse_star_all = []   # best target value of every run
cstar_all = []      # wave speed that achieved it
mse_all_all = []    # every target value of every run
ic_all_all = []     # every queried wave speed of every run

for r in range(n_runs):
    print('\n ## ->>>> Run = ' + str(r))

    # define the model
    optimizer = BayesianOptimization(
        f=model_builder,
        pbounds=pbounds,
        allow_duplicate_points=True)

    # utility function
    util = UtilityFunction(kind='ucb',
                           kappa=2.576,
                           kappa_decay=1,
                           kappa_decay_delay=0)

    # run the model
    optimizer.maximize(init_points=itt_explore,
                       n_iter=itt,
                       acquisition_function=util)

    soln = optimizer.max
    resi = optimizer.res

    # optimum values, read by key rather than by position in the dict
    mse_star = soln['target']
    cstar = soln['params']
    cstar2 = cstar['ic']

    # append all optimum values
    mse_star_all.append(mse_star)
    cstar_all.append(cstar2)

    # all run values
    mse_all = [res['target'] for res in resi]
    ic_all = [res['params']['ic'] for res in resi]

    mse_all_all.append(np.array(mse_all))
    ic_all_all.append(np.array(ic_all))

    del optimizer

mse_all_all = np.array(mse_all_all)
mse_star_all = np.array(mse_star_all)
ic_all_all = np.array(ic_all_all)
cstar_all = np.array(cstar_all)
191 |
#%% Process the BO results
# best, worst, mean and spread of the per-run optimum target values
max_mse_star_allruns = np.max(mse_star_all)
min_mse_star_allruns = np.min(mse_star_all)
mean_mse_star_allruns = np.mean(mse_star_all)
std_mse_star_allruns = np.std(mse_star_all)

# runs in which the best / worst optimum target value was reached
idx_max_mse_star_allruns = np.where(mse_star_all == max_mse_star_allruns)
idx_min_mse_star_allruns = np.where(mse_star_all == min_mse_star_allruns)

# wave speeds of those runs, plus mean and spread over all runs
max_cstar_allruns = cstar_all[idx_max_mse_star_allruns]
min_cstar_allruns = cstar_all[idx_min_mse_star_allruns]
mean_cstar_allruns = np.mean(cstar_all)
std_cstar_allruns = np.std(cstar_all)

print("Max (best optimal) tf across runs = ",max_mse_star_allruns)
print("Min (least optimal) tf across runs = ",min_mse_star_allruns)
print("Mean tf across runs = ",mean_mse_star_allruns)
print("Std tf across runs = ",std_mse_star_allruns)

print("Max (best optimal) c* across runs = ",max_cstar_allruns)
print("Min (least optimal) c* across runs = ",min_cstar_allruns)
print("Mean c* across runs = ",mean_cstar_allruns)
print("Std c* across runs = ",std_cstar_allruns)
215 |
#%% plot the BO results
# Position of each run's best target value inside that run's own history.
idx_max_all = []
for i in range(mse_all_all.shape[0]):
    idx_max = np.where(mse_all_all[i, :] == mse_star_all[i])[0][0]
    idx_max_all.append(idx_max)

# Per-iteration mean and standard deviation taken across the runs.
mean_mse_all = mse_all_all.mean(axis=0)
std_mse_all = mse_all_all.std(axis=0)
mean_ic_all = ic_all_all.mean(axis=0)
std_ic_all = ic_all_all.std(axis=0)

# History and optimum of the run that reached the largest target value
# (first such run if several tie).
best_run = idx_max_mse_star_allruns[0][0]
opt_mse_run = mse_all_all[best_run]
opt_c_run = ic_all_all[best_run]
opt_mse = mse_star_all[best_run]
opt_c = cstar_all[best_run]

# tf vs c: all probes of the best run in blue, its optimum as a red star
txt = 'c* = ' + str(round(opt_c, 4))
fig_name = 'tfvsc_' + str(idx_data + 1) + '.png'

plt.figure(figsize=(8, 6))
plt.plot(opt_c_run, opt_mse_run, 'ob', markersize=6)
plt.plot(opt_c, opt_mse, '*r', markersize=8, label='Best optima')
#plt.text(0.75, -0.03, txt, fontsize=18, c = 'r')
plt.xlabel("velocity, c", fontsize=20)
plt.ylabel("target function, g(c)", fontsize=20)
plt.xticks(fontsize=20)
plt.yticks(fontsize=20)
plt.legend(fontsize=14, loc='upper left')
plt.savefig(fig_name, bbox_inches='tight', dpi=600)
plt.show()
--------------------------------------------------------------------------------
/BOPINN.ipynb:
--------------------------------------------------------------------------------
1 | {
2 | "cells": [
3 | {
4 | "cell_type": "markdown",
5 | "source": [
6 | "## Colab computing infra available\n",
7 | "### Preliminaries\n",
8 | "#### 1. Runtime -> Change runtime type -> T4 GPU\n",
9 | "#### 2. Upload the data folder from the GitHub repository to your Google Drive.\n",
10 | "#### 3. Except for the first three cells, this notebook can also be run in Jupyter.\n",
11 | "#### 4. For 3., run `pip install bayesian-optimization` in your Anaconda TensorFlow environment."
12 | ],
13 | "metadata": {
14 | "id": "XW60sZt3HGKv"
15 | }
16 | },
17 | {
18 | "cell_type": "code",
19 | "source": [
20 | "#GPU count and name\n",
21 | "!nvidia-smi -L\n",
22 | "!lscpu |grep 'Model name'\n",
23 | "#no.of sockets i.e available slots for physical processors\n",
24 | "!lscpu | grep 'Socket(s):'\n",
25 | "#no.of cores each processor is having\n",
26 | "!lscpu | grep 'Core(s) per socket:'\n",
27 | "#no.of threads each core is having\n",
28 | "!lscpu | grep 'Thread(s) per core'\n",
29 | "!lscpu | grep \"L3 cache\"\n",
30 | "#if it had turbo boost it would've shown Min and Max MHz also but it is only showing current frequency this means it always operates at 2.3GHz\n",
31 | "!lscpu | grep \"MHz\"\n",
32 | "#memory that we can use\n",
33 | "!cat /proc/meminfo | grep 'MemAvailable'\n",
34 | "#hard disk that we can use\n",
35 | "!df -h / | awk '{print $4}'"
36 | ],
37 | "metadata": {
38 | "id": "8iHIF9ANB7W-",
39 | "colab": {
40 | "base_uri": "https://localhost:8080/"
41 | },
42 | "outputId": "677a2eac-9246-478b-f44c-cbeef270bda4"
43 | },
44 | "execution_count": null,
45 | "outputs": [
46 | {
47 | "output_type": "stream",
48 | "name": "stdout",
49 | "text": [
50 | "GPU 0: Tesla T4 (UUID: GPU-2429e038-2c60-04b9-d3a5-5573f49827da)\n",
51 | "Model name: Intel(R) Xeon(R) CPU @ 2.30GHz\n",
52 | "Socket(s): 1\n",
53 | "Core(s) per socket: 1\n",
54 | "Thread(s) per core: 2\n",
55 | "L3 cache: 45 MiB (1 instance)\n",
56 | "MemAvailable: 12416136 kB\n",
57 | "Avail\n",
58 | "52G\n"
59 | ]
60 | }
61 | ]
62 | },
63 | {
64 | "cell_type": "code",
65 | "source": [
66 | "# mount google drive\n",
67 | "from google.colab import drive\n",
68 | "drive.mount('/content/gdrive')\n",
69 | "path = 'gdrive/MyDrive/BOPINN/data'"
70 | ],
71 | "metadata": {
72 | "id": "q_ae9KDsC2Q1",
73 | "colab": {
74 | "base_uri": "https://localhost:8080/"
75 | },
76 | "outputId": "6d816703-0158-473b-a2c5-95e4b09b1c99"
77 | },
78 | "execution_count": null,
79 | "outputs": [
80 | {
81 | "output_type": "stream",
82 | "name": "stdout",
83 | "text": [
84 | "Drive already mounted at /content/gdrive; to attempt to forcibly remount, call drive.mount(\"/content/gdrive\", force_remount=True).\n"
85 | ]
86 | }
87 | ]
88 | },
89 | {
90 | "cell_type": "code",
91 | "source": [
92 | "# install Bayesian optimization library \"https://github.com/bayesian-optimization/BayesianOptimization\"\n",
93 | "%pip install bayesian-optimization==1.4.1\n",
94 | "from bayes_opt import BayesianOptimization,UtilityFunction"
95 | ],
96 | "metadata": {
97 | "colab": {
98 | "base_uri": "https://localhost:8080/"
99 | },
100 | "id": "CrbZE4FvZhbf",
101 | "outputId": "7cbc93bf-ae8b-4936-9fa9-70eb3727dcfb"
102 | },
103 | "execution_count": null,
104 | "outputs": [
105 | {
106 | "output_type": "stream",
107 | "name": "stdout",
108 | "text": [
109 | "Requirement already satisfied: bayesian-optimization==1.4.1 in /usr/local/lib/python3.10/dist-packages (1.4.1)\n",
110 | "Requirement already satisfied: numpy>=1.9.0 in /usr/local/lib/python3.10/dist-packages (from bayesian-optimization==1.4.1) (1.23.5)\n",
111 | "Requirement already satisfied: scipy>=1.0.0 in /usr/local/lib/python3.10/dist-packages (from bayesian-optimization==1.4.1) (1.11.4)\n",
112 | "Requirement already satisfied: scikit-learn>=0.18.0 in /usr/local/lib/python3.10/dist-packages (from bayesian-optimization==1.4.1) (1.2.2)\n",
113 | "Requirement already satisfied: colorama in /usr/local/lib/python3.10/dist-packages (from bayesian-optimization==1.4.1) (0.4.6)\n",
114 | "Requirement already satisfied: joblib>=1.1.1 in /usr/local/lib/python3.10/dist-packages (from scikit-learn>=0.18.0->bayesian-optimization==1.4.1) (1.3.2)\n",
115 | "Requirement already satisfied: threadpoolctl>=2.0.0 in /usr/local/lib/python3.10/dist-packages (from scikit-learn>=0.18.0->bayesian-optimization==1.4.1) (3.2.0)\n"
116 | ]
117 | }
118 | ]
119 | },
120 | {
121 | "cell_type": "markdown",
122 | "source": [
123 | "## In-built classes"
124 | ],
125 | "metadata": {
126 | "id": "qECf7VXwCvKO"
127 | }
128 | },
129 | {
130 | "cell_type": "markdown",
131 | "source": [
132 | "### Gradient Tape"
133 | ],
134 | "metadata": {
135 | "id": "GQQzlB87IQS1"
136 | }
137 | },
138 | {
139 | "cell_type": "code",
140 | "source": [
141 | "import tensorflow as tf\n",
142 | "import numpy as np\n",
143 | "import matplotlib.pyplot as plt\n",
144 | "\n",
145 | "class GradientLayer(tf.keras.layers.Layer):\n",
146 | " \"\"\"\n",
147 | " Custom layer to compute 1st and 2nd derivatives for the wave equation.\n",
148 | "\n",
149 | " Attributes:\n",
150 | " model: keras network model.\n",
151 | " \"\"\"\n",
152 | "\n",
153 | " def __init__(self, model, **kwargs):\n",
154 | " \"\"\"\n",
155 | " Args:\n",
156 | " model: keras network model.\n",
157 | " \"\"\"\n",
158 | "\n",
159 | " self.model = model\n",
160 | " super().__init__(**kwargs)\n",
161 | "\n",
162 | " def call(self, tx):\n",
163 | " \"\"\"\n",
164 | " Computing 1st and 2nd derivatives for the wave equation.\n",
165 | "\n",
166 | " Args:\n",
167 | " tx: input variables (t, x).\n",
168 | "\n",
169 | " Returns:\n",
170 | " u: network output.\n",
171 | " du_dt: 1st derivative of u with respect to t.\n",
172 | " du_dx: 1st derivative of u with respect to x.\n",
173 | " d2u_dt2: 2nd derivative of u with respect to t.\n",
174 | " d2u_dx2: 2nd derivative of u with respect to x.\n",
175 | " \"\"\"\n",
176 | "\n",
177 | " with tf.GradientTape() as g:\n",
178 | " g.watch(tx)\n",
179 | " with tf.GradientTape() as gg:\n",
180 | " gg.watch(tx)\n",
181 | " u = self.model(tx)\n",
182 | " du_dtx = gg.batch_jacobian(u, tx)\n",
183 | " du_dt = du_dtx[..., 0]\n",
184 | " du_dx = du_dtx[..., 1]\n",
185 | " d2u_dtx2 = g.batch_jacobian(du_dtx, tx)\n",
186 | " d2u_dt2 = d2u_dtx2[..., 0, 0]\n",
187 | " d2u_dx2 = d2u_dtx2[..., 1, 1]\n",
188 | "\n",
189 | " return u, du_dt, du_dx, d2u_dt2, d2u_dx2"
190 | ],
191 | "metadata": {
192 | "id": "8GmwN5gSIOr2"
193 | },
194 | "execution_count": null,
195 | "outputs": []
196 | },
197 | {
198 | "cell_type": "markdown",
199 | "source": [
200 | "### PINNs"
201 | ],
202 | "metadata": {
203 | "id": "e7-8pYNbDJEv"
204 | }
205 | },
206 | {
207 | "cell_type": "code",
208 | "source": [
209 | "class PINN:\n",
210 | " \"\"\"\n",
211 | " Build a physics informed neural network (PINN) model for the wave equation.\n",
212 | "\n",
213 | " Attributes:\n",
214 | " network: keras network model with input (t, x) and output u(t, x).\n",
215 | " c: wave velocity.\n",
216 | " grads: gradient layer.\n",
217 | " \"\"\"\n",
218 | "\n",
219 | " def __init__(self, network, c):\n",
220 | " \"\"\"\n",
221 | " Args:\n",
222 | " network: keras network model with input (t, x) and output u(t, x).\n",
223 | " c: wave velocity (required; no default value).\n",
224 | " \"\"\"\n",
225 | "\n",
226 | " self.network = network\n",
227 | " self.c = c\n",
228 | " self.grads = GradientLayer(self.network)\n",
229 | "\n",
230 | " def build(self):\n",
231 | " \"\"\"\n",
232 | " Build a PINN model for the wave equation.\n",
233 | "\n",
234 | " Returns:\n",
235 | " PINN model for the wave equation with\n",
236 | " input: [ (t, x) relative to equation,\n",
237 | " (t=0, x) relative to initial condition,\n",
238 | " (t, x=bounds) relative to boundary condition ],\n",
239 | " output: [ u(t,x) relative to equation,\n",
240 | " u(t=0, x) relative to initial condition,\n",
241 | " du_dt(t=0, x) relative to initial derivative of t,\n",
242 | " u(t, x=bounds) relative to boundary condition ]\n",
243 | " \"\"\"\n",
244 | "\n",
245 | " # equation input: (t, x)\n",
246 | " tx_eqn = tf.keras.layers.Input(shape=(2,))\n",
247 | " # initial condition input: (t=0, x)\n",
248 | " tx_ini = tf.keras.layers.Input(shape=(2,))\n",
249 | " # boundary condition input: (t, x=-1) or (t, x=+1)\n",
250 | " tx_bnd = tf.keras.layers.Input(shape=(2,))\n",
251 | "\n",
252 | " # compute gradients\n",
253 | " _, _, _, d2u_dt2, d2u_dx2 = self.grads(tx_eqn)\n",
254 | "\n",
255 | " # equation output being zero\n",
256 | " u_eqn = d2u_dt2 - self.c*self.c * d2u_dx2\n",
257 | " # initial condition output\n",
258 | " u_ini, du_dt_ini, _, _, _ = self.grads(tx_ini)\n",
259 | " # boundary condition output\n",
260 | " u_bnd = self.network(tx_bnd) # dirichlet\n",
261 | " #_, _, u_bnd, _, _ = self.grads(tx_bnd) # neumann\n",
262 | "\n",
263 | " # build the PINN model for the wave equation\n",
264 | " return tf.keras.models.Model(\n",
265 | " inputs=[tx_eqn, tx_ini, tx_bnd],\n",
266 | " outputs=[u_eqn, u_ini, du_dt_ini, u_bnd])"
267 | ],
268 | "metadata": {
269 | "id": "N_6QYlj4C04v"
270 | },
271 | "execution_count": null,
272 | "outputs": []
273 | },
274 | {
275 | "cell_type": "markdown",
276 | "source": [
277 | "### Network for PINN"
278 | ],
279 | "metadata": {
280 | "id": "ZWPMeef1DLeA"
281 | }
282 | },
283 | {
284 | "cell_type": "code",
285 | "source": [
286 | "class Network:\n",
287 | " \"\"\"\n",
288 | " Build a physics informed neural network (PINN) model for the wave equation.\n",
289 | " \"\"\"\n",
290 | "\n",
291 | " @classmethod\n",
292 | " def build(cls, num_inputs=2, layers=[64, 128, 128, 128, 128, 64], activation='tanh', num_outputs=1):\n",
293 | " \"\"\"\n",
294 | " Build a PINN model for the wave equation with input shape (t, x) and output shape u(t, x).\n",
295 | "\n",
296 | " Args:\n",
297 | " num_inputs: number of input variables. Default is 2 for (t, x).\n",
298 | " layers: number of units in each hidden layer (one entry per layer).\n",
299 | " activation: activation function in hidden layers.\n",
300 | " num_outputs: number of output variables. Default is 1 for u(t, x).\n",
301 | "\n",
302 | " Returns:\n",
303 | " keras network model.\n",
304 | " \"\"\"\n",
305 | "\n",
306 | " # input layer\n",
307 | " inputs = tf.keras.layers.Input(shape=(num_inputs,))\n",
308 | " # hidden layers\n",
309 | " x = inputs\n",
310 | " for layer in layers:\n",
311 | " x = tf.keras.layers.Dense(layer, activation=activation,\n",
312 | " kernel_initializer='he_normal')(x)\n",
313 | " x = tf.keras.layers.Dropout(0.1)(x)\n",
314 | " # output layer\n",
315 | " outputs = tf.keras.layers.Dense(num_outputs,\n",
316 | " kernel_initializer='he_normal')(x)\n",
317 | "\n",
318 | " return tf.keras.models.Model(inputs=inputs, outputs=outputs)"
319 | ],
320 | "metadata": {
321 | "id": "YqrofsFgDNXR"
322 | },
323 | "execution_count": null,
324 | "outputs": []
325 | },
326 | {
327 | "cell_type": "markdown",
328 | "source": [
329 | "### Optimizer for PINN"
330 | ],
331 | "metadata": {
332 | "id": "ipTUkVObDT3M"
333 | }
334 | },
335 | {
336 | "cell_type": "code",
337 | "source": [
338 | "import scipy.optimize\n",
339 | "\n",
340 | "class L_BFGS_B:\n",
341 | " \"\"\"\n",
342 | " Optimize the keras network model using L-BFGS-B algorithm.\n",
343 | "\n",
344 | " Attributes:\n",
345 | " model: optimization target model.\n",
346 | " x_train, y_train: training inputs and targets.\n",
347 | " factr: convergence condition. typical values for factr are: 1e12 for low accuracy;\n",
348 | " 1e7 for moderate accuracy; 10 for extremely high accuracy.\n",
349 | " m: maximum number of variable metric corrections used to define the limited memory matrix.\n",
350 | " maxls: maximum number of line search steps (per iteration).\n",
351 | " maxiter: maximum number of iterations.\n",
352 | " metrics: logging metrics.\n",
353 | " progbar: progress bar.\n",
354 | " \"\"\"\n",
355 | "\n",
356 | " def __init__(self, model, x_train, y_train, m=10, factr=1e7, pgtol=1e-5,\n",
357 | " epsilon=1e-8, maxiter=5000, maxls=50):\n",
358 | " \"\"\"\n",
359 | " Args:\n",
360 | " model: optimization target model.\n",
361 | " x_train, y_train: training inputs and targets.\n",
362 | " factr: convergence condition. typical values for factr are: 1e12 for low accuracy;\n",
363 | " 1e7 for moderate accuracy; 10.0 for extremely high accuracy.\n",
364 | " m: maximum number of variable metric corrections used to define the limited memory matrix.\n",
365 | " maxls: maximum number of line search steps (per iteration).\n",
366 | " maxiter: maximum number of iterations.\n",
367 | " \"\"\"\n",
368 | "\n",
369 | " # set attributes\n",
370 | " self.model = model\n",
371 | " self.x_train = [ tf.constant(x, dtype=tf.float32) for x in x_train ]\n",
372 | " self.y_train = [ tf.constant(y, dtype=tf.float32) for y in y_train ]\n",
373 | " self.factr = factr\n",
374 | " self.m = m\n",
375 | " self.pgtol = pgtol\n",
376 | " self.epsilon = epsilon\n",
377 | " self.maxls = maxls\n",
378 | " self.maxiter = maxiter\n",
379 | " self.metrics = ['loss']\n",
380 | " # initialize the progress bar\n",
381 | " self.progbar = tf.keras.callbacks.ProgbarLogger(\n",
382 | " count_mode='steps', stateful_metrics=self.metrics)\n",
383 | " self.progbar.set_params( {\n",
384 | " 'verbose':1, 'epochs':1, 'steps':self.maxiter, 'metrics':self.metrics})\n",
385 | "\n",
386 | " def set_weights(self, flat_weights):\n",
387 | " \"\"\"\n",
388 | " Set weights to the model.\n",
389 | "\n",
390 | " Args:\n",
391 | " flat_weights: flatten weights.\n",
392 | " \"\"\"\n",
393 | "\n",
394 | " # get model weights\n",
395 | " shapes = [ w.shape for w in self.model.get_weights() ]\n",
396 | " # compute splitting indices\n",
397 | " split_ids = np.cumsum([ np.prod(shape) for shape in [0] + shapes ])\n",
398 | " # reshape weights\n",
399 | " weights = [ flat_weights[from_id:to_id].reshape(shape)\n",
400 | " for from_id, to_id, shape in zip(split_ids[:-1], split_ids[1:], shapes) ]\n",
401 | " # set weights to the model\n",
402 | " self.model.set_weights(weights)\n",
403 | "\n",
404 | " @tf.function\n",
405 | " def tf_evaluate(self, x, y):\n",
406 | " \"\"\"\n",
407 | " Evaluate loss and gradients for weights as tf.Tensor.\n",
408 | "\n",
409 | " Args:\n",
410 | " x: input data.\n",
411 | "\n",
412 | " Returns:\n",
413 | " loss and gradients for weights as tf.Tensor.\n",
414 | " \"\"\"\n",
415 | "\n",
416 | " with tf.GradientTape() as g:\n",
417 | " loss = tf.reduce_mean(tf.keras.losses.mse(self.model(x), y))\n",
418 | " grads = g.gradient(loss, self.model.trainable_variables)\n",
419 | " return loss, grads\n",
420 | "\n",
421 | " def evaluate(self, weights):\n",
422 | " \"\"\"\n",
423 | " Evaluate loss and gradients for weights as ndarray.\n",
424 | "\n",
425 | " Args:\n",
426 | " weights: flatten weights.\n",
427 | "\n",
428 | " Returns:\n",
429 | " loss and gradients for weights as ndarray.\n",
430 | " \"\"\"\n",
431 | "\n",
432 | " # update weights\n",
433 | " self.set_weights(weights)\n",
434 | " # compute loss and gradients for weights\n",
435 | " loss, grads = self.tf_evaluate(self.x_train, self.y_train)\n",
436 | " # convert tf.Tensor to flatten ndarray\n",
437 | " loss = loss.numpy().astype('float64')\n",
438 | " grads = np.concatenate([ g.numpy().flatten() for g in grads ]).astype('float64')\n",
439 | "\n",
440 | " return loss, grads\n",
441 | "\n",
442 | " def callback(self, weights):\n",
443 | " \"\"\"\n",
444 | " Callback that prints the progress to stdout.\n",
445 | "\n",
446 | " Args:\n",
447 | " weights: flatten weights.\n",
448 | " \"\"\"\n",
449 | " self.progbar.on_batch_begin(0)\n",
450 | " loss, _ = self.evaluate(weights)\n",
451 | " self.progbar.on_batch_end(0, logs=dict(zip(self.metrics, [loss])))\n",
452 | "\n",
453 | " def fit(self):\n",
454 | " \"\"\"\n",
455 | " Train the model using L-BFGS-B algorithm.\n",
456 | " \"\"\"\n",
457 | "\n",
458 | " # get initial weights as a flat vector\n",
459 | " initial_weights = np.concatenate(\n",
460 | " [ w.flatten() for w in self.model.get_weights() ])\n",
461 | " # optimize the weight vector\n",
462 | " print('Optimizer: L-BFGS-B (maxiter={})'.format(self.maxiter))\n",
463 | " self.progbar.on_train_begin()\n",
464 | " self.progbar.on_epoch_begin(1)\n",
465 | "\n",
466 | " scipy.optimize.fmin_l_bfgs_b(func=self.evaluate,\n",
467 | " x0=initial_weights,\n",
468 | " factr=self.factr,\n",
469 | " pgtol=self.pgtol,\n",
470 | " epsilon=self.epsilon,\n",
471 | " m=self.m,\n",
472 | " maxls=self.maxls,\n",
473 | " maxiter=self.maxiter,\n",
474 | " callback=self.callback)\n",
475 | "\n",
476 | " self.progbar.on_epoch_end(1)\n",
477 | " self.progbar.on_train_end()\n"
478 | ],
479 | "metadata": {
480 | "id": "RDynBdklDSqh"
481 | },
482 | "execution_count": null,
483 | "outputs": []
484 | },
485 | {
486 | "cell_type": "markdown",
487 | "source": [
488 | "## Upload data (snapshot observation)"
489 | ],
490 | "metadata": {
491 | "id": "WpYtKf8CDl7P"
492 | }
493 | },
494 | {
495 | "cell_type": "code",
496 | "source": [
497 | "#from bayes_opt import BayesianOptimization, UtilityFunction\n",
498 | "import math\n",
499 | "import scipy.io\n",
500 | "import os\n",
501 | "from os.path import join\n",
502 | "import time\n",
503 | "\n",
504 | "# number of training samples: 25000 points were found to be optimal for the resolution of u(x,t) in PINN\n",
505 | "num_train_samples = 25000\n",
506 | "\n",
507 | "# number of test samples\n",
508 | "num_test_samples = 5000\n",
509 | "\n",
510 | "# Other variables\n",
511 | "L = 10\n",
512 | "n = L\n",
513 | "T = 1\n",
514 | "\n",
515 | "# define x,t for PINNs prediction\n",
516 | "x_test = np.linspace(0,L,num_test_samples)\n",
517 | "t_test = np.linspace(0,T,num_test_samples)\n",
518 | "\n",
519 | "# upload the snapshot observation\n",
520 | "dir_list = os.listdir(path) # path defined in 2 cell\n",
521 | "print(\"Files in directory\",dir_list)\n",
522 | "idx_data = 0 # 0,1,2 # which file\n",
523 | "data = dir_list[idx_data]\n",
524 | "print(\"Imported file\", data)\n",
525 | "\n",
526 | "file = join(path, data)\n",
527 | "u_analy = scipy.io.loadmat(file)\n",
528 | "u_analy = u_analy['a1']\n",
529 | "\n",
530 | "# plot the snapshot observation\n",
531 | "fig = plt.figure(figsize=(7,4))\n",
532 | "plt.plot(x_test,u_analy, '-', linewidth = 2)\n",
533 | "plt.title(\"Snapshot observation at = 0.25s\",fontsize=15)\n",
534 | "plt.xlabel('$x$', fontsize = 15)\n",
535 | "plt.ylabel('Normalized u(x,t)', fontsize = 15)\n",
536 | "plt.xticks(fontsize = 12)\n",
537 | "plt.yticks(fontsize = 12)\n",
538 | "\n",
539 | "# time of observation = for PINN prediction of u(x,t) at tilde_t\n",
540 | "tilde_t = 0.25"
541 | ],
542 | "metadata": {
543 | "id": "_3cuJlPqCHZd",
544 | "colab": {
545 | "base_uri": "https://localhost:8080/",
546 | "height": 459
547 | },
548 | "outputId": "d5169459-39aa-4294-d7cb-127b58634e5e"
549 | },
550 | "execution_count": null,
551 | "outputs": [
552 | {
553 | "output_type": "stream",
554 | "name": "stdout",
555 | "text": [
556 | "Files in directory ['u_analytic_c=0.2t=0.25snr=39.36.mat', 'u_analytic_c=0.55t=0.25snr=38.91.mat', 'u_analytic_c=0.85t=0.25snr=37.5.mat']\n",
557 | "Imported file u_analytic_c=0.2t=0.25snr=39.36.mat\n"
558 | ]
559 | },
560 | {
561 | "output_type": "display_data",
562 | "data": {
563 | "text/plain": [
564 | ""
565 | ],
566 | "image/png": "\n"
567 | },
568 | "metadata": {}
569 | }
570 | ]
571 | },
572 | {
573 | "cell_type": "markdown",
574 | "source": [
575 | "## Collocation points"
576 | ],
577 | "metadata": {
578 | "id": "mPj-1ODfEFhe"
579 | }
580 | },
581 | {
582 | "cell_type": "code",
583 | "source": [
584 | "#%% Initial conditions\n",
585 | "def u0(t):\n",
586 | " z = -np.sin(1*math.pi*t)\n",
587 | " return z\n",
588 | "\n",
589 | "def du0_dt(tx):\n",
590 | " with tf.GradientTape() as g:\n",
591 | " g.watch(tx)\n",
592 | " u = u0(tx)\n",
593 | " du_dt = g.batch_jacobian(u, tx)[..., 0]\n",
594 | " return du_dt\n",
595 | "\n",
596 | "def RMS(S):\n",
597 | " rms = np.sqrt(np.mean(S**2))\n",
598 | " return rms\n",
599 | "\n",
600 | "#%% collocation points\n",
601 | "# create training input\n",
602 | "tx_eqn = np.random.rand(num_train_samples, 2)\n",
603 | "tx_eqn[..., 0] = T*tx_eqn[..., 0] # t = 0 ~ +1\n",
604 | "tx_eqn[..., 1] = L*tx_eqn[..., 1] # x = 0 ~ +10\n",
605 | "#print('\\nShape of t_eqn ==>',tx_eqn.shape)\n",
606 | "\n",
607 | "tx_ini = np.random.rand(num_train_samples, 2)\n",
608 | "tx_ini[..., 0] = 0 # t = 0\n",
609 | "tx_ini[..., 1] = L*tx_ini[..., 1] # x = 0 ~ +10\n",
610 | "#print('\\nShape of tx_ini ==>',tx_ini.shape)\n",
611 | "\n",
612 | "tx_bnd = np.random.rand(num_train_samples, 2)\n",
613 | "tx_bnd[..., 0] = T*tx_bnd[..., 0] # t = 0 ~ +1\n",
614 | "tx_bnd[..., 1] = L*np.round(tx_bnd[..., 1]) # x = 0 or +10\n",
615 | "#print('\\nShape of tx_bnd ==>',tx_bnd.shape)\n",
616 | "\n",
617 | "# initial and boundary conditions\n",
618 | "u_zero = np.zeros((num_train_samples, 1))\n",
619 | "u_ini = u0(tx_ini[:,1,None])\n",
620 | "du_dt_ini = np.zeros((num_train_samples, 1))"
621 | ],
622 | "metadata": {
623 | "id": "xHHrWjfvCeaP"
624 | },
625 | "execution_count": null,
626 | "outputs": []
627 | },
628 | {
629 | "cell_type": "markdown",
630 | "source": [
631 | "## Target function or objective function for BOPINN"
632 | ],
633 | "metadata": {
634 | "id": "_3hVo0wKEOyZ"
635 | }
636 | },
637 | {
638 | "cell_type": "code",
639 | "source": [
640 | "#%% Target function or objective function, g(c) = -mean((u_pred - u_true)^2); u_pred via PINNs\n",
641 | "def model_builder(ic):\n",
642 | " #ic = hp.Float('ic', min_value=0.1, max_value=1, step=10)\n",
643 | " print('\\n ## ->>>> PINNs simulation at speed = ' + str(ic))\n",
644 | "\n",
645 | " # build a PINN model\n",
646 | " network = Network.build()\n",
647 | " pinn = PINN(network,ic).build()\n",
648 | "\n",
649 | " # train the model using L-BFGS-B algorithm\n",
650 | " begin = time.time()\n",
651 | " x_train = [tx_eqn, tx_ini, tx_bnd]\n",
652 | " y_train = [u_zero, u_ini, du_dt_ini, u_zero]\n",
653 | " lbfgs = L_BFGS_B(model=pinn, x_train=x_train, y_train=y_train)\n",
654 | " lbfgs.fit()\n",
655 | " end = time.time()\n",
656 | " totaltime = end-begin\n",
657 | " print(\"\\n Total runtime is (min.)\",totaltime/60)\n",
658 | "\n",
659 | " # test the model\n",
660 | " tx = np.stack([np.full(t_test.shape, tilde_t), x_test], axis=-1)\n",
661 | " u_pred = network.predict(tx, batch_size=num_test_samples)\n",
662 | "\n",
663 | " # mse between u_pred via PINN and snapshot observation\n",
664 | " mse = -np.mean(np.square(u_analy - u_pred))\n",
665 | "\n",
666 | " del network, pinn, lbfgs, u_pred\n",
667 | "\n",
668 | " return mse"
669 | ],
670 | "metadata": {
671 | "id": "Q2NA5OvMCg64"
672 | },
673 | "execution_count": null,
674 | "outputs": []
675 | },
676 | {
677 | "cell_type": "markdown",
678 | "source": [
679 | "## Training"
680 | ],
681 | "metadata": {
682 | "id": "bJ-eT6gwEYSH"
683 | }
684 | },
685 | {
686 | "cell_type": "code",
687 | "source": [
688 | "#%% Bayesian Optimization\n",
689 | "# Attributes of BO\n",
690 | "itt_explore = 5\n",
691 | "itt = 45\n",
692 | "itt_all = itt_explore + itt\n",
693 | "n_runs = 10 # reduce this if colab has limited capability\n",
694 | "\n",
695 | "# bounds of BO\n",
696 | "pbounds = {'ic': (0.1, 1)}\n",
697 | "\n",
698 | "# Start BO\n",
699 | "mse_star_all = []\n",
700 | "cstar_all = []\n",
701 | "mse_all_all = []\n",
702 | "ic_all_all = []\n",
703 | "\n",
704 | "for r in range(n_runs):\n",
705 | " print('\\n ## ->>>> Run = ' + str(r))\n",
706 | "\n",
707 | " # define the model\n",
708 | " optimizer = BayesianOptimization(\n",
709 | " f=model_builder,\n",
710 | " pbounds=pbounds,\n",
711 | " allow_duplicate_points=True)\n",
712 | "\n",
713 | " # utility function\n",
714 | " util = UtilityFunction(kind='ucb',\n",
715 | " kappa=2.576,\n",
716 | " xi=0.0,\n",
717 | " kappa_decay=1,\n",
718 | " kappa_decay_delay=0)\n",
719 | "\n",
720 | " # run the model\n",
721 | " optimizer.maximize(init_points=itt_explore,\n",
722 | " n_iter=itt,\n",
723 | " acquisition_function=util)\n",
724 | "\n",
725 | " soln = optimizer.max\n",
726 | " resi = optimizer.res\n",
727 | "\n",
728 | " # optimum values\n",
729 | " mse_star = list(soln.values())[0]\n",
730 | " cstar = list(soln.values())[1]\n",
731 | " cstar2 = list(cstar.values())[0]\n",
732 | "\n",
733 | " # append all optimum values\n",
734 | " mse_star_all.append(mse_star)\n",
735 | " cstar_all.append(cstar2)\n",
736 | "\n",
737 | " # all run values\n",
738 | " mse_all, ic_all = [], []\n",
739 | " for i,res in enumerate(resi):\n",
740 | " mse = list(res.values())[0]\n",
741 | " ic = list(res.values())[1]\n",
742 | " ic2 = list(ic.values())[0]\n",
743 | "\n",
744 | " # append all run values\n",
745 | " mse_all.append(mse)\n",
746 | " ic_all.append(ic2)\n",
747 | "\n",
748 | " mse_all_all.append(np.array(mse_all))\n",
749 | " ic_all_all.append(np.array(ic_all))\n",
750 | "\n",
751 | " del optimizer\n",
752 | "\n",
753 | "mse_all_all = np.array(mse_all_all)\n",
754 | "mse_star_all = np.array(mse_star_all)\n",
755 | "ic_all_all = np.array(ic_all_all)\n",
756 | "cstar_all = np.array(cstar_all)"
757 | ],
758 | "metadata": {
759 | "id": "Mp27Bsy8Cl4P",
760 | "colab": {
761 | "base_uri": "https://localhost:8080/"
762 | },
763 | "outputId": "27b03b23-b1dc-4b7b-c550-c7633601a453"
764 | },
765 | "execution_count": null,
766 | "outputs": [
767 | {
768 | "metadata": {
769 | "tags": null
770 | },
771 | "name": "stdout",
772 | "output_type": "stream",
773 | "text": [
774 | "\n",
775 | " ## ->>>> Run = 0\n",
776 | "| iter | target | ic |\n",
777 | "-------------------------------------\n",
778 | "\n",
779 | " ## ->>>> PINNs simulation at speed = 0.4372813898716186\n",
780 | "Optimizer: L-BFGS-B (maxiter=5000)\n",
781 | "5000/5000 [==============================] - 523s 105ms/step\n",
782 | "\n",
783 | " Total runtime is (min.) 8.710416158040365\n",
784 | "1/1 [==============================] - 0s 127ms/step\n",
785 | "| \u001b[0m1 \u001b[0m | \u001b[0m-0.001148\u001b[0m | \u001b[0m0.4373 \u001b[0m |\n",
786 | "\n",
787 | " ## ->>>> PINNs simulation at speed = 0.353260871860698\n",
788 | "Optimizer: L-BFGS-B (maxiter=5000)\n",
789 | "5000/5000 [==============================] - 457s 91ms/step\n",
790 | "\n",
791 | " Total runtime is (min.) 7.620774328708649\n",
792 | "1/1 [==============================] - 0s 108ms/step\n",
793 | "| \u001b[95m2 \u001b[0m | \u001b[95m-0.000404\u001b[0m | \u001b[95m0.3533 \u001b[0m |\n",
794 | "\n",
795 | " ## ->>>> PINNs simulation at speed = 0.9598970605863492\n",
796 | "Optimizer: L-BFGS-B (maxiter=5000)\n",
797 | "5000/5000 [==============================] - 1106s 221ms/step\n",
798 | "\n",
799 | " Total runtime is (min.) 18.436524299780526\n",
800 | "1/1 [==============================] - 0s 105ms/step\n",
801 | "| \u001b[0m3 \u001b[0m | \u001b[0m-0.03358 \u001b[0m | \u001b[0m0.9599 \u001b[0m |\n",
802 | "\n",
803 | " ## ->>>> PINNs simulation at speed = 0.868646025552868\n",
804 | "Optimizer: L-BFGS-B (maxiter=5000)\n",
805 | "5000/5000 [==============================] - 779s 156ms/step\n",
806 | "\n",
807 | " Total runtime is (min.) 12.977701457341512\n",
808 | "1/1 [==============================] - 0s 68ms/step\n",
809 | "| \u001b[0m4 \u001b[0m | \u001b[0m-0.02251 \u001b[0m | \u001b[0m0.8686 \u001b[0m |\n",
810 | "\n",
811 | " ## ->>>> PINNs simulation at speed = 0.15795893544754053\n",
812 | "Optimizer: L-BFGS-B (maxiter=5000)\n",
813 | "5000/5000 [==============================] - 502s 100ms/step\n"
814 | ]
815 | },
816 | {
817 | "metadata": {
818 | "tags": null
819 | },
820 | "name": "stderr",
821 | "output_type": "stream",
822 | "text": [
823 | "WARNING:tensorflow:5 out of the last 5 calls to .predict_function at 0x79d518d530a0> triggered tf.function retracing. Tracing is expensive and the excessive number of tracings could be due to (1) creating @tf.function repeatedly in a loop, (2) passing tensors with different shapes, (3) passing Python objects instead of tensors. For (1), please define your @tf.function outside of the loop. For (2), @tf.function has reduce_retracing=True option that can avoid unnecessary retracing. For (3), please refer to https://www.tensorflow.org/guide/function#controlling_retracing and https://www.tensorflow.org/api_docs/python/tf/function for more details.\n"
824 | ]
825 | },
826 | {
827 | "metadata": {
828 | "tags": null
829 | },
830 | "name": "stdout",
831 | "output_type": "stream",
832 | "text": [
833 | "\n",
834 | " Total runtime is (min.) 8.373841834068298\n",
835 | "1/1 [==============================] - 0s 109ms/step\n",
836 | "| \u001b[95m5 \u001b[0m | \u001b[95m-7.06e-05\u001b[0m | \u001b[95m0.158 \u001b[0m |\n",
837 | "\n",
838 | " ## ->>>> PINNs simulation at speed = 0.35322383568991045\n",
839 | "Optimizer: L-BFGS-B (maxiter=5000)\n",
840 | "5000/5000 [==============================] - 616s 123ms/step\n"
841 | ]
842 | },
843 | {
844 | "metadata": {
845 | "tags": null
846 | },
847 | "name": "stderr",
848 | "output_type": "stream",
849 | "text": [
850 | "WARNING:tensorflow:6 out of the last 6 calls to .predict_function at 0x79d50627e170> triggered tf.function retracing. Tracing is expensive and the excessive number of tracings could be due to (1) creating @tf.function repeatedly in a loop, (2) passing tensors with different shapes, (3) passing Python objects instead of tensors. For (1), please define your @tf.function outside of the loop. For (2), @tf.function has reduce_retracing=True option that can avoid unnecessary retracing. For (3), please refer to https://www.tensorflow.org/guide/function#controlling_retracing and https://www.tensorflow.org/api_docs/python/tf/function for more details.\n"
851 | ]
852 | },
853 | {
854 | "output_type": "stream",
855 | "name": "stdout",
856 | "text": [
857 | "\n",
858 | " Total runtime is (min.) 10.258907715479532\n",
859 | "1/1 [==============================] - 0s 107ms/step\n",
860 | "| \u001b[0m6 \u001b[0m | \u001b[0m-0.000410\u001b[0m | \u001b[0m0.3532 \u001b[0m |\n",
861 | "\n",
862 | " ## ->>>> PINNs simulation at speed = 0.6265603597846434\n",
863 | "Optimizer: L-BFGS-B (maxiter=5000)\n",
864 | "5000/5000 [==============================] - 702s 140ms/step\n",
865 | "\n",
866 | " Total runtime is (min.) 11.704780928293864\n",
867 | "1/1 [==============================] - 0s 105ms/step\n",
868 | "| \u001b[0m7 \u001b[0m | \u001b[0m-0.005768\u001b[0m | \u001b[0m0.6266 \u001b[0m |\n",
869 | "\n",
870 | " ## ->>>> PINNs simulation at speed = 0.10004206006951194\n",
871 | "Optimizer: L-BFGS-B (maxiter=5000)\n",
872 | "5000/5000 [==============================] - 364s 73ms/step\n",
873 | "\n",
874 | " Total runtime is (min.) 6.072018718719482\n",
875 | "1/1 [==============================] - 0s 112ms/step\n",
876 | "| \u001b[0m8 \u001b[0m | \u001b[0m-0.000105\u001b[0m | \u001b[0m0.1 \u001b[0m |\n",
877 | "\n",
878 | " ## ->>>> PINNs simulation at speed = 0.25506179377329546\n",
879 | "Optimizer: L-BFGS-B (maxiter=5000)\n",
880 | "5000/5000 [==============================] - 443s 89ms/step\n",
881 | "\n",
882 | " Total runtime is (min.) 7.377660123507182\n",
883 | "1/1 [==============================] - 0s 83ms/step\n",
884 | "| \u001b[0m9 \u001b[0m | \u001b[0m-9.066e-0\u001b[0m | \u001b[0m0.2551 \u001b[0m |\n",
885 | "\n",
886 | " ## ->>>> PINNs simulation at speed = 0.20751207571890762\n",
887 | "Optimizer: L-BFGS-B (maxiter=5000)\n",
888 | "5000/5000 [==============================] - 375s 75ms/step\n",
889 | "\n",
890 | " Total runtime is (min.) 6.241973801453908\n",
891 | "1/1 [==============================] - 0s 119ms/step\n",
892 | "| \u001b[0m10 \u001b[0m | \u001b[0m-7.107e-0\u001b[0m | \u001b[0m0.2075 \u001b[0m |\n",
893 | "\n",
894 | " ## ->>>> PINNs simulation at speed = 0.29827013284790804\n",
895 | "Optimizer: L-BFGS-B (maxiter=5000)\n",
896 | "5000/5000 [==============================] - 419s 84ms/step\n",
897 | "\n",
898 | " Total runtime is (min.) 6.982113985220591\n",
899 | "1/1 [==============================] - 0s 76ms/step\n",
900 | "| \u001b[0m11 \u001b[0m | \u001b[0m-0.000182\u001b[0m | \u001b[0m0.2983 \u001b[0m |\n",
901 | "\n",
902 | " ## ->>>> PINNs simulation at speed = 0.12646718809275764\n",
903 | "Optimizer: L-BFGS-B (maxiter=5000)\n",
904 | "5000/5000 [==============================] - 481s 96ms/step\n",
905 | "\n",
906 | " Total runtime is (min.) 8.016359814008077\n",
907 | "1/1 [==============================] - 0s 81ms/step\n",
908 | "| \u001b[0m12 \u001b[0m | \u001b[0m-8.387e-0\u001b[0m | \u001b[0m0.1265 \u001b[0m |\n",
909 | "\n",
910 | " ## ->>>> PINNs simulation at speed = 0.18291510701869837\n",
911 | "Optimizer: L-BFGS-B (maxiter=5000)\n",
912 | "5000/5000 [==============================] - 367s 73ms/step\n",
913 | "\n",
914 | " Total runtime is (min.) 6.108590332667033\n",
915 | "1/1 [==============================] - 0s 80ms/step\n",
916 | "| \u001b[95m13 \u001b[0m | \u001b[95m-6.506e-0\u001b[0m | \u001b[95m0.1829 \u001b[0m |\n",
917 | "\n",
918 | " ## ->>>> PINNs simulation at speed = 0.2295051729538426\n",
919 | "Optimizer: L-BFGS-B (maxiter=5000)\n",
920 | "5000/5000 [==============================] - 510s 102ms/step\n",
921 | "\n",
922 | " Total runtime is (min.) 8.495574649175008\n",
923 | "1/1 [==============================] - 0s 133ms/step\n",
924 | "| \u001b[0m14 \u001b[0m | \u001b[0m-7.231e-0\u001b[0m | \u001b[0m0.2295 \u001b[0m |\n",
925 | "\n",
926 | " ## ->>>> PINNs simulation at speed = 0.17489332261182525\n",
927 | "Optimizer: L-BFGS-B (maxiter=5000)\n",
928 | "5000/5000 [==============================] - 480s 96ms/step\n",
929 | "\n",
930 | " Total runtime is (min.) 8.002258733908336\n",
931 | "1/1 [==============================] - 0s 67ms/step\n",
932 | "| \u001b[0m15 \u001b[0m | \u001b[0m-6.664e-0\u001b[0m | \u001b[0m0.1749 \u001b[0m |\n",
933 | "\n",
934 | " ## ->>>> PINNs simulation at speed = 0.19438706454255616\n",
935 | "Optimizer: L-BFGS-B (maxiter=5000)\n",
936 | "5000/5000 [==============================] - 365s 73ms/step\n",
937 | "\n",
938 | " Total runtime is (min.) 6.076679023106893\n",
939 | "1/1 [==============================] - 0s 67ms/step\n",
940 | "| \u001b[95m16 \u001b[0m | \u001b[95m-5.969e-0\u001b[0m | \u001b[95m0.1944 \u001b[0m |\n",
941 | "\n",
942 | " ## ->>>> PINNs simulation at speed = 0.1931523178425959\n",
943 | "Optimizer: L-BFGS-B (maxiter=5000)\n",
944 | "5000/5000 [==============================] - 478s 96ms/step\n",
945 | "\n",
946 | " Total runtime is (min.) 7.9739015102386475\n",
947 | "1/1 [==============================] - 0s 71ms/step\n",
948 | "| \u001b[95m17 \u001b[0m | \u001b[95m-5.967e-0\u001b[0m | \u001b[95m0.1932 \u001b[0m |\n",
949 | "\n",
950 | " ## ->>>> PINNs simulation at speed = 0.1472501091609439\n",
951 | "Optimizer: L-BFGS-B (maxiter=5000)\n",
952 | "5000/5000 [==============================] - 498s 100ms/step\n",
953 | "\n",
954 | " Total runtime is (min.) 8.299330997467042\n",
955 | "1/1 [==============================] - 0s 67ms/step\n",
956 | "| \u001b[0m18 \u001b[0m | \u001b[0m-7.572e-0\u001b[0m | \u001b[0m0.1473 \u001b[0m |\n",
957 | "\n",
958 | " ## ->>>> PINNs simulation at speed = 0.1864475687192167\n",
959 | "Optimizer: L-BFGS-B (maxiter=5000)\n",
960 | "5000/5000 [==============================] - 395s 79ms/step\n",
961 | "\n",
962 | " Total runtime is (min.) 6.576291259129842\n",
963 | "1/1 [==============================] - 0s 106ms/step\n",
964 | "| \u001b[0m19 \u001b[0m | \u001b[0m-6.111e-0\u001b[0m | \u001b[0m0.1864 \u001b[0m |\n",
965 | "\n",
966 | " ## ->>>> PINNs simulation at speed = 0.20641322721099062\n",
967 | "Optimizer: L-BFGS-B (maxiter=5000)\n",
968 | "5000/5000 [==============================] - 415s 83ms/step\n",
969 | "\n",
970 | " Total runtime is (min.) 6.909338291486105\n",
971 | "1/1 [==============================] - 0s 70ms/step\n",
972 | "| \u001b[0m20 \u001b[0m | \u001b[0m-6.846e-0\u001b[0m | \u001b[0m0.2064 \u001b[0m |\n",
973 | "\n",
974 | " ## ->>>> PINNs simulation at speed = 0.17467333008463468\n",
975 | "Optimizer: L-BFGS-B (maxiter=5000)\n",
976 | "5000/5000 [==============================] - 407s 81ms/step\n",
977 | "\n",
978 | " Total runtime is (min.) 6.785109670956929\n",
979 | "1/1 [==============================] - 0s 98ms/step\n",
980 | "| \u001b[0m21 \u001b[0m | \u001b[0m-6.953e-0\u001b[0m | \u001b[0m0.1747 \u001b[0m |\n",
981 | "\n",
982 | " ## ->>>> PINNs simulation at speed = 0.19224016373696584\n",
983 | "Optimizer: L-BFGS-B (maxiter=5000)\n",
984 | "5000/5000 [==============================] - 506s 101ms/step\n",
985 | "\n",
986 | " Total runtime is (min.) 8.428928422927857\n",
987 | "1/1 [==============================] - 0s 69ms/step\n",
988 | "| \u001b[0m22 \u001b[0m | \u001b[0m-6.054e-0\u001b[0m | \u001b[0m0.1922 \u001b[0m |\n",
989 | "\n",
990 | " ## ->>>> PINNs simulation at speed = 0.19200099153944267\n",
991 | "Optimizer: L-BFGS-B (maxiter=5000)\n",
992 | "5000/5000 [==============================] - 437s 87ms/step\n",
993 | "\n",
994 | " Total runtime is (min.) 7.2850401679674786\n",
995 | "1/1 [==============================] - 0s 103ms/step\n",
996 | "| \u001b[0m23 \u001b[0m | \u001b[0m-6.077e-0\u001b[0m | \u001b[0m0.192 \u001b[0m |\n",
997 | "\n",
998 | " ## ->>>> PINNs simulation at speed = 0.19115332829277382\n",
999 | "Optimizer: L-BFGS-B (maxiter=5000)\n",
1000 | "5000/5000 [==============================] - 335s 67ms/step\n",
1001 | "\n",
1002 | " Total runtime is (min.) 5.587451763947805\n",
1003 | "1/1 [==============================] - 0s 68ms/step\n",
1004 | "| \u001b[0m24 \u001b[0m | \u001b[0m-6.288e-0\u001b[0m | \u001b[0m0.1912 \u001b[0m |\n",
1005 | "\n",
1006 | " ## ->>>> PINNs simulation at speed = 0.19599276179575198\n",
1007 | "Optimizer: L-BFGS-B (maxiter=5000)\n",
1008 | "5000/5000 [==============================] - 454s 91ms/step\n",
1009 | "\n",
1010 | " Total runtime is (min.) 7.566520047187805\n",
1011 | "1/1 [==============================] - 0s 101ms/step\n",
1012 | "| \u001b[0m25 \u001b[0m | \u001b[0m-6.409e-0\u001b[0m | \u001b[0m0.196 \u001b[0m |\n",
1013 | "\n",
1014 | " ## ->>>> PINNs simulation at speed = 0.1854055143664269\n",
1015 | "Optimizer: L-BFGS-B (maxiter=5000)\n",
1016 | "5000/5000 [==============================] - 456s 91ms/step\n",
1017 | "\n",
1018 | " Total runtime is (min.) 7.592611781756083\n",
1019 | "1/1 [==============================] - 0s 69ms/step\n",
1020 | "| \u001b[0m26 \u001b[0m | \u001b[0m-6.051e-0\u001b[0m | \u001b[0m0.1854 \u001b[0m |\n",
1021 | "\n",
1022 | " ## ->>>> PINNs simulation at speed = 0.186162721420857\n",
1023 | "Optimizer: L-BFGS-B (maxiter=5000)\n"
1024 | ]
1025 | }
1026 | ]
1027 | },
1028 | {
1029 | "cell_type": "markdown",
1030 | "source": [
1031 | "## Processing and plotting"
1032 | ],
1033 | "metadata": {
1034 | "id": "Bp5UWXSnE_YX"
1035 | }
1036 | },
1037 | {
1038 | "cell_type": "code",
1039 | "source": [
1040 | "#%% Process the BO results\n",
1041 | "# max, min, mean and std of the target (objective) function value across different runs\n",
1042 | "max_mse_star_allruns, min_mse_star_allruns = np.max(mse_star_all), np.min(mse_star_all)\n",
1043 | "mean_mse_star_allruns, std_mse_star_allruns = np.mean(mse_star_all), np.std(mse_star_all)\n",
1044 | "\n",
1045 | "# c* values (optima) corresponding to the above-mentioned max and min target values\n",
1046 | "idx_max_mse_star_allruns = np.where(max_mse_star_allruns == mse_star_all)\n",
1047 | "idx_min_mse_star_allruns = np.where(min_mse_star_allruns == mse_star_all)\n",
1048 | "\n",
1049 | "max_cstar_allruns = cstar_all[idx_max_mse_star_allruns]\n",
1050 | "min_cstar_allruns = cstar_all[idx_min_mse_star_allruns]\n",
1051 | "mean_cstar_allruns = np.mean(cstar_all)\n",
1052 | "std_cstar_allruns = np.std(cstar_all)\n",
1053 | "\n",
1054 | "print(\"Max (best optimal) tf across runs = \",max_mse_star_allruns)\n",
1055 | "print(\"Min (worst optimal) tf across runs = \",min_mse_star_allruns)\n",
1056 | "print(\"Mean tf across runs = \",mean_mse_star_allruns)\n",
1057 | "print(\"Std tf across runs = \",std_mse_star_allruns)\n",
1058 | "\n",
1059 | "print(\"Max (best optimal) c* across runs = \",max_cstar_allruns)\n",
1060 | "print(\"Min (worst optimal) c* across runs = \",min_cstar_allruns)\n",
1061 | "print(\"Mean c* across runs = \",mean_cstar_allruns)\n",
1062 | "print(\"Std c* across runs = \",std_cstar_allruns)"
1063 | ],
1064 | "metadata": {
1065 | "id": "m45_nEHXEcel"
1066 | },
1067 | "execution_count": null,
1068 | "outputs": []
1069 | },
1070 | {
1071 | "cell_type": "code",
1072 | "source": [
1073 | "# plot the run with the best (maximum) optimal target value and mark its optimum\n",
1074 | "idx_max_all = []\n",
1075 | "for i in range(mse_all_all.shape[0]):\n",
1076 | " idx_max = np.where(mse_all_all[i,:] == mse_star_all[i])\n",
1077 | " idx_max = idx_max[0][0]\n",
1078 | " idx_max_all.append(idx_max)\n",
1079 | "\n",
1080 | "mean_mse_all = np.mean(mse_all_all, axis=0)\n",
1081 | "std_mse_all = np.std(mse_all_all, axis=0)\n",
1082 | "mean_ic_all = np.mean(ic_all_all, axis=0)\n",
1083 | "std_ic_all = np.std(ic_all_all, axis=0)\n",
1084 | "\n",
1085 | "opt_mse_run = mse_all_all[idx_max_mse_star_allruns[0][0]]\n",
1086 | "opt_c_run = ic_all_all[idx_max_mse_star_allruns[0][0]]\n",
1087 | "opt_mse = mse_star_all[idx_max_mse_star_allruns[0][0]]\n",
1088 | "opt_c = cstar_all[idx_max_mse_star_allruns[0][0]]\n",
1089 | "\n",
1090 | "txt = 'c* = '+ str(round(opt_c,4))\n",
1091 | "plt.figure(figsize = (8, 6))\n",
1092 | "plt.plot(opt_c_run,opt_mse_run,'ob',markersize=6)\n",
1093 | "plt.plot(opt_c,opt_mse,'*r',markersize=8, label = 'Best optima')\n",
1094 | "#plt.text(0.75, -0.03, txt, fontsize=18, c = 'r')\n",
1095 | "plt.xlabel(\"velocity, c\",fontsize=20)\n",
1096 | "plt.ylabel(\"target function, g(c)\",fontsize=20)\n",
1097 | "plt.xticks(fontsize=20)\n",
1098 | "plt.yticks(fontsize=20)\n",
1099 | "plt.legend(fontsize = 14, loc='upper left')\n",
1100 | "plt.savefig('tfvsc_'+str(idx_data+1)+'.png', bbox_inches='tight', dpi=600)\n",
1101 | "plt.show()"
1102 | ],
1103 | "metadata": {
1104 | "id": "qaTRHKjgFDP3"
1105 | },
1106 | "execution_count": null,
1107 | "outputs": []
1108 | }
1109 | ],
1110 | "metadata": {
1111 | "colab": {
1112 | "provenance": [],
1113 | "gpuType": "T4"
1114 | },
1115 | "kernelspec": {
1116 | "display_name": "Python 3",
1117 | "name": "python3"
1118 | },
1119 | "accelerator": "GPU"
1120 | },
1121 | "nbformat": 4,
1122 | "nbformat_minor": 0
1123 | }
--------------------------------------------------------------------------------