├── images ├── BOPINNalgo.PNG └── BOPINN_methodolody.png ├── data ├── u_analytic_c=0.2t=0.25snr=39.36.mat ├── u_analytic_c=0.55t=0.25snr=38.91.mat └── u_analytic_c=0.85t=0.25snr=37.5.mat ├── LICENSE ├── lib ├── network.py ├── layer.py ├── pinn_wave.py └── optimizer.py ├── README.md ├── analytical.py ├── PINN.py ├── BOPINN.py └── BOPINN.ipynb /images/BOPINNalgo.PNG: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mahindrautela/BOPINN/HEAD/images/BOPINNalgo.PNG -------------------------------------------------------------------------------- /images/BOPINN_methodolody.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mahindrautela/BOPINN/HEAD/images/BOPINN_methodolody.png -------------------------------------------------------------------------------- /data/u_analytic_c=0.2t=0.25snr=39.36.mat: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mahindrautela/BOPINN/HEAD/data/u_analytic_c=0.2t=0.25snr=39.36.mat -------------------------------------------------------------------------------- /data/u_analytic_c=0.55t=0.25snr=38.91.mat: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mahindrautela/BOPINN/HEAD/data/u_analytic_c=0.55t=0.25snr=38.91.mat -------------------------------------------------------------------------------- /data/u_analytic_c=0.85t=0.25snr=37.5.mat: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mahindrautela/BOPINN/HEAD/data/u_analytic_c=0.85t=0.25snr=37.5.mat -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- 1 | MIT License 2 | 3 | Copyright (c) 2024 Mahindra Rautela 4 | 5 | Permission is hereby granted, free of charge, to any person obtaining a copy 6 | of this software and associated documentation files (the "Software"), to deal 7 | in the Software without restriction, including without limitation the rights 8 | to use, copy, modify, merge, publish, distribute, sublicense, and/or sell 9 | copies of the Software, and to permit persons to whom the Software is 10 | furnished to do so, subject to the following conditions: 11 | 12 | The above copyright notice and this permission notice shall be included in all 13 | copies or substantial portions of the Software. 14 | 15 | THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR 16 | IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, 17 | FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE 18 | AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER 19 | LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, 20 | OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE 21 | SOFTWARE. 22 | -------------------------------------------------------------------------------- /lib/network.py: -------------------------------------------------------------------------------- 1 | import tensorflow as tf 2 | 3 | class Network: 4 | """ 5 | Build a physics informed neural network (PINN) model for the wave equation. 6 | """ 7 | 8 | @classmethod 9 | def build(cls, num_inputs=2, layers=[64, 128, 128, 128, 128, 64], activation='tanh', num_outputs=1): 10 | """ 11 | Build a PINN model for the wave equation with input shape (t, x) and output shape u(t, x). 12 | 13 | Args: 14 | num_inputs: number of input variables. Default is 2 for (t, x). 15 | layers: number of hidden layers. 16 | activation: activation function in hidden layers. 17 | num_outpus: number of output variables. Default is 1 for u(t, x). 18 | 19 | Returns: 20 | keras network model. 21 | """ 22 | 23 | # input layer 24 | inputs = tf.keras.layers.Input(shape=(num_inputs,)) 25 | # hidden layers 26 | x = inputs 27 | for layer in layers: 28 | x = tf.keras.layers.Dense(layer, activation=activation, 29 | kernel_initializer='he_normal')(x) 30 | x = tf.keras.layers.Dropout(0.1)(x) 31 | # output layer 32 | outputs = tf.keras.layers.Dense(num_outputs, 33 | kernel_initializer='he_normal')(x) 34 | 35 | return tf.keras.models.Model(inputs=inputs, outputs=outputs) 36 | -------------------------------------------------------------------------------- /lib/layer.py: -------------------------------------------------------------------------------- 1 | import tensorflow as tf 2 | 3 | class GradientLayer(tf.keras.layers.Layer): 4 | """ 5 | Custom layer to compute 1st and 2nd derivatives for the wave equation. 6 | 7 | Attributes: 8 | model: keras network model. 9 | """ 10 | 11 | def __init__(self, model, **kwargs): 12 | """ 13 | Args: 14 | model: keras network model. 15 | """ 16 | 17 | self.model = model 18 | super().__init__(**kwargs) 19 | 20 | def call(self, tx): 21 | """ 22 | Computing 1st and 2nd derivatives for the wave equation. 23 | 24 | Args: 25 | tx: input variables (t, x). 26 | 27 | Returns: 28 | u: network output. 29 | du_dt: 1st derivative of t. 30 | du_dx: 1st derivative of x. 31 | d2u_dt2: 2nd derivative of t. 32 | d2u_dx2: 2nd derivative of x. 33 | """ 34 | 35 | with tf.GradientTape() as g: 36 | g.watch(tx) 37 | with tf.GradientTape() as gg: 38 | gg.watch(tx) 39 | u = self.model(tx) 40 | du_dtx = gg.batch_jacobian(u, tx) 41 | du_dt = du_dtx[..., 0] 42 | du_dx = du_dtx[..., 1] 43 | d2u_dtx2 = g.batch_jacobian(du_dtx, tx) 44 | d2u_dt2 = d2u_dtx2[..., 0, 0] 45 | d2u_dx2 = d2u_dtx2[..., 1, 1] 46 | 47 | return u, du_dt, du_dx, d2u_dt2, d2u_dx2 48 | -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- 1 | # BOPINN (Bayesian optimized physics-informed neural network) 2 | BOPINN presents new paradigm to solve inverse problems by bringing an amalgamation of PINNs and BO. It uses BO (a gradient-free and global optimization scheme) and PINNs (a fast neural surrogate solver for PDEs). In BOPINN, a PINN utilizes a neural surrogate to solve the partial differential equation (wave propagation here). Bayesian optimization runs over the PINN model and estimates the optimum parameters (wave velocity in the medium here) using a single snapshot observation of the field. BOPINN queries the black-box PINN model at different wave velocities until it converges to the true wave velocity. The proposed method is simpler (uses single neural network), robust (capturs uncertainty) and flexible (useful in real-time and online settings) as compared to it's counterparts. 3 | 4 |

5 | 6 |

7 | 8 |

9 | 10 |

11 | 12 | ## About the repository: 13 | 1. Written in tensorflow 2.10 with cuda 11.8 and cudnn 8.x 14 | 2. The code uses BO repository from [bayesian-optimization](https://github.com/bayesian-optimization/BayesianOptimization). 15 | 3. "BOPINN.py" is the python file (run in spyder) and "BOPINN.ipynb" is a notebook (use colab or jupyter) 16 | 4. "PINN.py" is a PINN based solver for forward wave propagation problem. It's an auxillary code to understand the forward problem 17 | 5. "analytical.py" gives the exact solution of the wave equation with dirichlet BC and it is used to collect data (added white noise) 18 | 6. data folder contains the snapshot observation collected from "analytical.py" 19 | 7. lib folder has .py files required to run "PINN.py" and "BOPINN.py" 20 | 21 | For more information: 22 | 1. [Link](https://doi.org/10.48550/arXiv.2312.14064) of the paper: Bayesian optimized physics-informed neural network for estimating wave propagation velocities. 23 | 2. Please cite the paper if you are using code, paper or data. 24 | ``` 25 | @article{rautela2023bayesian, 26 | title={Bayesian optimized physics-informed neural network for estimating wave propagation velocities}, 27 | author={Rautela, Mahindra and Gopalakrishnan, S and Senthilnath, J}, 28 | journal={arXiv preprint arXiv:2312.14064}, 29 | year={2023} 30 | } 31 | ``` 32 | 33 | -------------------------------------------------------------------------------- /lib/pinn_wave.py: -------------------------------------------------------------------------------- 1 | import tensorflow as tf 2 | from .layer import GradientLayer 3 | 4 | class PINN: 5 | """ 6 | Build a physics informed neural network (PINN) model for the wave equation. 7 | 8 | Attributes: 9 | network: keras network model with input (t, x) and output u(t, x). 10 | c: wave velocity. 11 | grads: gradient layer. 12 | """ 13 | 14 | def __init__(self, network, c): 15 | """ 16 | Args: 17 | network: keras network model with input (t, x) and output u(t, x). 18 | c: wave velocity. Default is 1. 19 | """ 20 | 21 | self.network = network 22 | self.c = c 23 | self.grads = GradientLayer(self.network) 24 | 25 | def build(self): 26 | """ 27 | Build a PINN model for the wave equation. 28 | 29 | Returns: 30 | PINN model for the projectile motion with 31 | input: [ (t, x) relative to equation, 32 | (t=0, x) relative to initial condition, 33 | (t, x=bounds) relative to boundary condition ], 34 | output: [ u(t,x) relative to equation, 35 | u(t=0, x) relative to initial condition, 36 | du_dt(t=0, x) relative to initial derivative of t, 37 | u(t, x=bounds) relative to boundary condition ] 38 | """ 39 | 40 | # equation input: (t, x) 41 | tx_eqn = tf.keras.layers.Input(shape=(2,)) 42 | # initial condition input: (t=0, x) 43 | tx_ini = tf.keras.layers.Input(shape=(2,)) 44 | # boundary condition input: (t, x=-1) or (t, x=+1) 45 | tx_bnd = tf.keras.layers.Input(shape=(2,)) 46 | 47 | # compute gradients 48 | _, _, _, d2u_dt2, d2u_dx2 = self.grads(tx_eqn) 49 | 50 | # equation output being zero 51 | u_eqn = d2u_dt2 - self.c*self.c * d2u_dx2 52 | # initial condition output 53 | u_ini, du_dt_ini, _, _, _ = self.grads(tx_ini) 54 | # boundary condition output 55 | u_bnd = self.network(tx_bnd) # dirichlet 56 | #_, _, u_bnd, _, _ = self.grads(tx_bnd) # neumann 57 | 58 | # build the PINN model for the wave equation 59 | return tf.keras.models.Model( 60 | inputs=[tx_eqn, tx_ini, tx_bnd], 61 | outputs=[u_eqn, u_ini, du_dt_ini, u_bnd]) 62 | 63 | -------------------------------------------------------------------------------- /analytical.py: -------------------------------------------------------------------------------- 1 | import numpy as np 2 | import math 3 | import matplotlib.pyplot as plt 4 | from matplotlib.colors import Normalize 5 | from matplotlib.gridspec import GridSpec 6 | import os 7 | 8 | # Other variables 9 | L = 10 10 | n = L 11 | T = 1 12 | 13 | # speed 14 | C = [0.20, 0.55, 0.85] 15 | c = C[0] 16 | 17 | # snapshot time 18 | tfrac = np.array([0.25, 0.50, 0.75]) 19 | tilde_t = tfrac*T 20 | 21 | # number of scan points 22 | num_points = 5000 23 | 24 | # RMS function 25 | def RMS(S): 26 | rms = np.sqrt(np.mean(S**2)) 27 | return rms 28 | 29 | def u_analytic(t,x,c,L,n): 30 | # x and t in mesh form 31 | usol = -np.sin(math.pi*x)*np.cos(n*math.pi*c*t/L) 32 | return usol 33 | 34 | # Full analytical solution of the domain [0,L] and [0,T] 35 | t = np.linspace(0,T,num_points) 36 | x = np.linspace(0,L,num_points) 37 | x_mesh, t_mesh = np.meshgrid(x, t) 38 | usol_full = u_analytic(t_mesh, x_mesh, c, L, n) 39 | 40 | # index of snapshot time in the array 41 | idx = [int(p) for p in num_points*tfrac] 42 | 43 | # plot u(t,x) distribution as a color-map 44 | fig = plt.figure(figsize=(7,4)) 45 | gs = GridSpec(2, 3) # A grid layout to place subplots within a figure. 46 | plt.subplot(gs[0, :]) 47 | vmin, vmax = -1.0, +1.0 48 | plt.pcolormesh(t_mesh, x_mesh, usol_full, cmap='rainbow', shading = 'auto', norm=Normalize(vmin=vmin, vmax=vmax)) 49 | plt.xlabel('t') 50 | plt.ylabel('x') 51 | cbar = plt.colorbar(pad=0.05, aspect=10) 52 | cbar.set_label('u(t,x)') 53 | cbar.mappable.set_clim(vmin, vmax) 54 | 55 | # plot u(t=const, x) cross-sections 56 | for i, t_cs in enumerate(tilde_t): 57 | plt.subplot(gs[1, i]) 58 | plt.plot(x, usol_full[idx[i],:], 'b', linewidth = 2) 59 | plt.title('t={}'.format(t_cs)) 60 | plt.xlabel('x') 61 | plt.ylabel('u(t,x)') 62 | plt.ylim(-1,1) 63 | plt.tight_layout() 64 | plt.show() 65 | 66 | #%% usol at particular snapshot time 67 | from scipy.io import savemat 68 | 69 | # data storing 70 | path = "C:\MSR\data\PINNBO\data" 71 | 72 | # amplitude of noise 73 | beta_range = [0.0075] #[0.0075, 0.01, 0.025, 0.05] 74 | 75 | # these parameters need to be set 76 | usol_app = [] 77 | usol_n_app = [] 78 | for ii in range(len(C)): 79 | for jj in range(len(tilde_t)): 80 | for kk in range(len(beta_range)): 81 | c = C[ii] 82 | t_obs = tilde_t[jj] 83 | beta = beta_range[kk] 84 | 85 | # without noise 86 | tt = np.full(t.shape, t_obs) 87 | xx = np.linspace(0,L,num_points) 88 | xx_mesh, tt_mesh = np.meshgrid(xx, tt) 89 | usol = u_analytic(tt_mesh, xx_mesh, c, L, n) 90 | usol = usol[0,:] # all rows (time) are same 91 | usol_app.append(usol) 92 | 93 | # Add white noise to the data 94 | mu = 0 95 | sigma = 1 96 | noise = beta*(sigma*np.random.randn(num_points,1) + mu) 97 | 98 | # noisy data 99 | usol_n = usol[:,np.newaxis] + noise 100 | usol_n_app.append(usol_n) 101 | 102 | # signal to noise ratio 103 | snr = 20*np.log10(RMS(usol)/RMS(noise)) 104 | snr_percent = RMS(noise)/RMS(usol)*100 105 | 106 | f1 = "c="+str(c) 107 | f2 = "t="+str(t_obs) 108 | f3 = "snr="+str(np.round(snr,2)) 109 | 110 | plt.figure(figsize=(22,4)) 111 | fig, (ax1, ax2) = plt.subplots(1, 2,figsize=(10,4)) 112 | ax1.plot(xx,usol) 113 | ax1.set_title('Without noise', fontsize = 15) 114 | ax1.set(xlabel='x', ylabel='Normalized u(x,t)') 115 | ax1.set_ylim(-1.2,1.2) 116 | 117 | ax2.plot(xx,usol_n) 118 | ax2.set_title(f1+f2+f3, fontsize = 15) 119 | ax2.set(xlabel='x') 120 | ax2.set_ylim(-1.2,1.2) 121 | 122 | plt.show() 123 | 124 | # save data 125 | filename = "u_analytic_"+f1+f2+f3 126 | filepath = os.path.join(path, filename) 127 | mdic = {"a1": usol_n, "label": "experiment"} 128 | savemat(filepath+".mat", mdic) 129 | 130 | #%% analysis of experimental data 131 | usol_app = np.array(usol_app) 132 | usol_n_app = np.array(usol_n_app) 133 | color = ['k','tab:blue','tab:orange', 134 | 'tab:green','tab:red','tab:purple', 135 | 'tab:brown','tab:pink','tab:gray','tab:cyan'] 136 | 137 | plt.figure(figsize=(10,4)) 138 | for i in range(usol_app.shape[0]): 139 | plt.plot(xx,usol_app[i,:],color[i]) 140 | plt.legend(['1','2','3','4','5','6','7','8','9']) 141 | #plt.savefig('analytical_9_withoutnoise', dpi = 300) 142 | 143 | plt.figure(figsize=(10,4)) 144 | for i in range(usol_app.shape[0]): 145 | plt.plot(xx,usol_n_app[i,:],color[i]) 146 | plt.legend(['1','2','3','4','5','6','7','8','9']) 147 | #plt.savefig('analytical_9_withnoise', dpi = 300) 148 | -------------------------------------------------------------------------------- /PINN.py: -------------------------------------------------------------------------------- 1 | #import lib.tf_silent 2 | import numpy as np 3 | import tensorflow as tf 4 | import matplotlib.pyplot as plt 5 | from matplotlib.colors import Normalize 6 | from matplotlib.gridspec import GridSpec 7 | from lib.pinn_wave import PINN 8 | from lib.network import Network 9 | from lib.optimizer import L_BFGS_B 10 | import math 11 | import time 12 | 13 | # number of training samples 14 | num_train_samples = 25000 15 | 16 | # number of test samples 17 | num_test_samples = 5000 18 | 19 | c = 0.2 #scaled speed 20 | L = 10 21 | n = L 22 | T = 1 23 | 24 | # Initial conditions 25 | def u0(t): 26 | z = -np.sin(1*math.pi*t) 27 | return z 28 | 29 | def du0_dt(tx): 30 | with tf.GradientTape() as g: 31 | g.watch(tx) 32 | u = u0(tx) 33 | du_dt = g.batch_jacobian(u, tx)[..., 0] 34 | return du_dt 35 | 36 | # Analytical solution 37 | xx = np.linspace(0,L,num_test_samples) 38 | tt = np.linspace(0,T,num_test_samples) 39 | usol = np.zeros((num_test_samples,num_test_samples)) 40 | for i,xi in enumerate(xx): 41 | for j,tj in enumerate(tt): 42 | usol[i,j] = -np.sin(math.pi*xi)*np.cos(n*math.pi*c*tj/L) 43 | 44 | 45 | ######################################################################## 46 | ######################## collocation points ############################ 47 | ######################################################################## 48 | 49 | # create training input 50 | tx_eqn = np.random.rand(num_train_samples, 2) 51 | tx_eqn[..., 0] = T*tx_eqn[..., 0] # t = 0 ~ +1 52 | tx_eqn[..., 1] = L*tx_eqn[..., 1] # x = 0 ~ +10 53 | #print('\nShape of t_eqn ==>',tx_eqn.shape) 54 | 55 | tx_ini = np.random.rand(num_train_samples, 2) 56 | tx_ini[..., 0] = 0 # t = 0 57 | tx_ini[..., 1] = L*tx_ini[..., 1] # x = 0 ~ +10 58 | #print('\nShape of tx_ini ==>',tx_ini.shape) 59 | 60 | tx_bnd = np.random.rand(num_train_samples, 2) 61 | tx_bnd[..., 0] = T*tx_bnd[..., 0] # t = 0 ~ +1 62 | tx_bnd[..., 1] = L*np.round(tx_bnd[..., 1]) # x = 0 or +10 63 | #print('\nShape of tx_bnd ==>',tx_bnd.shape) 64 | 65 | u_zero = np.zeros((num_train_samples, 1)) 66 | u_ini = u0(tx_ini[:,1,None]) 67 | du_dt_ini = np.zeros((num_train_samples, 1)) 68 | 69 | ######################################################################### 70 | ########################### TRAINING PINNs ############################## 71 | ######################################################################### 72 | 73 | # build a core network model 74 | network = Network.build() 75 | #network.summary() 76 | 77 | # build a PINN model 78 | pinn = PINN(network,c).build() 79 | 80 | # train the model using L-BFGS-B algorithm 81 | begin = time.time() 82 | x_train = [tx_eqn, tx_ini, tx_bnd] 83 | y_train = [u_zero, u_ini, du_dt_ini, u_zero] 84 | lbfgs = L_BFGS_B(model=pinn, x_train=x_train, y_train=y_train) 85 | lbfgs.fit() 86 | end = time.time() 87 | totaltime = end-begin 88 | print("\n Total runtime of the program is (min.)",totaltime/60) 89 | 90 | ######################################################################### 91 | ######################## PREDICTION ##################################### 92 | ######################################################################### 93 | 94 | # predict u(t,x) distribution 95 | t_flat = np.linspace(0, T, num_test_samples) 96 | x_flat = np.linspace(0, L, num_test_samples) 97 | t, x = np.meshgrid(t_flat, x_flat) 98 | tx = np.stack([t.flatten(), x.flatten()], axis=-1) 99 | u = network.predict(tx, batch_size=num_test_samples) 100 | u = u.reshape(t.shape) 101 | 102 | # plot u(t,x) distribution as a color-map 103 | fig = plt.figure(figsize=(12,8)) 104 | gs = GridSpec(2, 3) # A grid layout to place subplots within a figure. 105 | plt.subplot(gs[0, :]) 106 | vmin, vmax = -1.0, +1.0 107 | plt.pcolormesh(t, x, u, cmap='rainbow', shading = 'auto', norm=Normalize(vmin=vmin, vmax=vmax)) 108 | plt.xlabel('t',fontsize=20) 109 | plt.ylabel('x',fontsize=20) 110 | plt.xticks(fontsize=20) 111 | plt.yticks(fontsize=20) 112 | cbar = plt.colorbar(pad=0.05, aspect=10) 113 | cbar.set_label('u(t,x)', fontsize=20) 114 | cbar.ax.tick_params(labelsize=20) 115 | cbar.mappable.set_clim(vmin, vmax) 116 | 117 | # plot u(t=const, x) cross-sections 118 | tfrac = np.array([0.25,0.5,0.75]) 119 | t_cross_sections = (T*tfrac).tolist() 120 | idx = [int(x) for x in (num_test_samples*tfrac)] 121 | 122 | for i, t_cs in enumerate(t_cross_sections): 123 | plt.subplot(gs[1, i]) 124 | full = np.full(t_flat.shape, t_cs) 125 | tx = np.stack([np.full(t_flat.shape, t_cs), x_flat], axis=-1) 126 | u = network.predict(tx, batch_size=num_test_samples) 127 | #print(u.shape) 128 | plt.plot(x_flat, u, '.b') 129 | plt.plot(x_flat, usol[:,idx[i]], 'r--', linewidth = 2) 130 | plt.title('t = {}'.format(t_cs),fontsize=20) 131 | plt.xlabel('x',fontsize=20) 132 | plt.ylabel('u(t,x)',fontsize=20) 133 | plt.xticks(fontsize=20) 134 | plt.yticks(fontsize=20) 135 | plt.ylim(-1,1) 136 | plt.legend(['Prediction','Exact'], loc = 'upper right',fontsize=8) 137 | plt.tight_layout() 138 | plt.savefig('PINNs_at_'+str(c)+'.png', transparent=True, dpi = 900) 139 | plt.show() 140 | 141 | -------------------------------------------------------------------------------- /lib/optimizer.py: -------------------------------------------------------------------------------- 1 | import scipy.optimize 2 | import numpy as np 3 | import tensorflow as tf 4 | 5 | class L_BFGS_B: 6 | """ 7 | Optimize the keras network model using L-BFGS-B algorithm. 8 | 9 | Attributes: 10 | model: optimization target model. 11 | samples: training samples. 12 | factr: convergence condition. typical values for factr are: 1e12 for low accuracy; 13 | 1e7 for moderate accuracy; 10 for extremely high accuracy. 14 | m: maximum number of variable metric corrections used to define the limited memory matrix. 15 | maxls: maximum number of line search steps (per iteration). 16 | maxiter: maximum number of iterations. 17 | metris: logging metrics. 18 | progbar: progress bar. 19 | """ 20 | 21 | def __init__(self, model, x_train, y_train, m=10, factr=1e7, pgtol=1e-5, 22 | epsilon=1e-8, maxiter=5000, maxls=50): 23 | """ 24 | Args: 25 | model: optimization target model. 26 | samples: training samples. 27 | factr: convergence condition. typical values for factr are: 1e12 for low accuracy; 28 | 1e7 for moderate accuracy; 10.0 for extremely high accuracy. 29 | m: maximum number of variable metric corrections used to define the limited memory matrix. 30 | maxls: maximum number of line search steps (per iteration). 31 | maxiter: maximum number of iterations. 32 | """ 33 | 34 | # set attributes 35 | self.model = model 36 | self.x_train = [ tf.constant(x, dtype=tf.float32) for x in x_train ] 37 | self.y_train = [ tf.constant(y, dtype=tf.float32) for y in y_train ] 38 | self.factr = factr 39 | self.m = m 40 | self.pgtol = pgtol 41 | self.epsilon = epsilon 42 | self.maxls = maxls 43 | self.maxiter = maxiter 44 | self.metrics = ['loss'] 45 | # initialize the progress bar 46 | self.progbar = tf.keras.callbacks.ProgbarLogger( 47 | count_mode='steps', stateful_metrics=self.metrics) 48 | self.progbar.set_params( { 49 | 'verbose':1, 'epochs':1, 'steps':self.maxiter, 'metrics':self.metrics}) 50 | 51 | def set_weights(self, flat_weights): 52 | """ 53 | Set weights to the model. 54 | 55 | Args: 56 | flat_weights: flatten weights. 57 | """ 58 | 59 | # get model weights 60 | shapes = [ w.shape for w in self.model.get_weights() ] 61 | # compute splitting indices 62 | split_ids = np.cumsum([ np.prod(shape) for shape in [0] + shapes ]) 63 | # reshape weights 64 | weights = [ flat_weights[from_id:to_id].reshape(shape) 65 | for from_id, to_id, shape in zip(split_ids[:-1], split_ids[1:], shapes) ] 66 | # set weights to the model 67 | self.model.set_weights(weights) 68 | 69 | @tf.function 70 | def tf_evaluate(self, x, y): 71 | """ 72 | Evaluate loss and gradients for weights as tf.Tensor. 73 | 74 | Args: 75 | x: input data. 76 | 77 | Returns: 78 | loss and gradients for weights as tf.Tensor. 79 | """ 80 | 81 | with tf.GradientTape() as g: 82 | loss = tf.reduce_mean(tf.keras.losses.mse(self.model(x), y)) 83 | grads = g.gradient(loss, self.model.trainable_variables) 84 | return loss, grads 85 | 86 | def evaluate(self, weights): 87 | """ 88 | Evaluate loss and gradients for weights as ndarray. 89 | 90 | Args: 91 | weights: flatten weights. 92 | 93 | Returns: 94 | loss and gradients for weights as ndarray. 95 | """ 96 | 97 | # update weights 98 | self.set_weights(weights) 99 | # compute loss and gradients for weights 100 | loss, grads = self.tf_evaluate(self.x_train, self.y_train) 101 | # convert tf.Tensor to flatten ndarray 102 | loss = loss.numpy().astype('float64') 103 | grads = np.concatenate([ g.numpy().flatten() for g in grads ]).astype('float64') 104 | 105 | return loss, grads 106 | 107 | def callback(self, weights): 108 | """ 109 | Callback that prints the progress to stdout. 110 | 111 | Args: 112 | weights: flatten weights. 113 | """ 114 | self.progbar.on_batch_begin(0) 115 | loss, _ = self.evaluate(weights) 116 | self.progbar.on_batch_end(0, logs=dict(zip(self.metrics, [loss]))) 117 | 118 | def fit(self): 119 | """ 120 | Train the model using L-BFGS-B algorithm. 121 | """ 122 | 123 | # get initial weights as a flat vector 124 | initial_weights = np.concatenate( 125 | [ w.flatten() for w in self.model.get_weights() ]) 126 | # optimize the weight vector 127 | print('Optimizer: L-BFGS-B (maxiter={})'.format(self.maxiter)) 128 | self.progbar.on_train_begin() 129 | self.progbar.on_epoch_begin(1) 130 | 131 | scipy.optimize.fmin_l_bfgs_b(func=self.evaluate, 132 | x0=initial_weights, 133 | factr=self.factr, 134 | pgtol=self.pgtol, 135 | epsilon=self.epsilon, 136 | m=self.m, 137 | maxls=self.maxls, 138 | maxiter=self.maxiter, 139 | callback=self.callback) 140 | 141 | 142 | # scipy.optimize.least_squares(func = self.evaluate, x0 = initial_weights) 143 | 144 | # scipy.optimize.minimize(fun = self.evaluate, 145 | # x0 = initial_weights, 146 | # method='L-BFGS-B', 147 | # jac= True, # If jac is True, fun is assumed to return the gradient along with the objective function 148 | # callback = self.callback, 149 | # options = {'disp': None, 150 | # 'maxcor': 200, 151 | # 'ftol': 1 * np.finfo(float).eps, #The iteration stops when (f^k - f^{k+1})/max{|f^k|,|f^{k+1}|,1} <= ftol 152 | # 'gtol': 5e-5, 153 | # 'maxfun': 50000, 154 | # 'maxiter': 1, 155 | # 'iprint': 50, #print update every 50 iterations 156 | # 'maxls': 50}) 157 | 158 | # scipy.optimize.minimize(fun=self.evaluate, 159 | # x0=initial_weights, 160 | # jac=True, 161 | # method='BFGS', 162 | # callback=self.callback, 163 | # options={'maxiter': 15000, 164 | # 'maxls': 20}) 165 | 166 | # scipy.optimize.minimize(fun = self.evaluate, 167 | # x0 = initial_weights, 168 | # args=(), 169 | # method='L-BFGS-B', 170 | # jac= True, 171 | # callback = self.callback, 172 | # options = {'disp': None, 173 | # 'maxcor': 200, 174 | # 'ftol': 1 * np.finfo(float).eps, #The iteration stops when (f^k - f^{k+1})/max{|f^k|,|f^{k+1}|,1} <= ftol 175 | # 'gtol': 5e-5, 176 | # 'maxfun': 50000, 177 | # 'maxiter': 1, 178 | # 'iprint': 50, #print update every 50 iterations 179 | # 'maxls': 50}) 180 | 181 | self.progbar.on_epoch_end(1) 182 | self.progbar.on_train_end() 183 | -------------------------------------------------------------------------------- /BOPINN.py: -------------------------------------------------------------------------------- 1 | import numpy as np 2 | import tensorflow as tf 3 | import matplotlib.pyplot as plt 4 | from lib.pinn_wave import PINN 5 | from lib.network import Network 6 | from lib.optimizer import L_BFGS_B 7 | import math 8 | from bayes_opt import BayesianOptimization, UtilityFunction 9 | import scipy.io 10 | import os 11 | from os.path import join 12 | import time 13 | 14 | # number of training samples 15 | num_train_samples = 25000 16 | 17 | # number of test samples 18 | num_test_samples = 5000 19 | 20 | # Other variables 21 | L = 10 22 | n = L 23 | T = 1 24 | 25 | # define x,t for PINNs prediction 26 | x_test = np.linspace(0,L,num_test_samples) 27 | t_test = np.linspace(0,T,num_test_samples) 28 | 29 | # upload the snapshot observation 30 | path = "E:\MSR\data\BOPINN\data" 31 | dir_list = os.listdir(path) 32 | print("Files in directory",dir_list) 33 | 34 | idx_data = 3 # 0,3,6 35 | data = dir_list[idx_data] 36 | print("Imported file", data) 37 | 38 | file = join(path, data) 39 | u_analy = scipy.io.loadmat(file) 40 | u_analy = u_analy['a1'] 41 | 42 | # plot the snapshot observation 43 | fig = plt.figure(figsize=(7,4)) 44 | plt.plot(x_test,u_analy, '-', linewidth = 2) 45 | plt.xlabel('$x$', fontsize = 15) 46 | plt.ylabel('Normalized u(x,t)', fontsize = 15) 47 | plt.xticks(fontsize = 12) 48 | plt.yticks(fontsize = 12) 49 | 50 | # time of observation 51 | tilde_t = 0.25 52 | 53 | #%% Initial conditions 54 | def u0(t): 55 | z = -np.sin(1*math.pi*t) 56 | return z 57 | 58 | def du0_dt(tx): 59 | with tf.GradientTape() as g: 60 | g.watch(tx) 61 | u = u0(tx) 62 | du_dt = g.batch_jacobian(u, tx)[..., 0] 63 | return du_dt 64 | 65 | def RMS(S): 66 | rms = np.sqrt(np.mean(S**2)) 67 | return rms 68 | 69 | #%% collocation points 70 | # create training input 71 | tx_eqn = np.random.rand(num_train_samples, 2) 72 | tx_eqn[..., 0] = T*tx_eqn[..., 0] # t = 0 ~ +1 73 | tx_eqn[..., 1] = L*tx_eqn[..., 1] # x = 0 ~ +10 74 | #print('\nShape of t_eqn ==>',tx_eqn.shape) 75 | 76 | tx_ini = np.random.rand(num_train_samples, 2) 77 | tx_ini[..., 0] = 0 # t = 0 78 | tx_ini[..., 1] = L*tx_ini[..., 1] # x = 0 ~ +10 79 | #print('\nShape of tx_ini ==>',tx_ini.shape) 80 | 81 | tx_bnd = np.random.rand(num_train_samples, 2) 82 | tx_bnd[..., 0] = T*tx_bnd[..., 0] # t = 0 ~ +1 83 | tx_bnd[..., 1] = L*np.round(tx_bnd[..., 1]) # x = 0 or +10 84 | #print('\nShape of tx_bnd ==>',tx_bnd.shape) 85 | 86 | # initial and boundary conditions 87 | u_zero = np.zeros((num_train_samples, 1)) 88 | u_ini = u0(tx_ini[:,1,None]) 89 | du_dt_ini = np.zeros((num_train_samples, 1)) 90 | 91 | #%% g(c) = (u_pred - u_true)^2; u_pred via PINNs 92 | 93 | def model_builder(ic): 94 | #ic = hp.Float('ic', min_value=0.1, max_value=1, step=10) 95 | print('\n ## ->>>> PINNs simulation at speed = ' + str(ic)) 96 | 97 | # build a PINN model 98 | network = Network.build() 99 | pinn = PINN(network,ic).build() 100 | 101 | # train the model using L-BFGS-B algorithm 102 | begin = time.time() 103 | x_train = [tx_eqn, tx_ini, tx_bnd] 104 | y_train = [u_zero, u_ini, du_dt_ini, u_zero] 105 | lbfgs = L_BFGS_B(model=pinn, x_train=x_train, y_train=y_train) 106 | lbfgs.fit() 107 | end = time.time() 108 | totaltime = end-begin 109 | print("\n Total runtime is (min.)",totaltime/60) 110 | 111 | # test the model 112 | tx = np.stack([np.full(t_test.shape, tilde_t), x_test], axis=-1) 113 | u_pred = network.predict(tx, batch_size=num_test_samples) 114 | 115 | # mse between u_pred via PINN and snapshot observation 116 | mse = -np.mean(np.square(u_analy - u_pred)) 117 | 118 | del network, pinn, lbfgs, u_pred 119 | 120 | return mse 121 | 122 | #%% Bayesian Optimization 123 | # Attributes of BO 124 | itt_explore = 5 125 | itt = 45 126 | itt_all = itt_explore + itt 127 | n_runs = 10 128 | 129 | # bounds of BO 130 | pbounds = {'ic': (0.1, 1)} 131 | 132 | # Start BO 133 | mse_star_all = [] 134 | cstar_all = [] 135 | mse_all_all = [] 136 | ic_all_all = [] 137 | 138 | for r in range(n_runs): 139 | print('\n ## ->>>> Run = ' + str(r)) 140 | 141 | # define the model 142 | optimizer = BayesianOptimization( 143 | f=model_builder, 144 | pbounds=pbounds, 145 | allow_duplicate_points=True) 146 | 147 | # utility function 148 | util = UtilityFunction(kind='ucb', 149 | kappa=2.576, 150 | kappa_decay=1, 151 | kappa_decay_delay=0) 152 | 153 | # run the model 154 | optimizer.maximize(init_points=itt_explore, 155 | n_iter=itt, 156 | acquisition_function=util) 157 | 158 | soln = optimizer.max 159 | resi = optimizer.res 160 | 161 | # optimum values 162 | mse_star = list(soln.values())[0] 163 | cstar = list(soln.values())[1] 164 | cstar2 = list(cstar.values())[0] 165 | 166 | # append all optimum values 167 | mse_star_all.append(mse_star) 168 | cstar_all.append(cstar2) 169 | 170 | # all run values 171 | mse_all = [] 172 | ic_all = [] 173 | for i,res in enumerate(resi): 174 | mse = list(res.values())[0] 175 | ic = list(res.values())[1] 176 | ic2 = list(ic.values())[0] 177 | 178 | # append all run values 179 | mse_all.append(mse) 180 | ic_all.append(ic2) 181 | 182 | mse_all_all.append(np.array(mse_all)) 183 | ic_all_all.append(np.array(ic_all)) 184 | 185 | del optimizer 186 | 187 | mse_all_all = np.array(mse_all_all) 188 | mse_star_all = np.array(mse_star_all) 189 | ic_all_all = np.array(ic_all_all) 190 | cstar_all = np.array(cstar_all) 191 | 192 | #%% Process the BO results 193 | # max, min, mean and sd target function/objective function value across different runs 194 | max_mse_star_allruns, min_mse_star_allruns = np.max(mse_star_all), np.min(mse_star_all) 195 | mean_mse_star_allruns, std_mse_star_allruns = np.mean(mse_star_all), np.std(mse_star_all) 196 | 197 | # optima corresponding to abovementioned optimal points 198 | idx_max_mse_star_allruns = np.where(max_mse_star_allruns == mse_star_all) 199 | idx_min_mse_star_allruns = np.where(min_mse_star_allruns == mse_star_all) 200 | 201 | max_cstar_allruns = cstar_all[idx_max_mse_star_allruns] 202 | min_cstar_allruns = cstar_all[idx_min_mse_star_allruns] 203 | mean_cstar_allruns = np.mean(cstar_all) 204 | std_cstar_allruns = np.std(cstar_all) 205 | 206 | print("Max (best optimal) tf across runs = ",max_mse_star_allruns) 207 | print("Min (least optimal) tf across runs = ",min_mse_star_allruns) 208 | print("Mean tf across runs = ",mean_mse_star_allruns) 209 | print("Std tf across runs = ",std_mse_star_allruns) 210 | 211 | print("Max (best optimal) c* across runs = ",max_cstar_allruns) 212 | print("Min (least optimal) c* across runs = ",min_cstar_allruns) 213 | print("Mean c* across runs = ",mean_cstar_allruns) 214 | print("Std c* across runs = ",std_cstar_allruns) 215 | 216 | #%% plot the BO results 217 | # plot best optimal run with the optima 218 | idx_max_all = [] 219 | for i in range(mse_all_all.shape[0]): 220 | idx_max = np.where(mse_all_all[i,:] == mse_star_all[i]) 221 | idx_max = idx_max[0][0] 222 | idx_max_all.append(idx_max) 223 | 224 | mean_mse_all = np.mean(mse_all_all, axis=0) 225 | std_mse_all = np.std(mse_all_all, axis=0) 226 | mean_ic_all = np.mean(ic_all_all, axis=0) 227 | std_ic_all = np.std(ic_all_all, axis=0) 228 | 229 | opt_mse_run = mse_all_all[idx_max_mse_star_allruns[0][0]] 230 | opt_c_run = ic_all_all[idx_max_mse_star_allruns[0][0]] 231 | opt_mse = mse_star_all[idx_max_mse_star_allruns[0][0]] 232 | opt_c = cstar_all[idx_max_mse_star_allruns[0][0]] 233 | 234 | # tf vs c 235 | txt = 'c* = '+ str(round(opt_c,4)) 236 | plt.figure(figsize = (8, 6)) 237 | plt.plot(opt_c_run,opt_mse_run,'ob',markersize=6) 238 | plt.plot(opt_c,opt_mse,'*r',markersize=8, label = 'Best optima') 239 | #plt.text(0.75, -0.03, txt, fontsize=18, c = 'r') 240 | plt.xlabel("velocity, c",fontsize=20) 241 | plt.ylabel("target function, g(c)",fontsize=20) 242 | plt.xticks(fontsize=20) 243 | plt.yticks(fontsize=20) 244 | plt.legend(fontsize = 14, loc='upper left') 245 | plt.savefig('tfvsc_'+str(idx_data+1)+'.png', bbox_inches='tight', dpi=600) 246 | plt.show() -------------------------------------------------------------------------------- /BOPINN.ipynb: -------------------------------------------------------------------------------- 1 | { 2 | "cells": [ 3 | { 4 | "cell_type": "markdown", 5 | "source": [ 6 | "## Colab computing infra available\n", 7 | "### Preliminaries\n", 8 | "#### 1. Runtime -> Change runtime type -> T4 GPU\n", 9 | "#### 2. Upload data folder from github repository on your google drive\n", 10 | "#### 3. Except first three cells, this notebook can be run on jupyter.\n", 11 | "#### 4. For 3., pip install bayesian-optimization is performed in anaconda tensorflow environment." 12 | ], 13 | "metadata": { 14 | "id": "XW60sZt3HGKv" 15 | } 16 | }, 17 | { 18 | "cell_type": "code", 19 | "source": [ 20 | "#GPU count and name\n", 21 | "!nvidia-smi -L\n", 22 | "!lscpu |grep 'Model name'\n", 23 | "#no.of sockets i.e available slots for physical processors\n", 24 | "!lscpu | grep 'Socket(s):'\n", 25 | "#no.of cores each processor is having\n", 26 | "!lscpu | grep 'Core(s) per socket:'\n", 27 | "#no.of threads each core is having\n", 28 | "!lscpu | grep 'Thread(s) per core'\n", 29 | "!lscpu | grep \"L3 cache\"\n", 30 | "#if it had turbo boost it would've shown Min and Max MHz also but it is only showing current frequency this means it always operates at 2.3GHz\n", 31 | "!lscpu | grep \"MHz\"\n", 32 | "#memory that we can use\n", 33 | "!cat /proc/meminfo | grep 'MemAvailable'\n", 34 | "#hard disk that we can use\n", 35 | "!df -h / | awk '{print $4}'" 36 | ], 37 | "metadata": { 38 | "id": "8iHIF9ANB7W-", 39 | "colab": { 40 | "base_uri": "https://localhost:8080/" 41 | }, 42 | "outputId": "677a2eac-9246-478b-f44c-cbeef270bda4" 43 | }, 44 | "execution_count": null, 45 | "outputs": [ 46 | { 47 | "output_type": "stream", 48 | "name": "stdout", 49 | "text": [ 50 | "GPU 0: Tesla T4 (UUID: GPU-2429e038-2c60-04b9-d3a5-5573f49827da)\n", 51 | "Model name: Intel(R) Xeon(R) CPU @ 2.30GHz\n", 52 | "Socket(s): 1\n", 53 | "Core(s) per socket: 1\n", 54 | "Thread(s) per core: 2\n", 55 | "L3 cache: 45 MiB (1 instance)\n", 56 | "MemAvailable: 12416136 kB\n", 57 | "Avail\n", 58 | "52G\n" 59 | ] 60 | } 61 | ] 62 | }, 63 | { 64 | "cell_type": "code", 65 | "source": [ 66 | "# mount google drive\n", 67 | "from google.colab import drive\n", 68 | "drive.mount('/content/gdrive')\n", 69 | "path = 'gdrive/MyDrive/BOPINN/data'" 70 | ], 71 | "metadata": { 72 | "id": "q_ae9KDsC2Q1", 73 | "colab": { 74 | "base_uri": "https://localhost:8080/" 75 | }, 76 | "outputId": "6d816703-0158-473b-a2c5-95e4b09b1c99" 77 | }, 78 | "execution_count": null, 79 | "outputs": [ 80 | { 81 | "output_type": "stream", 82 | "name": "stdout", 83 | "text": [ 84 | "Drive already mounted at /content/gdrive; to attempt to forcibly remount, call drive.mount(\"/content/gdrive\", force_remount=True).\n" 85 | ] 86 | } 87 | ] 88 | }, 89 | { 90 | "cell_type": "code", 91 | "source": [ 92 | "# install Bayesian optimization library \"https://github.com/bayesian-optimization/BayesianOptimization\"\n", 93 | "%pip install bayesian-optimization==1.4.1\n", 94 | "from bayes_opt import BayesianOptimization,UtilityFunction" 95 | ], 96 | "metadata": { 97 | "colab": { 98 | "base_uri": "https://localhost:8080/" 99 | }, 100 | "id": "CrbZE4FvZhbf", 101 | "outputId": "7cbc93bf-ae8b-4936-9fa9-70eb3727dcfb" 102 | }, 103 | "execution_count": null, 104 | "outputs": [ 105 | { 106 | "output_type": "stream", 107 | "name": "stdout", 108 | "text": [ 109 | "Requirement already satisfied: bayesian-optimization==1.4.1 in /usr/local/lib/python3.10/dist-packages (1.4.1)\n", 110 | "Requirement already satisfied: numpy>=1.9.0 in /usr/local/lib/python3.10/dist-packages (from bayesian-optimization==1.4.1) (1.23.5)\n", 111 | "Requirement already satisfied: scipy>=1.0.0 in /usr/local/lib/python3.10/dist-packages (from bayesian-optimization==1.4.1) (1.11.4)\n", 112 | "Requirement already satisfied: scikit-learn>=0.18.0 in /usr/local/lib/python3.10/dist-packages (from bayesian-optimization==1.4.1) (1.2.2)\n", 113 | "Requirement already satisfied: colorama in /usr/local/lib/python3.10/dist-packages (from bayesian-optimization==1.4.1) (0.4.6)\n", 114 | "Requirement already satisfied: joblib>=1.1.1 in /usr/local/lib/python3.10/dist-packages (from scikit-learn>=0.18.0->bayesian-optimization==1.4.1) (1.3.2)\n", 115 | "Requirement already satisfied: threadpoolctl>=2.0.0 in /usr/local/lib/python3.10/dist-packages (from scikit-learn>=0.18.0->bayesian-optimization==1.4.1) (3.2.0)\n" 116 | ] 117 | } 118 | ] 119 | }, 120 | { 121 | "cell_type": "markdown", 122 | "source": [ 123 | "## In-built classes" 124 | ], 125 | "metadata": { 126 | "id": "qECf7VXwCvKO" 127 | } 128 | }, 129 | { 130 | "cell_type": "markdown", 131 | "source": [ 132 | "### Gradient Tape" 133 | ], 134 | "metadata": { 135 | "id": "GQQzlB87IQS1" 136 | } 137 | }, 138 | { 139 | "cell_type": "code", 140 | "source": [ 141 | "import tensorflow as tf\n", 142 | "import numpy as np\n", 143 | "import matplotlib.pyplot as plt\n", 144 | "\n", 145 | "class GradientLayer(tf.keras.layers.Layer):\n", 146 | " \"\"\"\n", 147 | " Custom layer to compute 1st and 2nd derivatives for the wave equation.\n", 148 | "\n", 149 | " Attributes:\n", 150 | " model: keras network model.\n", 151 | " \"\"\"\n", 152 | "\n", 153 | " def __init__(self, model, **kwargs):\n", 154 | " \"\"\"\n", 155 | " Args:\n", 156 | " model: keras network model.\n", 157 | " \"\"\"\n", 158 | "\n", 159 | " self.model = model\n", 160 | " super().__init__(**kwargs)\n", 161 | "\n", 162 | " def call(self, tx):\n", 163 | " \"\"\"\n", 164 | " Computing 1st and 2nd derivatives for the wave equation.\n", 165 | "\n", 166 | " Args:\n", 167 | " tx: input variables (t, x).\n", 168 | "\n", 169 | " Returns:\n", 170 | " u: network output.\n", 171 | " du_dt: 1st derivative of t.\n", 172 | " du_dx: 1st derivative of x.\n", 173 | " d2u_dt2: 2nd derivative of t.\n", 174 | " d2u_dx2: 2nd derivative of x.\n", 175 | " \"\"\"\n", 176 | "\n", 177 | " with tf.GradientTape() as g:\n", 178 | " g.watch(tx)\n", 179 | " with tf.GradientTape() as gg:\n", 180 | " gg.watch(tx)\n", 181 | " u = self.model(tx)\n", 182 | " du_dtx = gg.batch_jacobian(u, tx)\n", 183 | " du_dt = du_dtx[..., 0]\n", 184 | " du_dx = du_dtx[..., 1]\n", 185 | " d2u_dtx2 = g.batch_jacobian(du_dtx, tx)\n", 186 | " d2u_dt2 = d2u_dtx2[..., 0, 0]\n", 187 | " d2u_dx2 = d2u_dtx2[..., 1, 1]\n", 188 | "\n", 189 | " return u, du_dt, du_dx, d2u_dt2, d2u_dx2" 190 | ], 191 | "metadata": { 192 | "id": "8GmwN5gSIOr2" 193 | }, 194 | "execution_count": null, 195 | "outputs": [] 196 | }, 197 | { 198 | "cell_type": "markdown", 199 | "source": [ 200 | "### PINNs" 201 | ], 202 | "metadata": { 203 | "id": "e7-8pYNbDJEv" 204 | } 205 | }, 206 | { 207 | "cell_type": "code", 208 | "source": [ 209 | "class PINN:\n", 210 | " \"\"\"\n", 211 | " Build a physics informed neural network (PINN) model for the wave equation.\n", 212 | "\n", 213 | " Attributes:\n", 214 | " network: keras network model with input (t, x) and output u(t, x).\n", 215 | " c: wave velocity.\n", 216 | " grads: gradient layer.\n", 217 | " \"\"\"\n", 218 | "\n", 219 | " def __init__(self, network, c):\n", 220 | " \"\"\"\n", 221 | " Args:\n", 222 | " network: keras network model with input (t, x) and output u(t, x).\n", 223 | " c: wave velocity. Default is 1.\n", 224 | " \"\"\"\n", 225 | "\n", 226 | " self.network = network\n", 227 | " self.c = c\n", 228 | " self.grads = GradientLayer(self.network)\n", 229 | "\n", 230 | " def build(self):\n", 231 | " \"\"\"\n", 232 | " Build a PINN model for the wave equation.\n", 233 | "\n", 234 | " Returns:\n", 235 | " PINN model for the projectile motion with\n", 236 | " input: [ (t, x) relative to equation,\n", 237 | " (t=0, x) relative to initial condition,\n", 238 | " (t, x=bounds) relative to boundary condition ],\n", 239 | " output: [ u(t,x) relative to equation,\n", 240 | " u(t=0, x) relative to initial condition,\n", 241 | " du_dt(t=0, x) relative to initial derivative of t,\n", 242 | " u(t, x=bounds) relative to boundary condition ]\n", 243 | " \"\"\"\n", 244 | "\n", 245 | " # equation input: (t, x)\n", 246 | " tx_eqn = tf.keras.layers.Input(shape=(2,))\n", 247 | " # initial condition input: (t=0, x)\n", 248 | " tx_ini = tf.keras.layers.Input(shape=(2,))\n", 249 | " # boundary condition input: (t, x=-1) or (t, x=+1)\n", 250 | " tx_bnd = tf.keras.layers.Input(shape=(2,))\n", 251 | "\n", 252 | " # compute gradients\n", 253 | " _, _, _, d2u_dt2, d2u_dx2 = self.grads(tx_eqn)\n", 254 | "\n", 255 | " # equation output being zero\n", 256 | " u_eqn = d2u_dt2 - self.c*self.c * d2u_dx2\n", 257 | " # initial condition output\n", 258 | " u_ini, du_dt_ini, _, _, _ = self.grads(tx_ini)\n", 259 | " # boundary condition output\n", 260 | " u_bnd = self.network(tx_bnd) # dirichlet\n", 261 | " #_, _, u_bnd, _, _ = self.grads(tx_bnd) # neumann\n", 262 | "\n", 263 | " # build the PINN model for the wave equation\n", 264 | " return tf.keras.models.Model(\n", 265 | " inputs=[tx_eqn, tx_ini, tx_bnd],\n", 266 | " outputs=[u_eqn, u_ini, du_dt_ini, u_bnd])" 267 | ], 268 | "metadata": { 269 | "id": "N_6QYlj4C04v" 270 | }, 271 | "execution_count": null, 272 | "outputs": [] 273 | }, 274 | { 275 | "cell_type": "markdown", 276 | "source": [ 277 | "### Network for PINN" 278 | ], 279 | "metadata": { 280 | "id": "ZWPMeef1DLeA" 281 | } 282 | }, 283 | { 284 | "cell_type": "code", 285 | "source": [ 286 | "class Network:\n", 287 | " \"\"\"\n", 288 | " Build a physics informed neural network (PINN) model for the wave equation.\n", 289 | " \"\"\"\n", 290 | "\n", 291 | " @classmethod\n", 292 | " def build(cls, num_inputs=2, layers=[64, 128, 128, 128, 128, 64], activation='tanh', num_outputs=1):\n", 293 | " \"\"\"\n", 294 | " Build a PINN model for the wave equation with input shape (t, x) and output shape u(t, x).\n", 295 | "\n", 296 | " Args:\n", 297 | " num_inputs: number of input variables. Default is 2 for (t, x).\n", 298 | " layers: number of hidden layers.\n", 299 | " activation: activation function in hidden layers.\n", 300 | " num_outpus: number of output variables. Default is 1 for u(t, x).\n", 301 | "\n", 302 | " Returns:\n", 303 | " keras network model.\n", 304 | " \"\"\"\n", 305 | "\n", 306 | " # input layer\n", 307 | " inputs = tf.keras.layers.Input(shape=(num_inputs,))\n", 308 | " # hidden layers\n", 309 | " x = inputs\n", 310 | " for layer in layers:\n", 311 | " x = tf.keras.layers.Dense(layer, activation=activation,\n", 312 | " kernel_initializer='he_normal')(x)\n", 313 | " x = tf.keras.layers.Dropout(0.1)(x)\n", 314 | " # output layer\n", 315 | " outputs = tf.keras.layers.Dense(num_outputs,\n", 316 | " kernel_initializer='he_normal')(x)\n", 317 | "\n", 318 | " return tf.keras.models.Model(inputs=inputs, outputs=outputs)" 319 | ], 320 | "metadata": { 321 | "id": "YqrofsFgDNXR" 322 | }, 323 | "execution_count": null, 324 | "outputs": [] 325 | }, 326 | { 327 | "cell_type": "markdown", 328 | "source": [ 329 | "### Optimizer for PINN" 330 | ], 331 | "metadata": { 332 | "id": "ipTUkVObDT3M" 333 | } 334 | }, 335 | { 336 | "cell_type": "code", 337 | "source": [ 338 | "import scipy.optimize\n", 339 | "\n", 340 | "class L_BFGS_B:\n", 341 | " \"\"\"\n", 342 | " Optimize the keras network model using L-BFGS-B algorithm.\n", 343 | "\n", 344 | " Attributes:\n", 345 | " model: optimization target model.\n", 346 | " samples: training samples.\n", 347 | " factr: convergence condition. typical values for factr are: 1e12 for low accuracy;\n", 348 | " 1e7 for moderate accuracy; 10 for extremely high accuracy.\n", 349 | " m: maximum number of variable metric corrections used to define the limited memory matrix.\n", 350 | " maxls: maximum number of line search steps (per iteration).\n", 351 | " maxiter: maximum number of iterations.\n", 352 | " metris: logging metrics.\n", 353 | " progbar: progress bar.\n", 354 | " \"\"\"\n", 355 | "\n", 356 | " def __init__(self, model, x_train, y_train, m=10, factr=1e7, pgtol=1e-5,\n", 357 | " epsilon=1e-8, maxiter=5000, maxls=50):\n", 358 | " \"\"\"\n", 359 | " Args:\n", 360 | " model: optimization target model.\n", 361 | " samples: training samples.\n", 362 | " factr: convergence condition. typical values for factr are: 1e12 for low accuracy;\n", 363 | " 1e7 for moderate accuracy; 10.0 for extremely high accuracy.\n", 364 | " m: maximum number of variable metric corrections used to define the limited memory matrix.\n", 365 | " maxls: maximum number of line search steps (per iteration).\n", 366 | " maxiter: maximum number of iterations.\n", 367 | " \"\"\"\n", 368 | "\n", 369 | " # set attributes\n", 370 | " self.model = model\n", 371 | " self.x_train = [ tf.constant(x, dtype=tf.float32) for x in x_train ]\n", 372 | " self.y_train = [ tf.constant(y, dtype=tf.float32) for y in y_train ]\n", 373 | " self.factr = factr\n", 374 | " self.m = m\n", 375 | " self.pgtol = pgtol\n", 376 | " self.epsilon = epsilon\n", 377 | " self.maxls = maxls\n", 378 | " self.maxiter = maxiter\n", 379 | " self.metrics = ['loss']\n", 380 | " # initialize the progress bar\n", 381 | " self.progbar = tf.keras.callbacks.ProgbarLogger(\n", 382 | " count_mode='steps', stateful_metrics=self.metrics)\n", 383 | " self.progbar.set_params( {\n", 384 | " 'verbose':1, 'epochs':1, 'steps':self.maxiter, 'metrics':self.metrics})\n", 385 | "\n", 386 | " def set_weights(self, flat_weights):\n", 387 | " \"\"\"\n", 388 | " Set weights to the model.\n", 389 | "\n", 390 | " Args:\n", 391 | " flat_weights: flatten weights.\n", 392 | " \"\"\"\n", 393 | "\n", 394 | " # get model weights\n", 395 | " shapes = [ w.shape for w in self.model.get_weights() ]\n", 396 | " # compute splitting indices\n", 397 | " split_ids = np.cumsum([ np.prod(shape) for shape in [0] + shapes ])\n", 398 | " # reshape weights\n", 399 | " weights = [ flat_weights[from_id:to_id].reshape(shape)\n", 400 | " for from_id, to_id, shape in zip(split_ids[:-1], split_ids[1:], shapes) ]\n", 401 | " # set weights to the model\n", 402 | " self.model.set_weights(weights)\n", 403 | "\n", 404 | " @tf.function\n", 405 | " def tf_evaluate(self, x, y):\n", 406 | " \"\"\"\n", 407 | " Evaluate loss and gradients for weights as tf.Tensor.\n", 408 | "\n", 409 | " Args:\n", 410 | " x: input data.\n", 411 | "\n", 412 | " Returns:\n", 413 | " loss and gradients for weights as tf.Tensor.\n", 414 | " \"\"\"\n", 415 | "\n", 416 | " with tf.GradientTape() as g:\n", 417 | " loss = tf.reduce_mean(tf.keras.losses.mse(self.model(x), y))\n", 418 | " grads = g.gradient(loss, self.model.trainable_variables)\n", 419 | " return loss, grads\n", 420 | "\n", 421 | " def evaluate(self, weights):\n", 422 | " \"\"\"\n", 423 | " Evaluate loss and gradients for weights as ndarray.\n", 424 | "\n", 425 | " Args:\n", 426 | " weights: flatten weights.\n", 427 | "\n", 428 | " Returns:\n", 429 | " loss and gradients for weights as ndarray.\n", 430 | " \"\"\"\n", 431 | "\n", 432 | " # update weights\n", 433 | " self.set_weights(weights)\n", 434 | " # compute loss and gradients for weights\n", 435 | " loss, grads = self.tf_evaluate(self.x_train, self.y_train)\n", 436 | " # convert tf.Tensor to flatten ndarray\n", 437 | " loss = loss.numpy().astype('float64')\n", 438 | " grads = np.concatenate([ g.numpy().flatten() for g in grads ]).astype('float64')\n", 439 | "\n", 440 | " return loss, grads\n", 441 | "\n", 442 | " def callback(self, weights):\n", 443 | " \"\"\"\n", 444 | " Callback that prints the progress to stdout.\n", 445 | "\n", 446 | " Args:\n", 447 | " weights: flatten weights.\n", 448 | " \"\"\"\n", 449 | " self.progbar.on_batch_begin(0)\n", 450 | " loss, _ = self.evaluate(weights)\n", 451 | " self.progbar.on_batch_end(0, logs=dict(zip(self.metrics, [loss])))\n", 452 | "\n", 453 | " def fit(self):\n", 454 | " \"\"\"\n", 455 | " Train the model using L-BFGS-B algorithm.\n", 456 | " \"\"\"\n", 457 | "\n", 458 | " # get initial weights as a flat vector\n", 459 | " initial_weights = np.concatenate(\n", 460 | " [ w.flatten() for w in self.model.get_weights() ])\n", 461 | " # optimize the weight vector\n", 462 | " print('Optimizer: L-BFGS-B (maxiter={})'.format(self.maxiter))\n", 463 | " self.progbar.on_train_begin()\n", 464 | " self.progbar.on_epoch_begin(1)\n", 465 | "\n", 466 | " scipy.optimize.fmin_l_bfgs_b(func=self.evaluate,\n", 467 | " x0=initial_weights,\n", 468 | " factr=self.factr,\n", 469 | " pgtol=self.pgtol,\n", 470 | " epsilon=self.epsilon,\n", 471 | " m=self.m,\n", 472 | " maxls=self.maxls,\n", 473 | " maxiter=self.maxiter,\n", 474 | " callback=self.callback)\n", 475 | "\n", 476 | " self.progbar.on_epoch_end(1)\n", 477 | " self.progbar.on_train_end()\n" 478 | ], 479 | "metadata": { 480 | "id": "RDynBdklDSqh" 481 | }, 482 | "execution_count": null, 483 | "outputs": [] 484 | }, 485 | { 486 | "cell_type": "markdown", 487 | "source": [ 488 | "## Upload data (snapshot observation)" 489 | ], 490 | "metadata": { 491 | "id": "WpYtKf8CDl7P" 492 | } 493 | }, 494 | { 495 | "cell_type": "code", 496 | "source": [ 497 | "#from bayes_opt import BayesianOptimization, UtilityFunction\n", 498 | "import math\n", 499 | "import scipy.io\n", 500 | "import os\n", 501 | "from os.path import join\n", 502 | "import time\n", 503 | "\n", 504 | "# number of training samples: found 25000 points is optimal for the resolution of u(x,t) in PINN\n", 505 | "num_train_samples = 25000\n", 506 | "\n", 507 | "# number of test samples\n", 508 | "num_test_samples = 5000\n", 509 | "\n", 510 | "# Other variables\n", 511 | "L = 10\n", 512 | "n = L\n", 513 | "T = 1\n", 514 | "\n", 515 | "# define x,t for PINNs prediction\n", 516 | "x_test = np.linspace(0,L,num_test_samples)\n", 517 | "t_test = np.linspace(0,T,num_test_samples)\n", 518 | "\n", 519 | "# upload the snapshot observation\n", 520 | "dir_list = os.listdir(path) # path defined in 2 cell\n", 521 | "print(\"Files in directory\",dir_list)\n", 522 | "idx_data = 0 # 0,1,2 # which file\n", 523 | "data = dir_list[idx_data]\n", 524 | "print(\"Imported file\", data)\n", 525 | "\n", 526 | "file = join(path, data)\n", 527 | "u_analy = scipy.io.loadmat(file)\n", 528 | "u_analy = u_analy['a1']\n", 529 | "\n", 530 | "# plot the snapshot observation\n", 531 | "fig = plt.figure(figsize=(7,4))\n", 532 | "plt.plot(x_test,u_analy, '-', linewidth = 2)\n", 533 | "plt.title(\"Snapshot observation at = 0.25s\",fontsize=15)\n", 534 | "plt.xlabel('$x$', fontsize = 15)\n", 535 | "plt.ylabel('Normalized u(x,t)', fontsize = 15)\n", 536 | "plt.xticks(fontsize = 12)\n", 537 | "plt.yticks(fontsize = 12)\n", 538 | "\n", 539 | "# time of observation = for PINN prediction of u(x,t) at tilde_t\n", 540 | "tilde_t = 0.25" 541 | ], 542 | "metadata": { 543 | "id": "_3cuJlPqCHZd", 544 | "colab": { 545 | "base_uri": "https://localhost:8080/", 546 | "height": 459 547 | }, 548 | "outputId": "d5169459-39aa-4294-d7cb-127b58634e5e" 549 | }, 550 | "execution_count": null, 551 | "outputs": [ 552 | { 553 | "output_type": "stream", 554 | "name": "stdout", 555 | "text": [ 556 | "Files in directory ['u_analytic_c=0.2t=0.25snr=39.36.mat', 'u_analytic_c=0.55t=0.25snr=38.91.mat', 'u_analytic_c=0.85t=0.25snr=37.5.mat']\n", 557 | "Imported file u_analytic_c=0.2t=0.25snr=39.36.mat\n" 558 | ] 559 | }, 560 | { 561 | "output_type": "display_data", 562 | "data": { 563 | "text/plain": [ 564 | "
" 565 | ], 566 | "image/png": "\n" 567 | }, 568 | "metadata": {} 569 | } 570 | ] 571 | }, 572 | { 573 | "cell_type": "markdown", 574 | "source": [ 575 | "## Collocation points" 576 | ], 577 | "metadata": { 578 | "id": "mPj-1ODfEFhe" 579 | } 580 | }, 581 | { 582 | "cell_type": "code", 583 | "source": [ 584 | "#%% Initial conditions\n", 585 | "def u0(t):\n", 586 | " z = -np.sin(1*math.pi*t)\n", 587 | " return z\n", 588 | "\n", 589 | "def du0_dt(tx):\n", 590 | " with tf.GradientTape() as g:\n", 591 | " g.watch(tx)\n", 592 | " u = u0(tx)\n", 593 | " du_dt = g.batch_jacobian(u, tx)[..., 0]\n", 594 | " return du_dt\n", 595 | "\n", 596 | "def RMS(S):\n", 597 | " rms = np.sqrt(np.mean(S**2))\n", 598 | " return rms\n", 599 | "\n", 600 | "#%% collocation points\n", 601 | "# create training input\n", 602 | "tx_eqn = np.random.rand(num_train_samples, 2)\n", 603 | "tx_eqn[..., 0] = T*tx_eqn[..., 0] # t = 0 ~ +1\n", 604 | "tx_eqn[..., 1] = L*tx_eqn[..., 1] # x = 0 ~ +10\n", 605 | "#print('\\nShape of t_eqn ==>',tx_eqn.shape)\n", 606 | "\n", 607 | "tx_ini = np.random.rand(num_train_samples, 2)\n", 608 | "tx_ini[..., 0] = 0 # t = 0\n", 609 | "tx_ini[..., 1] = L*tx_ini[..., 1] # x = 0 ~ +10\n", 610 | "#print('\\nShape of tx_ini ==>',tx_ini.shape)\n", 611 | "\n", 612 | "tx_bnd = np.random.rand(num_train_samples, 2)\n", 613 | "tx_bnd[..., 0] = T*tx_bnd[..., 0] # t = 0 ~ +1\n", 614 | "tx_bnd[..., 1] = L*np.round(tx_bnd[..., 1]) # x = 0 or +10\n", 615 | "#print('\\nShape of tx_bnd ==>',tx_bnd.shape)\n", 616 | "\n", 617 | "# initial and boundary conditions\n", 618 | "u_zero = np.zeros((num_train_samples, 1))\n", 619 | "u_ini = u0(tx_ini[:,1,None])\n", 620 | "du_dt_ini = np.zeros((num_train_samples, 1))" 621 | ], 622 | "metadata": { 623 | "id": "xHHrWjfvCeaP" 624 | }, 625 | "execution_count": null, 626 | "outputs": [] 627 | }, 628 | { 629 | "cell_type": "markdown", 630 | "source": [ 631 | "## Target function or objective function for BOPINN" 632 | ], 633 | "metadata": { 634 | "id": "_3hVo0wKEOyZ" 635 | } 636 | }, 637 | { 638 | "cell_type": "code", 639 | "source": [ 640 | "#%% Target function or ojective function, g(c) = (u_pred - u_true)^2; u_pred via PINNs\n", 641 | "def model_builder(ic):\n", 642 | " #ic = hp.Float('ic', min_value=0.1, max_value=1, step=10)\n", 643 | " print('\\n ## ->>>> PINNs simulation at speed = ' + str(ic))\n", 644 | "\n", 645 | " # build a PINN model\n", 646 | " network = Network.build()\n", 647 | " pinn = PINN(network,ic).build()\n", 648 | "\n", 649 | " # train the model using L-BFGS-B algorithm\n", 650 | " begin = time.time()\n", 651 | " x_train = [tx_eqn, tx_ini, tx_bnd]\n", 652 | " y_train = [u_zero, u_ini, du_dt_ini, u_zero]\n", 653 | " lbfgs = L_BFGS_B(model=pinn, x_train=x_train, y_train=y_train)\n", 654 | " lbfgs.fit()\n", 655 | " end = time.time()\n", 656 | " totaltime = end-begin\n", 657 | " print(\"\\n Total runtime is (min.)\",totaltime/60)\n", 658 | "\n", 659 | " # test the model\n", 660 | " tx = np.stack([np.full(t_test.shape, tilde_t), x_test], axis=-1)\n", 661 | " u_pred = network.predict(tx, batch_size=num_test_samples)\n", 662 | "\n", 663 | " # mse between u_pred via PINN and snapshot observation\n", 664 | " mse = -np.mean(np.square(u_analy - u_pred))\n", 665 | "\n", 666 | " del network, pinn, lbfgs, u_pred\n", 667 | "\n", 668 | " return mse" 669 | ], 670 | "metadata": { 671 | "id": "Q2NA5OvMCg64" 672 | }, 673 | "execution_count": null, 674 | "outputs": [] 675 | }, 676 | { 677 | "cell_type": "markdown", 678 | "source": [ 679 | "## Training" 680 | ], 681 | "metadata": { 682 | "id": "bJ-eT6gwEYSH" 683 | } 684 | }, 685 | { 686 | "cell_type": "code", 687 | "source": [ 688 | "#%% Bayesian Optimization\n", 689 | "# Attributes of BO\n", 690 | "itt_explore = 5\n", 691 | "itt = 45\n", 692 | "itt_all = itt_explore + itt\n", 693 | "n_runs = 10 # reduce this if colab has limited capability\n", 694 | "\n", 695 | "# bounds of BO\n", 696 | "pbounds = {'ic': (0.1, 1)}\n", 697 | "\n", 698 | "# Start BO\n", 699 | "mse_star_all = []\n", 700 | "cstar_all = []\n", 701 | "mse_all_all = []\n", 702 | "ic_all_all = []\n", 703 | "\n", 704 | "for r in range(n_runs):\n", 705 | " print('\\n ## ->>>> Run = ' + str(r))\n", 706 | "\n", 707 | " # define the model\n", 708 | " optimizer = BayesianOptimization(\n", 709 | " f=model_builder,\n", 710 | " pbounds=pbounds,\n", 711 | " allow_duplicate_points=True)\n", 712 | "\n", 713 | " # utility function\n", 714 | " util = UtilityFunction(kind='ucb',\n", 715 | " kappa=2.576,\n", 716 | " xi=0.0,\n", 717 | " kappa_decay=1,\n", 718 | " kappa_decay_delay=0)\n", 719 | "\n", 720 | " # run the model\n", 721 | " optimizer.maximize(init_points=itt_explore,\n", 722 | " n_iter=itt,\n", 723 | " acquisition_function=util)\n", 724 | "\n", 725 | " soln = optimizer.max\n", 726 | " resi = optimizer.res\n", 727 | "\n", 728 | " # optimum values\n", 729 | " mse_star = list(soln.values())[0]\n", 730 | " cstar = list(soln.values())[1]\n", 731 | " cstar2 = list(cstar.values())[0]\n", 732 | "\n", 733 | " # append all optimum values\n", 734 | " mse_star_all.append(mse_star)\n", 735 | " cstar_all.append(cstar2)\n", 736 | "\n", 737 | " # all run values\n", 738 | " mse_all, ic_all = [], []\n", 739 | " for i,res in enumerate(resi):\n", 740 | " mse = list(res.values())[0]\n", 741 | " ic = list(res.values())[1]\n", 742 | " ic2 = list(ic.values())[0]\n", 743 | "\n", 744 | " # append all run values\n", 745 | " mse_all.append(mse)\n", 746 | " ic_all.append(ic2)\n", 747 | "\n", 748 | " mse_all_all.append(np.array(mse_all))\n", 749 | " ic_all_all.append(np.array(ic_all))\n", 750 | "\n", 751 | " del optimizer\n", 752 | "\n", 753 | "mse_all_all = np.array(mse_all_all)\n", 754 | "mse_star_all = np.array(mse_star_all)\n", 755 | "ic_all_all = np.array(ic_all_all)\n", 756 | "cstar_all = np.array(cstar_all)" 757 | ], 758 | "metadata": { 759 | "id": "Mp27Bsy8Cl4P", 760 | "colab": { 761 | "base_uri": "https://localhost:8080/" 762 | }, 763 | "outputId": "27b03b23-b1dc-4b7b-c550-c7633601a453" 764 | }, 765 | "execution_count": null, 766 | "outputs": [ 767 | { 768 | "metadata": { 769 | "tags": null 770 | }, 771 | "name": "stdout", 772 | "output_type": "stream", 773 | "text": [ 774 | "\n", 775 | " ## ->>>> Run = 0\n", 776 | "| iter | target | ic |\n", 777 | "-------------------------------------\n", 778 | "\n", 779 | " ## ->>>> PINNs simulation at speed = 0.4372813898716186\n", 780 | "Optimizer: L-BFGS-B (maxiter=5000)\n", 781 | "5000/5000 [==============================] - 523s 105ms/step\n", 782 | "\n", 783 | " Total runtime is (min.) 8.710416158040365\n", 784 | "1/1 [==============================] - 0s 127ms/step\n", 785 | "| \u001b[0m1 \u001b[0m | \u001b[0m-0.001148\u001b[0m | \u001b[0m0.4373 \u001b[0m |\n", 786 | "\n", 787 | " ## ->>>> PINNs simulation at speed = 0.353260871860698\n", 788 | "Optimizer: L-BFGS-B (maxiter=5000)\n", 789 | "5000/5000 [==============================] - 457s 91ms/step\n", 790 | "\n", 791 | " Total runtime is (min.) 7.620774328708649\n", 792 | "1/1 [==============================] - 0s 108ms/step\n", 793 | "| \u001b[95m2 \u001b[0m | \u001b[95m-0.000404\u001b[0m | \u001b[95m0.3533 \u001b[0m |\n", 794 | "\n", 795 | " ## ->>>> PINNs simulation at speed = 0.9598970605863492\n", 796 | "Optimizer: L-BFGS-B (maxiter=5000)\n", 797 | "5000/5000 [==============================] - 1106s 221ms/step\n", 798 | "\n", 799 | " Total runtime is (min.) 18.436524299780526\n", 800 | "1/1 [==============================] - 0s 105ms/step\n", 801 | "| \u001b[0m3 \u001b[0m | \u001b[0m-0.03358 \u001b[0m | \u001b[0m0.9599 \u001b[0m |\n", 802 | "\n", 803 | " ## ->>>> PINNs simulation at speed = 0.868646025552868\n", 804 | "Optimizer: L-BFGS-B (maxiter=5000)\n", 805 | "5000/5000 [==============================] - 779s 156ms/step\n", 806 | "\n", 807 | " Total runtime is (min.) 12.977701457341512\n", 808 | "1/1 [==============================] - 0s 68ms/step\n", 809 | "| \u001b[0m4 \u001b[0m | \u001b[0m-0.02251 \u001b[0m | \u001b[0m0.8686 \u001b[0m |\n", 810 | "\n", 811 | " ## ->>>> PINNs simulation at speed = 0.15795893544754053\n", 812 | "Optimizer: L-BFGS-B (maxiter=5000)\n", 813 | "5000/5000 [==============================] - 502s 100ms/step\n" 814 | ] 815 | }, 816 | { 817 | "metadata": { 818 | "tags": null 819 | }, 820 | "name": "stderr", 821 | "output_type": "stream", 822 | "text": [ 823 | "WARNING:tensorflow:5 out of the last 5 calls to .predict_function at 0x79d518d530a0> triggered tf.function retracing. Tracing is expensive and the excessive number of tracings could be due to (1) creating @tf.function repeatedly in a loop, (2) passing tensors with different shapes, (3) passing Python objects instead of tensors. For (1), please define your @tf.function outside of the loop. For (2), @tf.function has reduce_retracing=True option that can avoid unnecessary retracing. For (3), please refer to https://www.tensorflow.org/guide/function#controlling_retracing and https://www.tensorflow.org/api_docs/python/tf/function for more details.\n" 824 | ] 825 | }, 826 | { 827 | "metadata": { 828 | "tags": null 829 | }, 830 | "name": "stdout", 831 | "output_type": "stream", 832 | "text": [ 833 | "\n", 834 | " Total runtime is (min.) 8.373841834068298\n", 835 | "1/1 [==============================] - 0s 109ms/step\n", 836 | "| \u001b[95m5 \u001b[0m | \u001b[95m-7.06e-05\u001b[0m | \u001b[95m0.158 \u001b[0m |\n", 837 | "\n", 838 | " ## ->>>> PINNs simulation at speed = 0.35322383568991045\n", 839 | "Optimizer: L-BFGS-B (maxiter=5000)\n", 840 | "5000/5000 [==============================] - 616s 123ms/step\n" 841 | ] 842 | }, 843 | { 844 | "metadata": { 845 | "tags": null 846 | }, 847 | "name": "stderr", 848 | "output_type": "stream", 849 | "text": [ 850 | "WARNING:tensorflow:6 out of the last 6 calls to .predict_function at 0x79d50627e170> triggered tf.function retracing. Tracing is expensive and the excessive number of tracings could be due to (1) creating @tf.function repeatedly in a loop, (2) passing tensors with different shapes, (3) passing Python objects instead of tensors. For (1), please define your @tf.function outside of the loop. For (2), @tf.function has reduce_retracing=True option that can avoid unnecessary retracing. For (3), please refer to https://www.tensorflow.org/guide/function#controlling_retracing and https://www.tensorflow.org/api_docs/python/tf/function for more details.\n" 851 | ] 852 | }, 853 | { 854 | "output_type": "stream", 855 | "name": "stdout", 856 | "text": [ 857 | "\n", 858 | " Total runtime is (min.) 10.258907715479532\n", 859 | "1/1 [==============================] - 0s 107ms/step\n", 860 | "| \u001b[0m6 \u001b[0m | \u001b[0m-0.000410\u001b[0m | \u001b[0m0.3532 \u001b[0m |\n", 861 | "\n", 862 | " ## ->>>> PINNs simulation at speed = 0.6265603597846434\n", 863 | "Optimizer: L-BFGS-B (maxiter=5000)\n", 864 | "5000/5000 [==============================] - 702s 140ms/step\n", 865 | "\n", 866 | " Total runtime is (min.) 11.704780928293864\n", 867 | "1/1 [==============================] - 0s 105ms/step\n", 868 | "| \u001b[0m7 \u001b[0m | \u001b[0m-0.005768\u001b[0m | \u001b[0m0.6266 \u001b[0m |\n", 869 | "\n", 870 | " ## ->>>> PINNs simulation at speed = 0.10004206006951194\n", 871 | "Optimizer: L-BFGS-B (maxiter=5000)\n", 872 | "5000/5000 [==============================] - 364s 73ms/step\n", 873 | "\n", 874 | " Total runtime is (min.) 6.072018718719482\n", 875 | "1/1 [==============================] - 0s 112ms/step\n", 876 | "| \u001b[0m8 \u001b[0m | \u001b[0m-0.000105\u001b[0m | \u001b[0m0.1 \u001b[0m |\n", 877 | "\n", 878 | " ## ->>>> PINNs simulation at speed = 0.25506179377329546\n", 879 | "Optimizer: L-BFGS-B (maxiter=5000)\n", 880 | "5000/5000 [==============================] - 443s 89ms/step\n", 881 | "\n", 882 | " Total runtime is (min.) 7.377660123507182\n", 883 | "1/1 [==============================] - 0s 83ms/step\n", 884 | "| \u001b[0m9 \u001b[0m | \u001b[0m-9.066e-0\u001b[0m | \u001b[0m0.2551 \u001b[0m |\n", 885 | "\n", 886 | " ## ->>>> PINNs simulation at speed = 0.20751207571890762\n", 887 | "Optimizer: L-BFGS-B (maxiter=5000)\n", 888 | "5000/5000 [==============================] - 375s 75ms/step\n", 889 | "\n", 890 | " Total runtime is (min.) 6.241973801453908\n", 891 | "1/1 [==============================] - 0s 119ms/step\n", 892 | "| \u001b[0m10 \u001b[0m | \u001b[0m-7.107e-0\u001b[0m | \u001b[0m0.2075 \u001b[0m |\n", 893 | "\n", 894 | " ## ->>>> PINNs simulation at speed = 0.29827013284790804\n", 895 | "Optimizer: L-BFGS-B (maxiter=5000)\n", 896 | "5000/5000 [==============================] - 419s 84ms/step\n", 897 | "\n", 898 | " Total runtime is (min.) 6.982113985220591\n", 899 | "1/1 [==============================] - 0s 76ms/step\n", 900 | "| \u001b[0m11 \u001b[0m | \u001b[0m-0.000182\u001b[0m | \u001b[0m0.2983 \u001b[0m |\n", 901 | "\n", 902 | " ## ->>>> PINNs simulation at speed = 0.12646718809275764\n", 903 | "Optimizer: L-BFGS-B (maxiter=5000)\n", 904 | "5000/5000 [==============================] - 481s 96ms/step\n", 905 | "\n", 906 | " Total runtime is (min.) 8.016359814008077\n", 907 | "1/1 [==============================] - 0s 81ms/step\n", 908 | "| \u001b[0m12 \u001b[0m | \u001b[0m-8.387e-0\u001b[0m | \u001b[0m0.1265 \u001b[0m |\n", 909 | "\n", 910 | " ## ->>>> PINNs simulation at speed = 0.18291510701869837\n", 911 | "Optimizer: L-BFGS-B (maxiter=5000)\n", 912 | "5000/5000 [==============================] - 367s 73ms/step\n", 913 | "\n", 914 | " Total runtime is (min.) 6.108590332667033\n", 915 | "1/1 [==============================] - 0s 80ms/step\n", 916 | "| \u001b[95m13 \u001b[0m | \u001b[95m-6.506e-0\u001b[0m | \u001b[95m0.1829 \u001b[0m |\n", 917 | "\n", 918 | " ## ->>>> PINNs simulation at speed = 0.2295051729538426\n", 919 | "Optimizer: L-BFGS-B (maxiter=5000)\n", 920 | "5000/5000 [==============================] - 510s 102ms/step\n", 921 | "\n", 922 | " Total runtime is (min.) 8.495574649175008\n", 923 | "1/1 [==============================] - 0s 133ms/step\n", 924 | "| \u001b[0m14 \u001b[0m | \u001b[0m-7.231e-0\u001b[0m | \u001b[0m0.2295 \u001b[0m |\n", 925 | "\n", 926 | " ## ->>>> PINNs simulation at speed = 0.17489332261182525\n", 927 | "Optimizer: L-BFGS-B (maxiter=5000)\n", 928 | "5000/5000 [==============================] - 480s 96ms/step\n", 929 | "\n", 930 | " Total runtime is (min.) 8.002258733908336\n", 931 | "1/1 [==============================] - 0s 67ms/step\n", 932 | "| \u001b[0m15 \u001b[0m | \u001b[0m-6.664e-0\u001b[0m | \u001b[0m0.1749 \u001b[0m |\n", 933 | "\n", 934 | " ## ->>>> PINNs simulation at speed = 0.19438706454255616\n", 935 | "Optimizer: L-BFGS-B (maxiter=5000)\n", 936 | "5000/5000 [==============================] - 365s 73ms/step\n", 937 | "\n", 938 | " Total runtime is (min.) 6.076679023106893\n", 939 | "1/1 [==============================] - 0s 67ms/step\n", 940 | "| \u001b[95m16 \u001b[0m | \u001b[95m-5.969e-0\u001b[0m | \u001b[95m0.1944 \u001b[0m |\n", 941 | "\n", 942 | " ## ->>>> PINNs simulation at speed = 0.1931523178425959\n", 943 | "Optimizer: L-BFGS-B (maxiter=5000)\n", 944 | "5000/5000 [==============================] - 478s 96ms/step\n", 945 | "\n", 946 | " Total runtime is (min.) 7.9739015102386475\n", 947 | "1/1 [==============================] - 0s 71ms/step\n", 948 | "| \u001b[95m17 \u001b[0m | \u001b[95m-5.967e-0\u001b[0m | \u001b[95m0.1932 \u001b[0m |\n", 949 | "\n", 950 | " ## ->>>> PINNs simulation at speed = 0.1472501091609439\n", 951 | "Optimizer: L-BFGS-B (maxiter=5000)\n", 952 | "5000/5000 [==============================] - 498s 100ms/step\n", 953 | "\n", 954 | " Total runtime is (min.) 8.299330997467042\n", 955 | "1/1 [==============================] - 0s 67ms/step\n", 956 | "| \u001b[0m18 \u001b[0m | \u001b[0m-7.572e-0\u001b[0m | \u001b[0m0.1473 \u001b[0m |\n", 957 | "\n", 958 | " ## ->>>> PINNs simulation at speed = 0.1864475687192167\n", 959 | "Optimizer: L-BFGS-B (maxiter=5000)\n", 960 | "5000/5000 [==============================] - 395s 79ms/step\n", 961 | "\n", 962 | " Total runtime is (min.) 6.576291259129842\n", 963 | "1/1 [==============================] - 0s 106ms/step\n", 964 | "| \u001b[0m19 \u001b[0m | \u001b[0m-6.111e-0\u001b[0m | \u001b[0m0.1864 \u001b[0m |\n", 965 | "\n", 966 | " ## ->>>> PINNs simulation at speed = 0.20641322721099062\n", 967 | "Optimizer: L-BFGS-B (maxiter=5000)\n", 968 | "5000/5000 [==============================] - 415s 83ms/step\n", 969 | "\n", 970 | " Total runtime is (min.) 6.909338291486105\n", 971 | "1/1 [==============================] - 0s 70ms/step\n", 972 | "| \u001b[0m20 \u001b[0m | \u001b[0m-6.846e-0\u001b[0m | \u001b[0m0.2064 \u001b[0m |\n", 973 | "\n", 974 | " ## ->>>> PINNs simulation at speed = 0.17467333008463468\n", 975 | "Optimizer: L-BFGS-B (maxiter=5000)\n", 976 | "5000/5000 [==============================] - 407s 81ms/step\n", 977 | "\n", 978 | " Total runtime is (min.) 6.785109670956929\n", 979 | "1/1 [==============================] - 0s 98ms/step\n", 980 | "| \u001b[0m21 \u001b[0m | \u001b[0m-6.953e-0\u001b[0m | \u001b[0m0.1747 \u001b[0m |\n", 981 | "\n", 982 | " ## ->>>> PINNs simulation at speed = 0.19224016373696584\n", 983 | "Optimizer: L-BFGS-B (maxiter=5000)\n", 984 | "5000/5000 [==============================] - 506s 101ms/step\n", 985 | "\n", 986 | " Total runtime is (min.) 8.428928422927857\n", 987 | "1/1 [==============================] - 0s 69ms/step\n", 988 | "| \u001b[0m22 \u001b[0m | \u001b[0m-6.054e-0\u001b[0m | \u001b[0m0.1922 \u001b[0m |\n", 989 | "\n", 990 | " ## ->>>> PINNs simulation at speed = 0.19200099153944267\n", 991 | "Optimizer: L-BFGS-B (maxiter=5000)\n", 992 | "5000/5000 [==============================] - 437s 87ms/step\n", 993 | "\n", 994 | " Total runtime is (min.) 7.2850401679674786\n", 995 | "1/1 [==============================] - 0s 103ms/step\n", 996 | "| \u001b[0m23 \u001b[0m | \u001b[0m-6.077e-0\u001b[0m | \u001b[0m0.192 \u001b[0m |\n", 997 | "\n", 998 | " ## ->>>> PINNs simulation at speed = 0.19115332829277382\n", 999 | "Optimizer: L-BFGS-B (maxiter=5000)\n", 1000 | "5000/5000 [==============================] - 335s 67ms/step\n", 1001 | "\n", 1002 | " Total runtime is (min.) 5.587451763947805\n", 1003 | "1/1 [==============================] - 0s 68ms/step\n", 1004 | "| \u001b[0m24 \u001b[0m | \u001b[0m-6.288e-0\u001b[0m | \u001b[0m0.1912 \u001b[0m |\n", 1005 | "\n", 1006 | " ## ->>>> PINNs simulation at speed = 0.19599276179575198\n", 1007 | "Optimizer: L-BFGS-B (maxiter=5000)\n", 1008 | "5000/5000 [==============================] - 454s 91ms/step\n", 1009 | "\n", 1010 | " Total runtime is (min.) 7.566520047187805\n", 1011 | "1/1 [==============================] - 0s 101ms/step\n", 1012 | "| \u001b[0m25 \u001b[0m | \u001b[0m-6.409e-0\u001b[0m | \u001b[0m0.196 \u001b[0m |\n", 1013 | "\n", 1014 | " ## ->>>> PINNs simulation at speed = 0.1854055143664269\n", 1015 | "Optimizer: L-BFGS-B (maxiter=5000)\n", 1016 | "5000/5000 [==============================] - 456s 91ms/step\n", 1017 | "\n", 1018 | " Total runtime is (min.) 7.592611781756083\n", 1019 | "1/1 [==============================] - 0s 69ms/step\n", 1020 | "| \u001b[0m26 \u001b[0m | \u001b[0m-6.051e-0\u001b[0m | \u001b[0m0.1854 \u001b[0m |\n", 1021 | "\n", 1022 | " ## ->>>> PINNs simulation at speed = 0.186162721420857\n", 1023 | "Optimizer: L-BFGS-B (maxiter=5000)\n" 1024 | ] 1025 | } 1026 | ] 1027 | }, 1028 | { 1029 | "cell_type": "markdown", 1030 | "source": [ 1031 | "## Processing and plotting" 1032 | ], 1033 | "metadata": { 1034 | "id": "Bp5UWXSnE_YX" 1035 | } 1036 | }, 1037 | { 1038 | "cell_type": "code", 1039 | "source": [ 1040 | "#%% Process the BO results\n", 1041 | "# max, min, mean and sd target function/objective function value across different runs\n", 1042 | "max_mse_star_allruns, min_mse_star_allruns = np.max(mse_star_all), np.min(mse_star_all)\n", 1043 | "mean_mse_star_allruns, std_mse_star_allruns = np.mean(mse_star_all), np.std(mse_star_all)\n", 1044 | "\n", 1045 | "# optima corresponding to abovementioned optimal points\n", 1046 | "idx_max_mse_star_allruns = np.where(max_mse_star_allruns == mse_star_all)\n", 1047 | "idx_min_mse_star_allruns = np.where(min_mse_star_allruns == mse_star_all)\n", 1048 | "\n", 1049 | "max_cstar_allruns = cstar_all[idx_max_mse_star_allruns]\n", 1050 | "min_cstar_allruns = cstar_all[idx_min_mse_star_allruns]\n", 1051 | "mean_cstar_allruns = np.mean(cstar_all)\n", 1052 | "std_cstar_allruns = np.std(cstar_all)\n", 1053 | "\n", 1054 | "print(\"Max (best optimal) tf across runs = \",max_mse_star_allruns)\n", 1055 | "print(\"Min (worst optimal) tf across runs = \",min_mse_star_allruns)\n", 1056 | "print(\"Mean tf across runs = \",mean_mse_star_allruns)\n", 1057 | "print(\"Std tf across runs = \",std_mse_star_allruns)\n", 1058 | "\n", 1059 | "print(\"Max (best optimal) c* across runs = \",max_cstar_allruns)\n", 1060 | "print(\"Min (worst optimal) c* across runs = \",min_cstar_allruns)\n", 1061 | "print(\"Mean c* across runs = \",mean_cstar_allruns)\n", 1062 | "print(\"Std c* across runs = \",std_cstar_allruns)" 1063 | ], 1064 | "metadata": { 1065 | "id": "m45_nEHXEcel" 1066 | }, 1067 | "execution_count": null, 1068 | "outputs": [] 1069 | }, 1070 | { 1071 | "cell_type": "code", 1072 | "source": [ 1073 | "# plot best optimal run with the optima\n", 1074 | "idx_max_all = []\n", 1075 | "for i in range(mse_all_all.shape[0]):\n", 1076 | " idx_max = np.where(mse_all_all[i,:] == mse_star_all[i])\n", 1077 | " idx_max = idx_max[0][0]\n", 1078 | " idx_max_all.append(idx_max)\n", 1079 | "\n", 1080 | "mean_mse_all = np.mean(mse_all_all, axis=0)\n", 1081 | "std_mse_all = np.std(mse_all_all, axis=0)\n", 1082 | "mean_ic_all = np.mean(ic_all_all, axis=0)\n", 1083 | "std_ic_all = np.std(ic_all_all, axis=0)\n", 1084 | "\n", 1085 | "opt_mse_run = mse_all_all[idx_max_mse_star_allruns[0][0]]\n", 1086 | "opt_c_run = ic_all_all[idx_max_mse_star_allruns[0][0]]\n", 1087 | "opt_mse = mse_star_all[idx_max_mse_star_allruns[0][0]]\n", 1088 | "opt_c = cstar_all[idx_max_mse_star_allruns[0][0]]\n", 1089 | "\n", 1090 | "txt = 'c* = '+ str(round(opt_c,4))\n", 1091 | "plt.figure(figsize = (8, 6))\n", 1092 | "plt.plot(opt_c_run,opt_mse_run,'ob',markersize=6)\n", 1093 | "plt.plot(opt_c,opt_mse,'*r',markersize=8, label = 'Best optima')\n", 1094 | "#plt.text(0.75, -0.03, txt, fontsize=18, c = 'r')\n", 1095 | "plt.xlabel(\"velocity, c\",fontsize=20)\n", 1096 | "plt.ylabel(\"target function, g(c)\",fontsize=20)\n", 1097 | "plt.xticks(fontsize=20)\n", 1098 | "plt.yticks(fontsize=20)\n", 1099 | "plt.legend(fontsize = 14, loc='upper left')\n", 1100 | "plt.savefig('tfvsc_'+str(idx_data+1)+'.png', bbox_inches='tight', dpi=600)\n", 1101 | "plt.show()" 1102 | ], 1103 | "metadata": { 1104 | "id": "qaTRHKjgFDP3" 1105 | }, 1106 | "execution_count": null, 1107 | "outputs": [] 1108 | } 1109 | ], 1110 | "metadata": { 1111 | "colab": { 1112 | "provenance": [], 1113 | "gpuType": "T4" 1114 | }, 1115 | "kernelspec": { 1116 | "display_name": "Python 3", 1117 | "name": "python3" 1118 | }, 1119 | "accelerator": "GPU" 1120 | }, 1121 | "nbformat": 4, 1122 | "nbformat_minor": 0 1123 | } --------------------------------------------------------------------------------