个人笔记-SAPINNs-2DHelmholtz

import tensorflow as tf
import numpy as np
import matplotlib.pyplot as plt
import time
import scipy.io
import math
import matplotlib.gridspec as gridspec
from plotting import newfig
from mpl_toolkits.axes_grid1 import make_axes_locatable
from tensorflow import keras
from tensorflow.keras.models import Sequential
from tensorflow.keras.layers import Dense, Input
from tensorflow.keras import layers, activations
from scipy.interpolate import griddata
from eager_lbfgs import lbfgs, Struct
from pyDOE import lhs

#define size of the network   (设置全连接神经网络的各层神经元的结构)
#全连接的神经网络的结构如下,输入的神经元是2个,输出的是1个。
#因此模型的输入应该是(batchsize,2),也就是说有batchsize那么多个(x,y),而输出则是(batchsize,1)。
layer_sizes = [2, 50, 50, 50, 50, 1]

sizes_w = []
sizes_b = []
for i, width in enumerate(layer_sizes):
    if i != 1:
        sizes_w.append(int(width * layer_sizes[1]))
        sizes_b.append(int(width if i != 0 else layer_sizes[1]))
def set_weights(model, w, sizes_w, sizes_b):
        for i, layer in enumerate(model.layers[0:]):
            start_weights = sum(sizes_w[:i]) + sum(sizes_b[:i])
            end_weights = sum(sizes_w[:i+1]) + sum(sizes_b[:i])
            weights = w[start_weights:end_weights]
            w_div = int(sizes_w[i] / sizes_b[i])
            weights = tf.reshape(weights, [w_div, sizes_b[i]])
            biases = w[end_weights:end_weights + sizes_b[i]]
            weights_biases = [weights, biases]
            layer.set_weights(weights_biases)
def get_weights(model):
    w = []
    for layer in model.layers[0:]:
        weights_biases = layer.get_weights()
        weights = weights_biases[0].flatten()
        biases = weights_biases[1]
        w.extend(weights)
        w.extend(biases)

    w = tf.convert_to_tensor(w)
    return w

def neural_net(layer_sizes):
    model = Sequential()
    model.add(layers.InputLayer(input_shape=(layer_sizes[0],)))
    for width in layer_sizes[1:-1]:
        model.add(layers.Dense(
            width, activation=tf.nn.tanh,
            kernel_initializer="glorot_normal"))
    model.add(layers.Dense(
            layer_sizes[-1], activation=None,
            kernel_initializer="glorot_normal"))
    return model


u_model = neural_net(layer_sizes)
def loss(x_f, y_f,
         x_lb, y_lb,
         x_ub, y_ub,
         x_rb, y_rb,
         x_lftb, ylftb,
         col_weights):

    f_u_pred = f_model(x_f, y_f)

    u_lb_pred = u_model(tf.concat([x_lb, y_lb],1))
    u_ub_pred = u_model(tf.concat([x_ub, y_ub],1))
    u_rb_pred = u_model(tf.concat([x_rb, y_rb],1))
    u_lftb_pred = u_model(tf.concat([x_lftb, y_lftb],1))

    mse_b_u = tf.reduce_mean(tf.square(u_lb_pred - 0)) + \
            tf.reduce_mean(tf.square(u_ub_pred - 0)) + \
            tf.reduce_mean(tf.square(u_rb_pred - 0)) + \
            tf.reduce_mean(tf.square(u_lftb_pred - 0))
    
    mse_f_u = tf.reduce_mean(tf.square(col_weights*f_u_pred))

    return  mse_b_u + mse_f_u , mse_b_u, mse_f_u
def f_model(x, y):
        with tf.GradientTape(persistent=True) as tape:
            tape.watch(x)
            tape.watch(y)

            u = u_model(tf.concat([x, y],1))
            
            u_x = tape.gradient(u, x)
            u_y = tape.gradient(u, y)

        u_xx = tape.gradient(u_x, x)

        u_yy = tape.gradient(u_y, y)
		
		#q(x,y)---forcing
        del tape
        a1 = 1.0
        a2 = 4.0
        ksq = 1.0 #k^2
        forcing = - (a1*math.pi)**2*np.sin(a1*math.pi*x)*np.sin(a2*math.pi*y) - \
                    (a2*math.pi)**2*np.sin(a1*math.pi*x)*np.sin(a2*math.pi*y) + \
                    ksq*np.sin(a1*math.pi*x)*np.sin(a2*math.pi*y)

        f_u = u_xx + u_yy + ksq*u - forcing

        return f_u
def fit(x_f, t_f, x_lb, y_lb, x_ub, y_ub, x_rb, y_rb, x_lftb, y_lftb, col_weights, tf_iter, newton_iter):

    batch_sz = N_f
    n_batches =  N_f // batch_sz
    start_time = time.time()
    tf_optimizer = tf.keras.optimizers.Adam(lr = 0.001, beta_1=.99)
    tf_optimizer_coll = tf.keras.optimizers.Adam(lr = 0.001, beta_1=.99)

    print("starting Adam training")
    for epoch in range(tf_iter):
        for i in range(n_batches):

            x_f_batch = x_f[i*batch_sz:(i*batch_sz + batch_sz),]
            y_f_batch = y_f[i*batch_sz:(i*batch_sz + batch_sz),]

            with tf.GradientTape(persistent=True) as tape:
                loss_value, mse_b, mse_f = loss(x_f, y_f, x_lb, y_lb, x_ub, y_ub, x_rb, y_rb, x_lftb, y_lftb, col_weights)
                grads = tape.gradient(loss_value, u_model.trainable_variables)
                grads_col = tape.gradient(loss_value, col_weights)
            tf_optimizer.apply_gradients(zip(grads, u_model.trainable_variables))
            tf_optimizer_coll.apply_gradients(zip([-grads_col], [col_weights]))


            del tape

            elapsed = time.time() - start_time
            print('It: %d, Time: %.2f' % (epoch, elapsed))
            tf.print(f"mse_b: {mse_b}  mse_f: {mse_f}   total loss: {loss_value}")
            start_time = time.time()


    print("Starting L-BFGS training")

    loss_and_flat_grad = get_loss_and_flat_grad(x_f, y_f, x_lb, y_lb, x_ub, y_ub, x_rb, y_rb, x_lftb, y_lftb, col_weights)

    lbfgs(loss_and_flat_grad,
      get_weights(u_model),
      Struct(), maxIter=newton_iter, learningRate=0.8)
def get_loss_and_flat_grad(x_f, y_f, x_lb, y_lb, x_ub, y_ub, x_rb, y_rb, x_lftb, y_lftb, col_weights):
    def loss_and_flat_grad(w):
        with tf.GradientTape() as tape:
            set_weights(u_model, w, sizes_w, sizes_b)
            loss_value, _, _ = loss(x_f, y_f, x_lb, y_lb, x_ub, y_ub, x_rb, y_rb, x_lftb, y_lftb, col_weights)
        grad = tape.gradient(loss_value, u_model.trainable_variables)
        grad_flat = []
        for g in grad:
            grad_flat.append(tf.reshape(g, [-1]))
        grad_flat = tf.concat(grad_flat, 0)
        #print(loss_value, grad_flat)
        return loss_value, grad_flat

    return loss_and_flat_grad
def predict(X_star):
    X_star = tf.convert_to_tensor(X_star, dtype=tf.float32)
    u_star = u_model(X_star)

    f_u_star = f_model(X_star[:,0:1],
                 X_star[:,1:2])

    return u_star.numpy(), f_u_star.numpy()

--------------------------------------------------------------------从main这里开始看--------------------------------------------------------------------------------------
因此,我们可以理解为PINNs模型的输入就是自变量的坐标点,一个个坐标点摞起来,每行是一个坐标(x,y),而输出的值就是那个坐标所对应的u(x,y)。而PINNs的输入分为边界点和内部点,在源代码中用u和f区分。我们知道这类偏微分方程求解时,需要确定边界条件和初始条件才能让解唯一。因此边界和初始的值是事先给定的,对于PINNs模型来说,就是初边值的点是监督学习的部分。而内部的点由于实现不知道其解u的值,所以是非监督学习,我们的目标就是让神经网络的输出满足方程,来解出内部点中u的值。举个例子,初边值的点应该有label,如果用(x,y,u)的数据结构表示的话,即(0.5,0,-1),(-1,0.5,0),其中前一个点上用初始条件给出的,后一个点是边界条件给出的。对于内部点,则只需要给出(x,y)即可,如(0.3,0.5),应在定义域x ∈ [−1, 1], y ∈ [-1, 1] 中取出足够多的点进行非监督学习。明白了模型的输入输出,就可以看明白该代码中main函数开头的数据预处理的部分了.

lb = np.array([-1.0]) #lower boundary
ub = np.array([1.0]) #upper boundary
rb = np.array([1.0]) #right boundary
lftb = np.array([-1.0]) #left boundary

N0 = 200   # 初值点的数量
N_b = 100 #25 per upper and lower boundary, so 50 total   # 边值点的数量
N_f = 100000  # 内部点的数量

col_weights = tf.Variable(tf.random.uniform([N_f, 1]))
u_weights = tf.Variable(100*tf.random.uniform([N0, 1]))


nx, ny = (1001,1001) #mesh size
x = np.linspace(-1, 1, nx) #x是网格点的x方向的空间序列
y = np.linspace(-1, 1, ny) #y是网格点的y方向的空间序列


xv, yv = np.meshgrid(x,y)

x = np.reshape(x, (-1,1))
y = np.reshape(y, (-1,1))


Exact_u = np.sin(math.pi*xv)*np.sin(4*math.pi*yv) #已知的精确解

# 随机打乱一下点的排序,避免训练时输入有规律的输入
idx_x = np.random.choice(x.shape[0], N0, replace=False)
x0 = x[idx_x,:]
u0 = Exact_u[idx_x,0:1]
# 其中x0代表初值点的坐标,u0代表初值对应的具体的值,即x0的label

idx_y = np.random.choice(y.shape[0], N_b, replace=False)
yb = y[idx_y, :]

# 制作内部点的数据集X_f
# lhs这个函数是随机生成N_f个0-1的数据,2代表生成的维度,因为(x,y)所以设置为2
# 因此这一行代表在定义域内随机生成N_f个(x,y)坐标
X_f = lb + (ub-lb)*lhs(2, N_f)

x_f = tf.convert_to_tensor(X_f[:,0:1], dtype=tf.float32)
y_f = tf.convert_to_tensor(X_f[:,1:2], dtype=tf.float32)


X0 = np.concatenate((x0, 0*x0), 1) # (x0, 0)
X_lb = np.concatenate(( yb, 0*yb + lb[0]), 1) # lower boundary (x, -1)
X_ub = np.concatenate(( yb, 0*yb + ub[0]), 1)  # upper boundary (x, 1)
X_rb = np.concatenate((0*yb + rb[0], yb), 1) # right boundary (1, y)
X_lftb = np.concatenate((0*yb + lftb[0], yb), 1) # left boundary (-1,y)


x0 = X0[:,0:1]
y0 = X0[:,1:2]

x_lb = tf.convert_to_tensor(X_lb[:,0:1], dtype=tf.float32)
y_lb = tf.convert_to_tensor(X_lb[:,1:2], dtype=tf.float32)

x_ub = tf.convert_to_tensor(X_ub[:,0:1], dtype=tf.float32)
y_ub = tf.convert_to_tensor(X_ub[:,1:2], dtype=tf.float32)

x_rb = tf.convert_to_tensor(X_rb[:,0:1], dtype=tf.float32)
y_rb = tf.convert_to_tensor(X_rb[:,1:2], dtype=tf.float32)

x_lftb = tf.convert_to_tensor(X_lftb[:,0:1], dtype=tf.float32)
y_lftb = tf.convert_to_tensor(X_lftb[:,1:2], dtype=tf.float32)

#Fit helmholtz (调用model的fit方法开始进行训练)
fit(x_f, y_f, x_lb, y_lb, x_ub, y_ub, x_rb, y_rb, x_lftb, y_lftb, col_weights,
    tf_iter = 10000, newton_iter = 10000)

#generate mesh for plotting
X, Y = np.meshgrid(x,y)

X_star = np.hstack((X.flatten()[:,None], Y.flatten()[:,None]))
u_star = Exact_u.flatten()[:,None]


lb = np.array([-1.0, -1.0])
ub = np.array([1.0, 1])

# 调用model的predict方法传入坐标X_star获得对应的结果u_pred和方程偏差 f_u_pred
u_pred, f_u_pred = predict(X_star)

# 计算error
error_u = np.linalg.norm(u_star-u_pred,2)/np.linalg.norm(u_star,2)

# 打印error
print('Error u: %e' % (error_u))



U_pred = griddata(X_star, u_pred.flatten(), (X, Y), method='cubic')


FU_pred = griddata(X_star, f_u_pred.flatten(), (X, Y), method='cubic')

######################################################################
############################# Plotting ###############################
######################################################################

fig, ax = newfig(1.3, 1.0)
ax.axis('off')

####### Row 0: h(t,x) ##################
gs0 = gridspec.GridSpec(1, 2)
gs0.update(top=1-0.06, bottom=1-1/3, left=0.15, right=0.85, wspace=0)
ax = plt.subplot(gs0[:, :])

h = ax.imshow(U_pred, interpolation='nearest', cmap='YlGnBu',
              extent=[lb[1], ub[1], lb[0], ub[0]],
              origin='lower', aspect='auto')
divider = make_axes_locatable(ax)
cax = divider.append_axes("right", size="5%", pad=0.05)
fig.colorbar(h, cax=cax)


line = np.linspace(x.min(), x.max(), 2)[:,None]
ax.plot(y[250]*np.ones((2,1)), line, 'k--', linewidth = 1)
ax.plot(y[500]*np.ones((2,1)), line, 'k--', linewidth = 1)
ax.plot(y[750]*np.ones((2,1)), line, 'k--', linewidth = 1)

ax.set_xlabel('$x$')
ax.set_ylabel('$y$')
leg = ax.legend(frameon=False, loc = 'best')

ax.set_title('$u(x,y)$', fontsize = 10)

####### Row 1: h(t,x) slices ##################
gs1 = gridspec.GridSpec(1, 3)
gs1.update(top=1-1/3, bottom=0, left=0.1, right=0.9, wspace=0.5)

ax = plt.subplot(gs1[0, 0])
ax.plot(x,Exact_u[:,250], 'b-', linewidth = 2, label = 'Exact')
ax.plot(x,U_pred[:,250], 'r--', linewidth = 2, label = 'Prediction')
ax.set_xlabel('$y$')
ax.set_ylabel('$u(x,y)$')
ax.set_title('$y = %.2f$' % (y[250]), fontsize = 10)
ax.axis('square')
ax.set_xlim([-1.1,1.1])
ax.set_ylim([-1.1,1.1])

ax = plt.subplot(gs1[0, 1])
ax.plot(x,Exact_u[:,500], 'b-', linewidth = 2, label = 'Exact')
ax.plot(x,U_pred[:,500], 'r--', linewidth = 2, label = 'Prediction')
ax.set_xlabel('$y$')
ax.set_ylabel('$u(x,y)$')
ax.axis('square')
ax.set_xlim([-1.1,1.1])
ax.set_ylim([-1.1,1.1])
ax.set_title('$x = %.2f$' % (y[500]), fontsize = 10)
ax.legend(loc='upper center', bbox_to_anchor=(0.5, -0.3), ncol=5, frameon=False)

ax = plt.subplot(gs1[0, 2])
ax.plot(x,Exact_u[:,750], 'b-', linewidth = 2, label = 'Exact')
ax.plot(x,U_pred[:,750], 'r--', linewidth = 2, label = 'Prediction')
ax.set_xlabel('$y$')
ax.set_ylabel('$u(x,y)$')
ax.axis('square')
ax.set_xlim([-1.1,1.1])
ax.set_ylim([-1.1,1.1])
ax.set_title('$x = %.2f$' % (y[750]), fontsize = 10)

#plot prediction
fig, ax = plt.subplots()

ec = plt.imshow(U_pred, interpolation='nearest', cmap='rainbow',
            extent=[-1.0, 1.0, -1.0, 1.0],
            origin='lower', aspect='auto')


ax.autoscale_view()
ax.set_xlabel('$y$')
ax.set_ylabel('$x$')
cbar = plt.colorbar(ec)
cbar.set_label('$u(x,y)$')
plt.title("Predicted $u(x,y)$",fontdict = {'fontsize': 14})
plt.show()


#show f_u_pred, we want this to be ~0 across the whole domain
fig, ax = plt.subplots()

ec = plt.imshow(FU_pred, interpolation='nearest', cmap='rainbow',
            extent=[-1.0, 1, -1.0, 1.0],
            origin='lower', aspect='auto')

#ax.add_collection(ec)
ax.autoscale_view()
ax.set_xlabel('$x$')
ax.set_ylabel('$t$')
cbar = plt.colorbar(ec)
cbar.set_label('$\overline{f}_u$ prediction')
plt.show()

#plot prediction error
fig, ax = plt.subplots()

ec = plt.imshow((U_pred - Exact_u), interpolation='nearest', cmap='YlGnBu',
            extent=[-1.0, 1.0, -1.0, 1.0],
            origin='lower', aspect='auto')

#ax.add_collection(ec)
ax.autoscale_view()
ax.set_xlabel('$t$')
ax.set_ylabel('$x$')
cbar = plt.colorbar(ec)
cbar.set_label('$u$ prediction error')
#plt.title("Prediction Error",fontdict = {'fontsize': 14})
plt.show()

# print collocation point weights
plt.scatter(x_f, y_f, c = col_weights.numpy(), s = col_weights.numpy()/100)
plt.show()

你可能感兴趣的:(个人笔记,Python,TensorFlow,python,tensorflow,开发语言)