自定义层需要继承 layers.Layer,自定义网络需要继承 keras.Model。
两者内部都需要实现两个方法:
1、__init__ 初始化方法:先调用父类的 __init__,再创建该层所需的权重(或该网络所需的子层);
2、call 方法:定义前向计算过程,并返回计算结果。
# Custom layer definition
class MyDense(layers.Layer):
    """Fully connected layer computing ``inputs @ kernal + bias``.

    Args:
        input_dim: Size of the last axis of the incoming tensor.
        output_dim: Number of output units.
    """

    def __init__(self, input_dim, output_dim):
        super().__init__()
        # ``add_variable`` is a deprecated alias that newer Keras releases
        # removed; ``add_weight`` with keyword arguments is the supported API.
        # The attribute keeps its original spelling (``kernal``) so code that
        # reads it keeps working.
        self.kernal = self.add_weight(name='w', shape=[input_dim, output_dim])
        self.bias = self.add_weight(name='b', shape=[output_dim])

    def call(self, inputs, training=None):
        """Return the affine transform of ``inputs``; ``training`` is unused."""
        return inputs @ self.kernal + self.bias
# Custom network definition
class MyModel(keras.Model):
    """Six stacked ``MyDense`` layers: 784 -> 512 -> 256 -> 128 -> 64 -> 32 -> 10.

    ReLU is applied after each of the first five layers; the output of the
    last layer is returned without an activation.
    """

    def __init__(self):
        super().__init__()
        self.fc1 = MyDense(input_dim=28 * 28, output_dim=512)
        self.fc2 = MyDense(input_dim=512, output_dim=256)
        self.fc3 = MyDense(input_dim=256, output_dim=128)
        self.fc4 = MyDense(input_dim=128, output_dim=64)
        self.fc5 = MyDense(input_dim=64, output_dim=32)
        self.fc6 = MyDense(input_dim=32, output_dim=10)

    def call(self, inputs, training=None):
        """Run the forward pass; ``inputs`` has shape [b, 28*28]."""
        hidden = inputs
        # Every layer except the last one is followed by ReLU.
        for dense in (self.fc1, self.fc2, self.fc3, self.fc4, self.fc5):
            hidden = tf.nn.relu(dense(hidden))
        return self.fc6(hidden)
自定义的层和网络在使用方式上与 Keras 内置的层和网络完全一样,并无任何区别。
import tensorflow as tf
from tensorflow import keras
from tensorflow.keras import layers,Sequential,optimizers,datasets,metrics
def preprocess(x, y):
    """Flatten and rescale one sample and one-hot encode its label.

    ``x`` is reshaped to 1-D, cast to float32 and divided by 255.
    ``y`` is one-hot encoded with depth 10 and cast to int32.

    Returns:
        The ``(x, y)`` pair after the transformations above.
    """
    flat = tf.reshape(x, [-1])
    features = tf.cast(flat, dtype=tf.float32) / 255.
    one_hot = tf.one_hot(y, depth=10)
    labels = tf.cast(one_hot, dtype=tf.int32)
    return features, labels
# Load the MNIST train/validation splits and report their shapes.
(x_train, y_train), (x_val, y_val) = datasets.mnist.load_data()
print('data: ', x_train.shape, y_train.shape, x_val.shape, y_val.shape)

# Training pipeline: preprocess each sample, shuffle, then batch by 128.
db = tf.data.Dataset.from_tensor_slices((x_train, y_train))
db = db.map(preprocess)
db = db.shuffle(60000)
db = db.batch(128)

# Validation pipeline: same preprocessing and batch size, no shuffling.
db_val = tf.data.Dataset.from_tensor_slices((x_val, y_val))
db_val = db_val.map(preprocess)
db_val = db_val.batch(128)
# Custom layer definition
class MyDense(layers.Layer):
    """Fully connected layer computing ``inputs @ kernal + bias``.

    Args:
        input_dim: Size of the last axis of the incoming tensor.
        output_dim: Number of output units.
    """

    def __init__(self, input_dim, output_dim):
        super().__init__()
        # ``add_variable`` is a deprecated alias that newer Keras releases
        # removed; ``add_weight`` with keyword arguments is the supported API.
        # The attribute keeps its original spelling (``kernal``) so code that
        # reads it keeps working.
        self.kernal = self.add_weight(name='w', shape=[input_dim, output_dim])
        self.bias = self.add_weight(name='b', shape=[output_dim])

    def call(self, inputs, training=None):
        """Return the affine transform of ``inputs``; ``training`` is unused."""
        return inputs @ self.kernal + self.bias
# Custom network definition
class MyModel(keras.Model):
    """Six stacked ``MyDense`` layers: 784 -> 512 -> 256 -> 128 -> 64 -> 32 -> 10.

    ReLU is applied after each of the first five layers; the output of the
    last layer is returned without an activation.
    """

    def __init__(self):
        super().__init__()
        self.fc1 = MyDense(input_dim=28 * 28, output_dim=512)
        self.fc2 = MyDense(input_dim=512, output_dim=256)
        self.fc3 = MyDense(input_dim=256, output_dim=128)
        self.fc4 = MyDense(input_dim=128, output_dim=64)
        self.fc5 = MyDense(input_dim=64, output_dim=32)
        self.fc6 = MyDense(input_dim=32, output_dim=10)

    def call(self, inputs, training=None):
        """Run the forward pass; ``inputs`` has shape [b, 28*28]."""
        hidden = inputs
        # Every layer except the last one is followed by ReLU.
        for dense in (self.fc1, self.fc2, self.fc3, self.fc4, self.fc5):
            hidden = tf.nn.relu(dense(hidden))
        return self.fc6(hidden)
# Instantiate the custom model, build it for [None, 784] inputs and print
# its summary.
network = MyModel()
network.build(input_shape=[None, 28 * 28])
network.summary()

# Build the same layer sizes from built-in Dense layers.
# NOTE: this rebinds ``network``; from here on the name refers to the
# Sequential model, not the MyModel instance created above.
network = Sequential(
    [layers.Dense(width, activation=tf.nn.relu) for width in (512, 256, 128, 64, 32)]
    + [layers.Dense(10)]
)
network.build(input_shape=[None, 28 * 28])
network.summary()
# Configure training: optimizer, loss and metric.
# ``lr`` is a deprecated alias that current Keras optimizers reject;
# ``learning_rate`` is the supported keyword.
network.compile(
    optimizer=optimizers.Adam(learning_rate=1e-2),
    loss=tf.losses.CategoricalCrossentropy(from_logits=True),
    metrics=['accuracy'],
)
# Train for 20 epochs, evaluating on the validation set after every epoch.
network.fit(db, epochs=20, validation_data=db_val, validation_freq=1)