tensorflow利用Inception-v3实现迁移学习

1、Tensorflow 实现迁移学习。
#photo地址:
#http://download.tensorflow.org/example_images/flower_photos.tgz
#Inception-v3模型
#源码下载和Inception-v3模型见:https://download.csdn.net/download/casgj16/10699954
2、代码

import glob
import os.path
import random
import numpy as np
import  tensorflow as tf
from tensorflow.python.platform import gfile

#Inception-v3模型瓶颈层得节点个数
BOTTLENECK_TENSOR_SIZE=2048

BOTTLENECK_TENSOR_NAME='pool_3/_reshape:0'

JPEG_DATA_TENSOR_NAME='DecodeJpeg/contents:0'

MODEL_DIR='../CNN/inception_dec_2015'

MODEL_FILE='tensorflow_inception_graph.pb'

CACHE_DIR='../CNN/bottleneck'

INPUT_DATA='../CNN/flower_photos'

#验证得数据百分比
VALIDATION_PERCENTAGE=10
#测试得数据百分比
TEST_PERCENTAGE=10

#定义神经网络得设置
LEARNING_RATE=0.01
STEPS=4000
BATCH=100

#从数据文件夹读取所有得图片列表并按训练、验证、测试数据分开
def create_image_lists(testing_percentage, validation_percentage):
    result = {}
    sub_dirs = [x[0] for x in os.walk(INPUT_DATA)]
    is_root_dir = True
    for sub_dir in sub_dirs:
        if is_root_dir:
            is_root_dir = False
            continue

        extensions = ['jpg', 'jpeg', 'JPG', 'JPEG']

        file_list = []
        dir_name = os.path.basename(sub_dir)
        for extension in extensions:
            file_glob = os.path.join(INPUT_DATA, dir_name, '*.' + extension)
            file_list.extend(glob.glob(file_glob))
        if not file_list:
            continue

        label_name = dir_name.lower()

        # 初始化
        training_images = []
        testing_images = []
        validation_images = []
        for file_name in file_list:
            base_name = os.path.basename(file_name)

            # 随机划分数据
            chance = np.random.randint(100)  #产生一个<100得正整数
            if chance < validation_percentage:
                validation_images.append(base_name)
            elif chance < (testing_percentage + validation_percentage):
                testing_images.append(base_name)
            else:
                training_images.append(base_name)

        result[label_name] = {
            'dir': dir_name,
            'training': training_images,
            'testing': testing_images,
            'validation': validation_images,
        }
    return result


#获取给定类别category中index图片的地址
def get_image_path(image_lists,image_dir,label_name,index,category):
    label_lists=image_lists[label_name]
    category_list=label_lists[category]
    mod_index=index% len(category_list)

    base_name=category_list[mod_index]
    sub_dir=label_lists['dir']

    full_path=os.path.join(image_dir,sub_dir,base_name)
    return full_path


def get_bottleneck_path(image_lists,label_name,index,category):
    return get_image_path(image_lists,CACHE_DIR,
           label_name,index,category)+'.txt'


def run_bottleneck_on_image(sess,image_data,image_data_tensor,bottleneck_tensor):
    bottleneck_values=sess.run(bottleneck_tensor,
                               {image_data_tensor:image_data})
    bottleneck_values=np.squeeze(bottleneck_values)
    return bottleneck_values


#获取一张图片对应得特征向量
def get_or_create_bottleneck( sess,image_lists,label_name,index,
        category,jpeg_data_tensor,bottleneck_tensor):

    # 获取一张图片对应得特征向量文本得路径
    label_lists=image_lists[label_name]
    sub_dir=label_lists['dir']
    sub_dir_path=os.path.join(CACHE_DIR,sub_dir)
    if not os.path.exists(sub_dir_path):
        os.makedirs(sub_dir_path)
    bottleneck_path=get_bottleneck_path(
        image_lists,label_name,index,category
    )

    #如果这个特征向量文件不存在,则通过Inception-v3模型来 创建一个
    if not os.path.exists(bottleneck_path):
        # get_image_path 获取给定类别category中index图片的地址
        image_path=get_image_path(
            image_lists,INPUT_DATA,label_name,index,category)
        image_data=gfile.FastGFile(image_path,'rb').read()

        bottleneck_values=run_bottleneck_on_image(
            sess,image_data,jpeg_data_tensor,bottleneck_tensor
        )

        #将计算得特征向量存入文件
        bottleneck_string=','.join(str(x) for x in bottleneck_values)
        with open(bottleneck_path,'w') as bottleneck_file:
           bottleneck_file.write(bottleneck_string)
    else:
        #直接从文件中读取图爿对应得特征向量
        with open(bottleneck_path,'r') as bottleneck_file:
            bottleneck_string=bottleneck_file.read()
        bottleneck_values=[float(x) for x in bottleneck_string.split(',')]

    return bottleneck_values


#返回一个类别为category 的 how_many数量的集合 数据块 和 标签快
def get_random_cache_bottlenecks(sess,n_classes,image_lists,how_many,category,
        jpeg_data_tensor,bottleneck_tensor):
    bottlenecks=[]
    ground_truths=[]
    for _ in range(how_many):
        #随机一个类别
        label_index=random.randrange(n_classes)
        label_name=list(image_lists.keys())[label_index]

        # 随机一个图片编号
        image_index=random.randrange(65536)

        # get_or_create_bottleneck 获取一张图片对应得特征向量
        bottleneck=get_or_create_bottleneck(
            sess,image_lists,label_name,image_index,category,
            jpeg_data_tensor,bottleneck_tensor)

        #对一个标签
        ground_truth=np.zeros(n_classes,dtype=np.float32)
        ground_truth[label_index]=1.0

        bottlenecks.append(bottleneck)
        ground_truths.append(ground_truth)
    return bottlenecks,ground_truths


#获取testing的所有数据
def get_test_bottlenecks(sess,image_lists,n_classes,
            jpeg_data_tensor,bottleneck_tensor):
    bottlenecks=[]
    ground_truths=[]
    label_name_list=list(image_lists.keys())

    for label_index,label_name in enumerate(label_name_list):
        category='testing'
        for index,unused_base_name in enumerate(
            image_lists[label_name][category]):

            # get_or_create_bottleneck 获取一张图片对应得特征向量
            bottleneck=get_or_create_bottleneck(
                sess,image_lists,label_name,index,category,
                jpeg_data_tensor,bottleneck_tensor
            )
            #对应的label
            ground_truth=np.zeros(n_classes,dtype=np.float32)
            ground_truth[label_index]=1.0

            bottlenecks.append(bottleneck)
            ground_truths.append(ground_truth)

    return bottlenecks,ground_truths


def sss():
    image_lists=create_image_lists(TEST_PERCENTAGE,VALIDATION_PERCENTAGE)
    n_classes=len(image_lists.keys())
    #print(n_classes) #5

    # 读取已经训练好的Inception-v3模型。
    with gfile.FastGFile(os.path.join(MODEL_DIR,MODEL_FILE),'rb') as f:
        graph_def=tf.GraphDef()
        graph_def.ParseFromString(f.read())

    bottleneck_tensor,jpeg_data_tensor=tf.import_graph_def(
        graph_def,
        return_elements=[BOTTLENECK_TENSOR_NAME,JPEG_DATA_TENSOR_NAME]
    )

    # 定义新的神经网络输入
    bottleneck_input=tf.placeholder(
        tf.float32,[None,BOTTLENECK_TENSOR_SIZE],
        name='BottleneckInputPlaceholder')

    # 定义新的标准答案输入
    ground_truth_input=tf.placeholder(
        tf.float32,[None,n_classes],name='GroundTruthInput'
    )

    # 定义一层全链接层
    with tf.name_scope('final_training_ops'):
        weights=tf.Variable(tf.truncated_normal(
            [BOTTLENECK_TENSOR_SIZE,n_classes],stddev=0.001
        ))
        biases=tf.Variable(tf.zeros([n_classes]))
        logits=tf.matmul(bottleneck_input,weights)+biases
        final_tensor=tf.nn.softmax(logits)

    #定义交叉熵损失函数
    cross_entropy=tf.nn.softmax_cross_entropy_with_logits(
        logits,ground_truth_input
    )
    cross_entropy_mean=tf.reduce_mean(cross_entropy)
    train_step=tf.train.GradientDescentOptimizer(LEARNING_RATE).minimize(cross_entropy_mean)


    #计算正确率
    with tf.name_scope('evaluation'):
        correct_prediction=tf.equal(tf.argmax(final_tensor,1),tf.argmax(ground_truth_input,1))

        evaluation_step=tf.reduce_mean(
            tf.cast(correct_prediction,tf.float32)
        )

    with tf.Session() as sess:
        init=tf.initialize_all_variables()
        sess.run(init)

        #训练过程
        for i in range(STEPS):
            ##get_random_cache_bottlenecks
            # 返回一个类别为 'training'的 BATCH数量 的集合
            train_bottlenecks,train_ground_truth=get_random_cache_bottlenecks(
                  sess,n_classes,image_lists,BATCH,
                  'training', jpeg_data_tensor,bottleneck_tensor)

            sess.run(train_step,feed_dict={bottleneck_input:train_bottlenecks,
                                ground_truth_input:train_ground_truth})

            if i%100==0 or i+1==STEPS:

                #验证集
                validation_bottlenecks, validation_groiund_truth=\
                    get_random_cache_bottlenecks(sess,n_classes,image_lists,BATCH,
                    'validation',jpeg_data_tensor,bottleneck_tensor
                )
                validation_accuracy=sess.run(
                    evaluation_step,feed_dict={
                        bottleneck_input:validation_bottlenecks,
                        ground_truth_input:validation_groiund_truth
                    }
                )
                print('Step %d: Validation accuracy on random sampled %d examples= %.1f%%'%
                      (i,BATCH,validation_accuracy*100))

                # 测试集
                test_bottlenecks,test_ground_truth=get_test_bottlenecks(
                  sess,image_lists,n_classes,jpeg_data_tensor,bottleneck_tensor
                )
                test_accuracy=sess.run(evaluation_step,feed_dict={
                   bottleneck_input:test_bottlenecks,
                   ground_truth_input:test_ground_truth
                })
                print('Final test accuracy= %.1f %%'%(test_accuracy*100))

sss()


3、结果:

tensorflow利用Inception-v3实现迁移学习_第1张图片

 

 

你可能感兴趣的:(tensorflow实战)