实验记录1

19类实验记录

一.实验简介

1.实验索引

实验代码:https://github.com/salmanmaq/segmentationNetworks
实验数据集:https://www.kaggle.com/salmanmaq/m2caiseg

2.实验介绍

本次实验通过segmentationNetworks网络训练m2caiseg数据集,并统计了IoU,Precision,Recall,F1四个评估指标。

3.实验环境

本次实验使用kaggle notebook,默认torch版本为1.4。

二.实验内容

1.实验设计

由于存在torch版本不同的问题,根据shell脚本中参数配置,我对代码做出了本分修改。

'''
Training for combined laparoscopic image segmentation and tool presense
classification
'''

import argparse
import os
import shutil

import numpy as np
import cv2
from PIL import Image

import torch
import torch.nn as nn
import torch.nn.parallel
import torch.backends.cudnn as cudnn
import torch.optim as optim
from torch.autograd import Variable
import torch.utils.data
import torchvision.transforms as transforms
import torch.nn.functional as F

import utils
from model.segnetPlusClass import segnetPlusClass
from datasets.miccaiSegPlusClassDataLoader import miccaiSegPlusClassDataset
from torchvision.transforms import InterpolationMode
parser = argparse.ArgumentParser(description='PyTorch SegNet Training')
parser.add_argument('-j', '--workers', default=4, type=int, metavar='N',
            help='number of data loading workers (default: 4)')
parser.add_argument('--epochs', default=500, type=int, metavar='N',
            help='number of total epochs to run')
parser.add_argument('--start-epoch', default=0, type=int, metavar='N',
            help='manual epoch number (useful on restarts)')
parser.add_argument('--batchSize', default=2, type=int,
            help='Mini-batch size (default: 4)')
parser.add_argument('--lr', '--learning-rate', default=0.005, type=float,
            metavar='LR', help='initial learning rate')
parser.add_argument('--wd', '--weight_dacay', default=0.0005, type=float,
            help='initial learning rate')
parser.add_argument('--bnMomentum', default=0.1, type=float,
            help='Batch Norm Momentum (default: 0.1)')
parser.add_argument('--imageSize', default=256, type=int,
            help='height/width of the input image to the network')
parser.add_argument('--resizedImageSize', default=224, type=int,
            help='height/width of the resized image to the network')
parser.add_argument('--print-freq', '-p', default=1, type=int, metavar='N',
            help='print frequency (default:1)')
parser.add_argument('--resume', default='/kaggle/input/checkpoint485/checkpoint_485.tar', type=str, metavar='PATH',
            help='path to latest checkpoint (default: none)')
parser.add_argument('-e', '--evaluate', dest='evaluate', action='store_true',
            help='evaluate model on validation set')
parser.add_argument('--save-dir', dest='save_dir',
            help='The directory used to save the trained models',
            default='/kaggle/working/save_MiccaiSegPlusClass', type=str)
parser.add_argument('--saveTest', default='True', type=str,
            help='Saves the validation/test images if True')
​
best_prec1 = np.inf
use_gpu = torch.cuda.is_available()
​
   
​
def train(train_loader, model, criterion, optimizer, scheduler, epoch, key):
    '''
        Run one training epoch
    '''# Switch to train mode
    model.train()for i, (img, seg_gt, class_gt) in enumerate(train_loader):# For TenCrop Data Augmentation
        img = img.view(-1,3,args.resizedImageSize,args.resizedImageSize)
        img = normalize(img, torch.Tensor([0.295, 0.204, 0.197]), torch.Tensor([0.221, 0.188, 0.182]))
        seg_gt = seg_gt.view(-1,3,args.resizedImageSize,args.resizedImageSize)# Process the network inputs and outputs
        gt_temp = seg_gt * 255
        seg_label = generateLabel4CE(gt_temp, key)
​
        class_label = class_gt
        for _ in range(9):
            class_label = torch.cat((class_label, class_gt), 0)
​
        img, seg_label, class_label = Variable(img), Variable(seg_label), Variable(class_label).float()if use_gpu:
            img = img.cuda()
            seg_label = seg_label.cuda()
            class_label = class_label.cuda()# Compute output
        classified, segmented = model(img)
        seg_loss = model.dice_loss(segmented, seg_label)
        class_loss = criterion(classified, class_label)
        total_loss = seg_loss + class_loss
​
        # Compute gradient and do SGD step
        optimizer.zero_grad()
        total_loss.backward()
        optimizer.step()
​
        scheduler.step(#total_loss.mean().data[0]
                        total_loss.mean().item() )
        print('[{:d}/{:d}][{:d}/{:d}] Total Loss: {:.4f}, Segmentation Loss: {:.4f}, Classification Loss: {:.4f}'.format(epoch,
            args.epochs-1, i, len(train_loader)-1,  total_loss.mean().item(),
            seg_loss.mean().item(), class_loss.mean().item()))
​
        displaySamples(img, segmented, seg_gt, use_gpu, key, args.saveTest, epoch,
                             i,args.save_dir)
​
​
def validate(val_loader, model, criterion, epoch, key, evaluator):
    '''
        Run evaluation
    '''# Switch to evaluate mode
    model.eval()for i, (img, seg_gt, class_gt) in enumerate(val_loader):# Process the network inputs and outputs
        img = normalize(img, torch.Tensor([0.295, 0.204, 0.197]), torch.Tensor([0.221, 0.188, 0.182]))
        gt_temp = seg_gt * 255
        seg_label = generateLabel4CE(gt_temp, key)
        oneHotGT = generateOneHot(gt_temp, key)
​
        img, seg_label, class_label = Variable(img), Variable(seg_label), Variable(class_gt).float()if use_gpu:
            img = img.cuda()
            seg_label = seg_label.cuda()
            class_label = class_label.cuda()# Compute output
        classified, segmented = model(img)
        seg_loss = model.dice_loss(segmented, seg_label)
        class_loss = criterion(classified, class_label)
        total_loss = seg_loss + class_loss
​
        print('[{:d}/{:d}][{:d}/{:d}] Total Loss: {:.4f}, Segmentation Loss: {:.4f}, Classification Loss: {:.4f}'.format(epoch,
            args.epochs-1, i, len(val_loader)-1, total_loss.mean().item(),
            seg_loss.mean().item(), class_loss.mean().item()))
        displaySamples(img, segmented, seg_gt, use_gpu, key,
                             args.saveTest,
                             epoch,
                             i, args.save_dir)
        evaluator.addBatch(segmented, oneHotGT)def save_checkpoint(state, filename='checkpoint.pth.tar'):
    '''
        Save the training model
    '''
    torch.save(state, filename)

主函数

global args, best_prec1
args =  parser.parse_known_args()[0]
print(args)

if args.saveTest == 'True':
    args.saveTest = True
elif args.saveTest == 'False':
    args.saveTest = False

# Check if the save directory exists or not
if not os.path.exists(args.save_dir):
    os.makedirs(args.save_dir)

cudnn.benchmark = True

data_transforms = {
    'train': transforms.Compose([
        transforms.Resize((args.imageSize, args.imageSize), interpolation=InterpolationMode.NEAREST),
        transforms.TenCrop(args.resizedImageSize),
        transforms.Lambda(lambda crops: torch.stack([transforms.ToTensor()(crop) for crop in crops])),
        #transforms.Lambda(lambda normalized: torch.stack([transforms.Normalize([0.295, 0.204, 0.197], [0.221, 0.188, 0.182])(crop) for crop in normalized]))
        #transforms.RandomResizedCrop(224, interpolation=Image.NEAREST),
        #transforms.RandomHorizontalFlip(),
        #transforms.RandomVerticalFlip(),
        #transforms.ToTensor(),
    ]),
    'test': transforms.Compose([
        transforms.Resize((args.resizedImageSize, args.resizedImageSize), interpolation=InterpolationMode.NEAREST),
        transforms.ToTensor(),
        #transforms.Normalize([0.295, 0.204, 0.197], [0.221, 0.188, 0.182])
    ]),
}

# Data Loading
data_dir = '/kaggle/input/m2caiseg/m2caiSeg dataset'
    #'/home/salman/pytorch/segmentationNetworks/datasets/miccaiSegRefined'
# json path for class definitions
json_path = '/kaggle/input/segnet/segmentationNetworks/datasets/miccaiSegClasses.json'

image_datasets = {x: miccaiSegPlusClassDataset(os.path.join(data_dir, x), data_transforms[x],
                    json_path) for x in ['train', 'test']}

dataloaders = {x: torch.utils.data.DataLoader(image_datasets[x],
                                              batch_size=args.batchSize,
                                              shuffle=True,
                                              #num_workers=args.workers
                                              num_workers=0
                                              )
              for x in ['train', 'test']}
dataset_sizes = {x: len(image_datasets[x]) for x in ['train', 'test']}

# Get the dictionary for the id and RGB value pairs for the dataset
classes = image_datasets['train'].classes
#key = utils.disentangleKey(classes)
key = disentangleKey(classes)
num_classes = len(key)

# Initialize the model
model = segnetPlusClass(0.1, args.resizedImageSize, num_classes)

# Optionally resume from a checkpoint
if args.resume:
    if os.path.isfile(args.resume):
        print("=> loading checkpoint '{}'".format(args.resume))
        checkpoint = torch.load(args.resume,map_location='cpu')
        #args.start_epoch = checkpoint['epoch']
        pretrained_dict = checkpoint['state_dict']
        pretrained_dict = {k: v for k, v in pretrained_dict.items() if k in model.state_dict()}
        model.state_dict().update(pretrained_dict)
        model.load_state_dict(model.state_dict())
        print("=> loaded checkpoint (epoch {})".format(checkpoint['epoch']))
    else:
        print("=> no checkpoint found at '{}'".format(args.resume))

    # # Freeze the encoder weights
    # for param in model.encoder.parameters():
    #     param.requires_grad = False

    optimizer = optim.Adam(model.parameters(), lr = args.lr, weight_decay = args.wd)
else:
    optimizer = optim.Adam(model.parameters(), lr = args.lr, weight_decay = args.wd)

    # Load the saved model
if os.path.isfile(args.resume):
    print("=> loading checkpoint '{}'".format(args.resume))
    checkpoint = torch.load(args.resume,map_location='cpu')
    args.start_epoch = checkpoint['epoch']
    model.load_state_dict(checkpoint['state_dict'])
    print("=> loaded checkpoint (epoch {})".format(checkpoint['epoch']))
else:
    print("=> no checkpoint found at '{}'".format(args.resume))

print(model)

# Define loss function (criterion)
criterion = nn.BCEWithLogitsLoss()

# Use a learning rate scheduler
scheduler = optim.lr_scheduler.StepLR(optimizer, step_size=10, gamma=0.5)

if use_gpu:
    model.cuda()
    criterion.cuda()

    # Initialize an evaluation Object
#evaluator = utils.Evaluate(key, use_gpu)
evaluator = Evaluate(key, use_gpu)

for epoch in range(args.start_epoch, args.epochs):
        #adjust_learning_rate(optimizer, epoch)

        # Train for one epoch
        print('>>>>>>>>>>>>>>>>>>>>>>>Training<<<<<<<<<<<<<<<<<<<<<<<')
        train(dataloaders['train'], model, criterion, optimizer, scheduler, epoch, key)

        # Evaulate on validation set

        print('>>>>>>>>>>>>>>>>>>>>>>>Testing<<<<<<<<<<<<<<<<<<<<<<<')
        validate(dataloaders['test'], model, criterion, epoch, key, evaluator)

        # Calculate the metrics
        print('>>>>>>>>>>>>>>>>>> Evaluating the Metrics <<<<<<<<<<<<<<<<<')
        IoU = evaluator.getIoU()
        print('Mean IoU: {}, Class-wise IoU: {}'.format(torch.mean(IoU), IoU))
        PRF1 = evaluator.getPRF1()
        precision, recall, F1 = PRF1[0], PRF1[1], PRF1[2]
        print('Mean Precision: {}, Class-wise Precision: {}'.format(torch.mean(precision), precision))
        print('Mean Recall: {}, Class-wise Recall: {}'.format(torch.mean(recall), recall))
        print('Mean F1: {}, Class-wise F1: {}'.format(torch.mean(F1), F1))
        evaluator.reset()

        save_checkpoint({
            'epoch': epoch + 1,
            'state_dict': model.state_dict(),
            'optimizer': optimizer.state_dict(),
        }, filename=os.path.join(
             args.save_dir,
            'checkpoint_{}.tar'.format(epoch)))

2.实验结果

(1)四个指标统计结果

CLASS IoU Precision Recall F1 score
unknown 0.0067 0.0242 0.0093 0.0134
grasper 0.0125 0.0629 0.0154 0.0247
bipolar 0.0000 0.0000 0.0000 0.0000
hook 0.0283 0.1145 0.0362 0.0550
scissors 0.0000 0.0000 0.0000 0.0000
clipper 0.0000 0.0000 0.0000 0.0000
irrigator 0.0000 0.0000 0.0000 0.0000
specimen-bag 0.0062 0.0074 0.0358 0.0123
trocars 0.0000 0.0000 0.0000 0.0000
clip 0.0000 0.0000 0.0000 0.0000
liver 0.4107 0.5464 0.6231 0.5822
gall-bladder 0.2414 0.5823 0.2919 0.3889
fat 0.3282 0.5291 0.5291 0.4636
upperwall 0.1121 0.1426 0.3445 0.2017
artery 0.0033 0.0045 0.0117 0.0065
intestine 0.0155 0.0987 0.0181 0.0305
bile 0.0000 0.0000 0.0000 0.0000
blood 0.0000 0.0000 0.0000 0.0000
black 0.7584 0.7716 0.9780 0.8626
mean 0.10122497950342797 0.1518024896855643 0.1488112080484951 0.14063145694832613

(3)实验图片

实验记录1_第1张图片

你可能感兴趣的:(深度学习,pytorch,python)