This is an open-set recognition experiment on a garbage-classification dataset containing 40 classes: only 24 classes are used during training, while all 40 garbage classes appear at test time.
Garbage dataset download
First, the training code.
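Before the full listing, a rough sketch of the known/unknown split and the resulting openness under the defaults used below (seed 42, 24 of 40 classes known); this only restates logic that appears in task_garbage.py and garbage.py:

import random
import numpy as np

# Same split as task_garbage.py: fix the seed and sample 24 of the 40 labels as "known" classes.
random.seed(42)
train_classes = random.sample(range(0, 40), 24)
unknown_classes = [c for c in range(40) if c not in train_classes]  # 16 classes only seen at test time

# Openness as reported by GARBAGE40_Dataset: CTR known classes, CTA = CTR + CTU classes at test time.
CTR, CTU = len(train_classes), len(unknown_classes)
CTA = CTR + CTU
openness = 1 - np.sqrt(2 * CTR / (CTR + CTA))
print(f"known={CTR}, unknown={CTU}, openness={openness:.4f}")  # roughly 0.134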
task_garbage.py
'''
@File :task_garbage.py
@Author:cjh
@Date :2022/1/16 14:45
@Desc :
'''
import random
import torch
import torch.nn as nn
import torch.optim as optim
import torch.nn.functional as F
import torch.backends.cudnn as cudnn
import torchvision
import numpy as np
import torchvision.transforms as transforms
from torchvision.transforms import autoaugment
import os
import argparse
import sys
import warnings
warnings.filterwarnings("ignore")
# os.chdir(os.path.dirname('X:/PyCharm/211211-DL-OSR/DL_OSR/model/OpenMax'))
# sys.path.append("../..")
from torch.optim import lr_scheduler
import backbones.cifar10 as models
from datasets import GARBAGE40_Dataset
from utils import adjust_learning_rate, progress_bar, Logger, mkdir_p, Evaluation
from openmax import compute_train_score_and_mavs_and_dists,fit_weibull,openmax
from Modelbuilder import Network
from Plotter import plot_feature
from garbage_transform import Resize, Cutout, RandomErasing
from garbage_loss import LabelSmoothSoftmaxCE, LabelSmoothingLoss, FocalLoss
from checkpoints import efficientnet
# from pytorch_toolbelt import losses as L
parser=argparse.ArgumentParser()
parser.add_argument('--lr',default=0.01,type=float,help='learning rate')
# ./checkpoints/garbage/ResNet/ResNet18.pth
parser.add_argument('--resume',default=None,type=str,metavar='PATH',help='path to the latest checkpoint (.pth) to resume from')
parser.add_argument('--arch',default='EfficientNet_B5',type=str,help='choosing network')
parser.add_argument('--bs',default=8,type=int,help='batch size')
parser.add_argument('--es',default=40,type=int,help='number of training epochs')
parser.add_argument('--train_class_num',default=24,type=int,help='classes used in training')
parser.add_argument('--test_class_num',default=40,type=int,help='classes used in testing')
parser.add_argument('--includes_all_train_class',default=True,action='store_true',
help='testing uses all known classes')
parser.add_argument('--embed_dim', default=2, type=int, help='embedding feature dimension')
parser.add_argument('--evaluate',default=False,action='store_true',help='evaluating')
parser.add_argument('--weibull_tail', default=20, type=int, help='tail size used to fit the Weibull models')
parser.add_argument('--weibull_alpha', default=5, type=int, help='number of top classes revised by OpenMax')
parser.add_argument('--weibull_threshold', default=0.9, type=float, help='probability threshold below which a sample is rejected as unknown')
# Parameters for stage plotting
# parser.add_argument('--plot', default=False, action='store_true', help='Plotting the training set.')
# parser.add_argument('--plot_max', default=0, type=int, help='max examples to plot in each class, 0 indicates all.')
# parser.add_argument('--plot_quality', default=200, type=int, help='DPI of plot figure')
args=parser.parse_args()
def main():
device = 'cuda' if torch.cuda.is_available() else 'cpu'
print(device)
best_acc = 0 # best test accuracy
start_epoch = 0 # start from epoch 0 or last checkpoint epoch
# checkpoint
args.checkpoint = './checkpoints/garbage/' + args.arch
if not os.path.isdir(args.checkpoint):
mkdir_p(args.checkpoint)
# folder to save figures
args.plotfolder = './checkpoints/garbage/' + args.arch + '/plotter'
if not os.path.isdir(args.plotfolder):
mkdir_p(args.plotfolder)
# Data
print('==> Preparing data..')
picture_size = 256
train_transforms = transforms.Compose([
Resize((int(288 * (256 / 224)), int(288 * (256 / 224)))),
transforms.CenterCrop((picture_size, picture_size)),
transforms.RandomAffine(degrees=0, translate=(0.05, 0.05)),
transforms.RandomVerticalFlip(),
autoaugment.AutoAugment(),
transforms.ToTensor(),
transforms.Normalize(mean=[0.485, 0.456, 0.406], std=[0.229, 0.224, 0.225]),
Cutout(probability=0.5, size=64, mean=[0.0, 0.0, 0.0]),
RandomErasing(probability=0.0, mean=[0.485, 0.456, 0.406]),
])
test_transforms = transforms.Compose([
Resize((int(288 * (256 / 224)), int(288 * (256 / 224)))),
transforms.CenterCrop((picture_size, picture_size)),
transforms.ToTensor(),
transforms.Normalize(mean=[0.485, 0.456, 0.406], std=[0.229, 0.224, 0.225])
])
random.seed(42)
train_classes = random.sample(range(0, 40), args.train_class_num)
test_classes=train_classes+[999]
trainset = GARBAGE40_Dataset(root='../../data/garbage', train=True,
transform=train_transforms,
train_class_num=args.train_class_num, test_class_num=args.test_class_num,
includes_all_train_class=args.includes_all_train_class,
train_classes=train_classes)
testset = GARBAGE40_Dataset(root='../../data/garbage', train=False,
transform=test_transforms,
train_class_num=args.train_class_num, test_class_num=args.test_class_num,
includes_all_train_class=args.includes_all_train_class,
train_classes=train_classes)
# data loader
trainloader = torch.utils.data.DataLoader(trainset, batch_size=args.bs, shuffle=True, num_workers=0)
testloader = torch.utils.data.DataLoader(testset, batch_size=args.bs, shuffle=False, num_workers=0)
#Model
# net=Network(backbone=args.arch,num_classes=args.train_class_num, embed_dim=args.embed_dim)
# fea_dim = net.classifier.in_features
# net = net.to(device)
if args.arch=='ResNet18':
net = torchvision.models.resnet18(pretrained=True).to(device)
model_wight_path = "checkpoints/garbage/ResNet18/best_model.pth"
assert os.path.exists(model_wight_path), "file {} does not exist.".format(model_wight_path)  # abort if the checkpoint path does not exist
net.load_state_dict(torch.load(model_wight_path, map_location=device), strict=False)
net.fc = nn.Sequential(
nn.Linear(net.fc.in_features, 256),
nn.ReLU(),
nn.Dropout(0.4),
nn.Linear(256, args.train_class_num)
)
if args.arch == 'ResNet50':
net = torchvision.models.resnet50(pretrained=True).to(device)
model_wight_path = "checkpoints/garbage/ResNet50/best_model.pth"
assert os.path.exists(model_wight_path), "file {} does not exist.".format(model_wight_path)  # abort if the checkpoint path does not exist
net.load_state_dict(torch.load(model_wight_path, map_location=device), strict=False)
net.fc = nn.Sequential(
nn.Linear(net.fc.in_features, 256),
nn.ReLU(),
nn.Dropout(0.4),
nn.Linear(256, args.train_class_num)
)
if args.arch == 'EfficientNet_B5':
# net = torchvision.models.efficientnet_b5(pretrained=True).to(device)
net = efficientnet.efficientnet_b5().to(device)
# model_wight_path = "checkpoints/garbage/EfficientNet_B5/efficientnetb5.pth"
model_wight_path = "checkpoints/garbage/EfficientNet_B5/best_model.pth"
assert os.path.exists(model_wight_path), "file {} does not exist.".format(model_wight_path)  # abort if the checkpoint path does not exist
net.load_state_dict(torch.load(model_wight_path, map_location=device), strict=False)
net.classifier= nn.Sequential(
nn.Dropout(p=0.4, inplace=True),
nn.Linear(2048, args.train_class_num),
)
if args.arch == 'EfficientNet_B7':
# net = torchvision.models.efficientnet_b7(pretrained=True).to(device)
net = efficientnet.efficientnet_b7().to(device)
net.classifier= nn.Sequential(
nn.Dropout(p=0.4, inplace=True),
nn.Linear(2048, args.train_class_num),
)
if args.arch == 'ResNext101_32x16d_wsl':
net = torch.hub.load('facebookresearch/WSL-Images', 'resnext101_32x16d_wsl')
net.fc = nn.Sequential(
nn.Dropout(0.2),
nn.Linear(2048, args.train_class_num)
)
if args.arch == 'Resnext101_32x8d_wsl':
net = torch.hub.load('facebookresearch/WSL-Images', 'resnext101_32x8d_wsl')
net.fc = nn.Sequential(
nn.Dropout(0.2),
nn.Linear(2048, args.train_class_num)
)
if args.arch == 'Resnext50_32x4d':
net = torchvision.models.resnext50_32x4d(pretrained=True).to(device)
net.fc = nn.Sequential(
nn.Dropout(0.2),
nn.Linear(2048, args.train_class_num)
)
# from efficientnet_pytorch import EfficientNet
# model = EfficientNet.from_pretrained('efficientnet-b0')
# model = EfficientNet.from_pretrained(,num_classes=args.train_class_num)
if args.arch == 'EfficientNet_B3':
net = torchvision.models.efficientnet_b3(pretrained=True).to(device)
net.classifier= nn.Sequential(
nn.Linear(1536, 256),
nn.ReLU(),
nn.Dropout(p=0.4),
nn.Linear(256, args.train_class_num),
# nn.Dropout(p=0.4, inplace=True),
# nn.Linear(1024, args.train_class_num),
)
if device == 'cuda':
net = torch.nn.DataParallel(net)
cudnn.benchmark = True
if args.resume!=None:
# Load checkpoint.
if os.path.isfile(args.resume):
print('==> Resuming from checkpoint..')
#for cpu load cuda model
checkpoint = torch.load(args.resume,map_location=torch.device('cpu'))
net.load_state_dict({k.replace('module.', ''): v for k, v in checkpoint['net'].items()})
#for gpu load cuda model for cpu load cpu model
# checkpoint = torch.load(args.resume)
# net.load_state_dict(checkpoint['net'])
# best_acc = checkpoint['acc']
# print("BEST_ACCURACY: "+str(best_acc))
start_epoch = checkpoint['epoch']
logger = Logger(os.path.join(args.checkpoint, 'log.txt'), resume=True)
else:
print("=> no checkpoint found at '{}'".format(args.resume))
else:
logger = Logger(os.path.join(args.checkpoint, 'log.txt'))
logger.set_names(['Epoch', 'Learning Rate', 'Train Loss','Train Acc.', 'Test Loss', 'Test Acc.'])
criterion = nn.CrossEntropyLoss()
# criterion = LabelSmoothSoftmaxCE(lb_pos=0.9, lb_neg=5e-3)
# criterion = LabelSmoothingLoss(classes=args.train_class_num, smoothing=0.1)
# criterion = FocalLoss(alpha=0.25)
optimizer = optim.SGD(net.parameters(), lr=args.lr, momentum=0.9, weight_decay=5e-4)
# optimizer = optim.RAdam(net.parameters(),lr=args.lr,betas=(0.9, 0.999), eps=1e-8,weight_decay=5e-4)
# scheduler = lr_scheduler.ReduceLROnPlateau(optimizer, mode='max', factor=0.7, patience=3, verbose=True)
# only the last assignment takes effect; the alternatives are kept for reference
# scheduler = lr_scheduler.ReduceLROnPlateau(optimizer, mode='min', factor=0.2, patience=2, verbose=False)
# scheduler = lr_scheduler.CosineAnnealingWarmRestarts(optimizer, T_0=3, T_mult=2)
# scheduler = lr_scheduler.CosineAnnealingWarmRestarts(optimizer, T_0=2, T_mult=2, eta_min=1e-5)
scheduler = lr_scheduler.StepLR(optimizer, step_size=8, gamma=0.5)
# epoch=0
best_ac=0
if not args.evaluate:
for epoch in range(start_epoch, args.es):
print('\nEpoch: %d Learning rate: %f' % (epoch+1, optimizer.param_groups[0]['lr']))
# adjust_learning_rate(optimizer, epoch, args.lr, step=20)
train_loss, train_acc = train(net, trainloader, optimizer, criterion, device, train_classes)
if epoch == args.es - 1:
save_model(net, None, epoch, os.path.join(args.checkpoint,'last_model.pth'))
test_loss, test_acc = 0, 0
try:
test_loss, test_acc = test(epoch, net, trainloader, testloader, criterion, device, test_classes)
except:
pass
# scheduler.step(train_loss)  # pass the monitored loss only when using ReduceLROnPlateau
scheduler.step()
if best_ac<test_acc:
best_ac=test_acc
print("The best Acc: ",best_ac)
# save_model(net, None, epoch, os.path.join(args.checkpoint, 'best_model.pth'))
torch.save(net.state_dict(), os.path.join(args.checkpoint, 'best_model.pth'))
# save_model(net, best_ac, epoch, os.path.join(args.checkpoint, 'best_model.pth'))
#
logger.append([epoch+1, optimizer.param_groups[0]['lr'], train_loss, train_acc, test_loss, test_acc])
# plot_feature(net, trainloader, device, args.plotfolder,train_classes, epoch=epoch,
# plot_class_num=args.train_class_num, maximum=args.plot_max, plot_quality=args.plot_quality)
# if (epoch+1)%20==0:
# try:
# test(epoch, net, trainloader, testloader, criterion, device,test_classes)
# except:
# pass
test(99999, net, trainloader, testloader, criterion, device, test_classes)
# plot_feature(net, testloader, device, args.plotfolder,train_classes, epoch="test",
# plot_class_num=args.train_class_num+1, maximum=args.plot_max, plot_quality=args.plot_quality)
logger.close()
# Training
def train(net,trainloader,optimizer,criterion,device,train_classes):
net.train()
train_loss = 0
correct = 0
total = 0
for batch_idx, (inputs, targets) in enumerate(trainloader):
onehot_targets_index=[train_classes.index(i) for i in targets]
targets=torch.LongTensor(onehot_targets_index)
inputs, targets = inputs.to(device), targets.to(device)
optimizer.zero_grad()
outputs = net(inputs)
# onehot_targets=torch.zeros((outputs.shape[0],outputs.shape[1]))
# onehot_targets[range(outputs.shape[0]), onehot_targets_index]=1
loss = criterion(outputs, targets)
# loss = torch.nn.functional.cross_entropy(outputs, targets)
loss.backward()
optimizer.step()
train_loss += loss.item()
_, predicted = outputs.max(1)
total += targets.size(0)
correct += predicted.eq(targets).sum().item()
progress_bar(batch_idx, len(trainloader), 'Loss: %.3f | Acc: %.3f%% (%d/%d)'
% (train_loss/(batch_idx+1), 100.*correct/total, correct, total))
return train_loss/(batch_idx+1), correct/total
def test(epoch, net, trainloader, testloader, criterion, device, test_classes):
net.eval()
test_loss = 0
correct = 0
total = 0
scores, labels = [], []
with torch.no_grad():
for batch_idx, (inputs, targets) in enumerate(testloader):
onehot_targets_index = [test_classes.index(i) for i in targets]
targets = torch.LongTensor(onehot_targets_index)
# image_2 = transforms.RandomAffine(degrees=0, translate=(0.05, 0.05))(inputs).to(device)
# image_3 = transforms.RandomHorizontalFlip()(inputs).to(device)
# image_4 = Cutout(probability=0.5, size=64, mean=[0.0, 0.0, 0.0])(inputs).to(device)
# image_5 = transforms.RandomVerticalFlip()(inputs).to(device)
inputs, targets = inputs.to(device), targets.to(device)
# output1 = net(inputs)
# output2 = net(image_2)
# output3 = net(image_3)
# output4 = net(image_4)
# output5 = net(image_5)
outputs = net(inputs)
# outputs = (output1+output2+output3+output4+output5)/5
# loss = criterion(outputs, targets)
# test_loss += loss.item()
_, predicted = outputs.max(1)
scores.append(outputs)
labels.append(targets)
total += targets.size(0)
correct += predicted.eq(targets).sum().item()
progress_bar(batch_idx, len(testloader))
# Get the predicted results.
scores = torch.cat(scores,dim=0).cpu().numpy()
labels = torch.cat(labels,dim=0).cpu().numpy()
scores = np.array(scores)[:, np.newaxis, :]
labels = np.array(labels)
if args.train_class_num != args.test_class_num:
# Fit the weibull distribution from training data.
print("Fittting Weibull distribution...")
_, mavs, dists = compute_train_score_and_mavs_and_dists(args.train_class_num, trainloader, device, net, test_classes)
categories = list(range(0, args.train_class_num))
weibull_model = fit_weibull(mavs, dists, categories, args.weibull_tail, "euclidean")
pred_softmax, pred_softmax_threshold, pred_openmax = [], [], []
score_softmax, score_openmax = [], []
for score in scores:
so, ss = openmax(weibull_model, categories, score,
0.5, args.weibull_alpha, "euclidean")
# print(f"so {so} \n ss {ss}")# openmax_prob, softmax_prob
pred_softmax.append(np.argmax(ss))
pred_softmax_threshold.append(np.argmax(ss) if np.max(ss) >= args.weibull_threshold else args.train_class_num)
pred_openmax.append(np.argmax(so) if np.max(so) >= args.weibull_threshold else args.train_class_num)
score_softmax.append(ss)
score_openmax.append(so)
print("Evaluation...")
# test_loss += criterion(torch.Tensor(score_softmax), torch.from_numpy(labels))
test_loss += criterion(torch.Tensor(score_openmax), torch.from_numpy(labels))
eval_softmax = Evaluation(pred_softmax, labels, score_softmax)
eval_softmax_threshold = Evaluation(pred_softmax_threshold, labels, score_softmax)
eval_openmax = Evaluation(pred_openmax, labels, score_openmax)
torch.save(eval_softmax, os.path.join(args.checkpoint, 'eval_softmax.pkl'))
torch.save(eval_softmax_threshold, os.path.join(args.checkpoint, 'eval_softmax_threshold.pkl'))
torch.save(eval_openmax, os.path.join(args.checkpoint, 'eval_openmax.pkl'))
print(f"Softmax accuracy is %.3f" % (eval_softmax.accuracy))
print(f"Softmax F1 is %.3f" % (eval_softmax.f1_measure))
print(f"Softmax f1_macro is %.3f" % (eval_softmax.f1_macro))
print(f"Softmax f1_macro_weighted is %.3f" % (eval_softmax.f1_macro_weighted))
print(f"Softmax area_under_roc is %.3f" % (eval_softmax.area_under_roc))
print(f"_________________________________________")
print(f"SoftmaxThreshold accuracy is %.3f" % (eval_softmax_threshold.accuracy))
print(f"SoftmaxThreshold F1 is %.3f" % (eval_softmax_threshold.f1_measure))
print(f"SoftmaxThreshold f1_macro is %.3f" % (eval_softmax_threshold.f1_macro))
print(f"SoftmaxThreshold f1_macro_weighted is %.3f" % (eval_softmax_threshold.f1_macro_weighted))
print(f"SoftmaxThreshold area_under_roc is %.3f" % (eval_softmax_threshold.area_under_roc))
print(f"_________________________________________")
print(f"OpenMax accuracy is %.3f" % (eval_openmax.accuracy))
print(f"OpenMax F1 is %.3f" % (eval_openmax.f1_measure))
print(f"OpenMax f1_macro is %.3f" % (eval_openmax.f1_macro))
print(f"OpenMax f1_macro_weighted is %.3f" % (eval_openmax.f1_macro_weighted))
print(f"OpenMax area_under_roc is %.3f" % (eval_openmax.area_under_roc))
print(f"_________________________________________")
with open(os.path.join(args.checkpoint, "garbage.csv"),"ab") as f:
np.savetxt(f,np.array([epoch]))
np.savetxt(f, np.array([eval_softmax.f1_measure, eval_softmax.f1_macro,
eval_softmax.f1_macro_weighted,
eval_softmax.area_under_roc]).reshape(1, 4),
fmt='%.4f')
np.savetxt(f, np.array([eval_softmax_threshold.f1_measure,
eval_softmax_threshold.f1_macro,
eval_softmax_threshold.f1_macro_weighted,
eval_softmax_threshold.area_under_roc
]).reshape(1, 4),
fmt='%.4f')
np.savetxt(f, eval_softmax_threshold.confusion_matrix, fmt='%d')
np.savetxt(f, np.array([eval_openmax.f1_measure, eval_openmax.f1_macro,
eval_openmax.f1_macro_weighted,
eval_openmax.area_under_roc]).reshape(1, 4),
fmt='%.4f')
np.savetxt(f, eval_openmax.confusion_matrix, fmt='%d')
else:
def softmax(x):
e_x = np.exp(x - np.max(x))
return e_x / e_x.sum()
pred_softmax,score_softmax=[],[]
for score in scores:
softmax_prob = softmax(np.array(score.ravel()))
pred_softmax.append(np.argmax(softmax_prob))
score_softmax.append(softmax_prob)
eval_softmax = Evaluation(pred_softmax, labels, score_softmax)
print(f"Softmax accuracy is %.3f" % (eval_softmax.accuracy))
print(f"Softmax F1 is %.3f" % (eval_softmax.f1_measure))
print(f"Softmax f1_macro is %.3f" % (eval_softmax.f1_macro))
print(f"Softmax f1_macro_weighted is %.3f" % (eval_softmax.f1_macro_weighted))
print(f"Softmax area_under_roc is %.3f" % (eval_softmax.area_under_roc))
print(f"_________________________________________")
with open(os.path.join(args.checkpoint, "garbage_closed.csv"),"ab") as f:
np.savetxt(f,np.array([epoch]))
np.savetxt(f, np.array([eval_softmax.f1_measure, eval_softmax.f1_macro,
eval_softmax.f1_macro_weighted,
eval_softmax.area_under_roc]).reshape(1, 4),
fmt='%.4f')
np.savetxt(f, eval_softmax.confusion_matrix, fmt='%d')
return test_loss/(batch_idx+1), correct/total
def save_model(net, acc, epoch, path):
print('Saving..')
state = {
'net': net.state_dict(),
'testacc': acc,
'epoch': epoch,
}
# torch.save(state, path)
torch.save(net.state_dict(), path)
if __name__=="__main__":
main()
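For reference, a minimal inference sketch against a checkpoint produced by this script. This is an assumption-laden example (ResNet18 branch, 24 training classes, and the checkpoint path shown below); if training ran under DataParallel, the saved keys carry a 'module.' prefix, which is stripped the same way the --resume branch above does.

import torch
import torch.nn as nn
import torchvision

device = 'cuda' if torch.cuda.is_available() else 'cpu'
net = torchvision.models.resnet18(pretrained=False)
net.fc = nn.Sequential(
    nn.Linear(net.fc.in_features, 256),
    nn.ReLU(),
    nn.Dropout(0.4),
    nn.Linear(256, 24),  # must match the --train_class_num used for training
)
state = torch.load('./checkpoints/garbage/ResNet18/best_model.pth', map_location=device)
state = {k.replace('module.', ''): v for k, v in state.items()}  # strip DataParallel prefix if present
net.load_state_dict(state)
net.to(device).eval()

with torch.no_grad():
    logits = net(torch.randn(1, 3, 256, 256, device=device))  # picture_size is 256 in this script
print(logits.shape)  # torch.Size([1, 24])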
efficientnet.py
'''
python3.7
-*- coding: UTF-8 -*-
@Project -> File :pythonProject -> efficientNet
@IDE :PyCharm
@Author :YangShouWei
@USER:
@Date :2022/3/15 21:41:59
@LastEditor:
'''
import math
import copy
from functools import partial
from collections import OrderedDict
from typing import Optional, Callable
import torch
from torch import nn
from torch import Tensor
from torch.nn import functional as F
def _make_divisible(ch, divisor=8, min_ch=None):
"""
This function is taken from the original tf repo.
It ensures that all layers have a channel number that is divisible by 8.
"""
if min_ch is None:
min_ch = divisor
new_ch = max(min_ch, int(ch + divisor / 2) // divisor * divisor)
# Make sure that rounding down does not reduce the channel count by more than 10%
if new_ch < 0.9 * ch:
new_ch += divisor
return new_ch
def drop_path(x, drop_prob: float = 0., training:bool = False):
"""
Drop paths (Stochastic Depth) per sample (when applied in main path of residual blocks).
This function is taken from the rwightman (timm) implementation.
"""
if drop_prob == 0. or not training:
return x
keep_prob = 1 - drop_prob
shape = (x.shape[0],) + (1,) * (x.ndim - 1) # work with diff dim tensor, not just 2D ConvNets
random_tensor = keep_prob + torch.rand(shape, dtype=x.dtype, device=x.device)
random_tensor.floor_() #binarize
output = x.div(keep_prob) * random_tensor
return output
class DropPath(nn.Module):
"""
Drop paths (Stochastic Depth) per sample (when applied in main path of residual blocks).
"""
def __init__(self, drop_prob=None):
super(DropPath, self).__init__()
self.drop_prob = drop_prob
def forward(self, x):
return drop_path(x, self.drop_prob, self.training)
class ConvBNActivation(nn.Sequential):
def __init__(self,
in_planes: int,
out_planes:int,
kernel_size : int = 3,
stride: int = 1,
groups: int = 1,
norm_layer: Optional[Callable[..., nn.Module]] = None,
activation_layer:Optional[Callable[..., nn.Module]] = None):
padding = (kernel_size - 1) // 2
if norm_layer is None:
norm_layer = nn.BatchNorm2d
if activation_layer is None:
activation_layer = nn.SiLU
super(ConvBNActivation, self).__init__(nn.Conv2d(in_channels=in_planes,
out_channels=out_planes,
kernel_size=kernel_size,
stride=stride,
padding=padding,
groups=groups,
bias=False),
norm_layer(out_planes),
activation_layer())
class SqueezeExcitation(nn.Module):
def __init__(self,
input_c:int, # block input channel
expand_c:int, # block expand channel
squeeze_factor:int = 4):
super(SqueezeExcitation, self).__init__()
squeeze_c = input_c // squeeze_factor
self.fc1 = nn.Conv2d(expand_c,squeeze_c, 1)
self.ac1 = nn.SiLU()
self.fc2 = nn.Conv2d(squeeze_c, expand_c, 1)
self.ac2 = nn.Sigmoid()
def forward(self, x:Tensor):
scale = F.adaptive_avg_pool2d(x, output_size=(1, 1))
scale = self.fc1(scale)
scale = self.ac1(scale)
scale = self.fc2(scale)
scale = self.ac2(scale)
return scale * x
class InvertedResidualConfig:
#kernel_size, in_channel, out_channel, exp_ratio, strides, use_SE, drop_connect_rate
def __init__(self,
kernel: int,
input_c: int,
out_c: int,
expanded_ratio: int, # 1 or 6
stride: int, # 1 or 2
use_se: bool, # True
drop_rate: float,
index: str, #1a, 2a, 2b, ...
width_coefficient:float):
self.input_c = self.adjust_channels(input_c, width_coefficient)
self.kernel = kernel
self.expanded_c = self.input_c * expanded_ratio
self.out_c =self.adjust_channels(out_c, width_coefficient)
self.use_se = use_se
self.stride = stride
self.drop_rate = drop_rate
self.index = index
@staticmethod  # static method
def adjust_channels(channels: int, width_coefficient: float):
return _make_divisible(channels * width_coefficient, 8)  # scale the channel count by the width coefficient, then round to the nearest multiple of 8
class InvertedResidual(nn.Module):
def __init__(self,
cnf:InvertedResidualConfig,
norm_layer: Callable[..., nn.Module]):
super(InvertedResidual, self).__init__()
if cnf.stride not in [1, 2]:
raise ValueError("illegal stride value")
self.use_res_connect = (cnf.stride == 1 and cnf.input_c == cnf.out_c)  # use a shortcut connection only when stride is 1 and in/out channels match
layers = OrderedDict()
activation_layer = nn.SiLU
# expand
if cnf.expanded_c != cnf.input_c:
layers.update({"expand_conv": ConvBNActivation(cnf.input_c,
cnf.expanded_c,
kernel_size=1,
norm_layer=norm_layer,
activation_layer=activation_layer)})
# depthwise
layers.update({"dwconv":ConvBNActivation(cnf.expanded_c,
cnf.expanded_c,
kernel_size=cnf.kernel,
stride=cnf.stride,
groups=cnf.expanded_c,
norm_layer=norm_layer,
activation_layer=activation_layer)})
if cnf.use_se:
layers.update({"se": SqueezeExcitation(cnf.input_c,
cnf.expanded_c)})
#project
layers.update({"project_conv": ConvBNActivation(cnf.expanded_c,
cnf.out_c,
kernel_size=1,
norm_layer=norm_layer,
activation_layer=nn.Identity)})  # Identity means no activation is applied after the projection conv
self.block = nn.Sequential(layers)
self.out_channels = cnf.out_c
self.is_strided = cnf.stride > 1
# the stochastic-depth (DropPath) layer is only used when the shortcut connection is active
if self.use_res_connect and cnf.drop_rate > 0:
self.dropout = DropPath(cnf.drop_rate)
else:
self.dropout = nn.Identity()
def forward(self, x:Tensor) -> Tensor:
result = self.block(x)
result = self.dropout(result)
if self.use_res_connect:
result += x
return result
class EfficientNet(nn.Module):
def __init__(self,
width_coefficient: float,
depth_coefficient: float,
num_classes: int = 1000,
dropout_rate: float = 0.2,
drop_connect_rate: float = 0.2,
block: Optional[Callable[..., nn.Module]] = None,
norm_layer :Optional[Callable[..., nn.Module]] = None):
super(EfficientNet, self).__init__()
# kernel_size, in_channel, out_channel, exp_ratio, strides, use_SE, drop_connect_rate, repeats
default_cnf = [[3, 32, 16, 1, 1, True, drop_connect_rate, 1],
[3, 16, 24, 6, 2, True, drop_connect_rate, 2],
[5, 24, 40, 6, 2, True, drop_connect_rate, 2],
[3, 40, 80, 6, 2, True, drop_connect_rate, 3],
[5, 80, 112, 6, 1, True, drop_connect_rate, 3],
[5, 112, 192, 6, 2, True, drop_connect_rate, 4],
[3, 192, 320, 6, 1, True, drop_connect_rate, 1],]
def round_repeats(repeats):
"""Round number of repeats based on depth multiplier."""
return int(math.ceil(depth_coefficient * repeats))
if block is None:
block = InvertedResidual
if norm_layer is None:
norm_layer = partial(nn.BatchNorm2d, eps=1e-3, momentum=0.1)
adjust_channels = partial(InvertedResidualConfig.adjust_channels,
width_coefficient=width_coefficient)
#bneck inverted_residual_setting
bneck_conf = partial(InvertedResidualConfig, width_coefficient=width_coefficient)
b = 0
num_blocks = float(sum(round_repeats(i[-1]) for i in default_cnf))
inverted_residual_setting = []
for stage, args in enumerate(default_cnf):
cnf = copy.copy(args)
for i in range(round_repeats(cnf.pop(-1))):
if i > 0:
# stride equals 1 except for the first block of each stage
cnf[-3] = 1 #strides
cnf[1] = cnf[2] # input_channel equal output_channel
cnf[-1] = args[-2] * b / num_blocks # update dropout ratio
index = str(stage + 1) + chr(i + 97) # 1a, 2a, 2b
inverted_residual_setting.append(bneck_conf(*cnf, index))
b += 1
#create layers
layers = OrderedDict()
# first conv
layers.update({'stem_conv': ConvBNActivation(in_planes=3,
out_planes=adjust_channels(32),
kernel_size=3,
stride=2,
norm_layer=norm_layer)})
# building inverted residual blocks
for cnf in inverted_residual_setting:
layers.update({cnf.index: block(cnf, norm_layer)})
# build top
last_conv_input_c = inverted_residual_setting[-1].out_c
last_conv_output_c = adjust_channels(1280)
layers.update({"top": ConvBNActivation(in_planes=last_conv_input_c,
out_planes=last_conv_output_c,
kernel_size=1,
norm_layer=norm_layer
)})
self.features = nn.Sequential(layers)
self.avgpool = nn.AdaptiveAvgPool2d(1)
classifier = []
if dropout_rate > 0:
classifier.append(nn.Dropout(p=dropout_rate, inplace=True))
classifier.append(nn.Linear(last_conv_output_c, num_classes))
self.classifier = nn.Sequential(*classifier)
# initial weights
for m in self.modules():
if isinstance(m, nn.Conv2d):
nn.init.kaiming_normal_(m.weight, mode="fan_out")
if m.bias is not None:
nn.init.zeros_(m.bias)
elif isinstance(m, nn.BatchNorm2d):
nn.init.ones_(m.weight)
nn.init.zeros_(m.bias)
elif isinstance(m, nn.Linear):
nn.init.normal_(m.weight, 0, 0.01)
nn.init.zeros_(m.bias)
def _forward_impl(self, x:Tensor):
x = self.features(x)
x = self.avgpool(x)
x = torch.flatten(x, 1)
x = self.classifier(x)
return x
def forward(self, x:Tensor) -> Tensor:
return self._forward_impl(x)
def efficientnet_b0(num_classes=1000):
return EfficientNet(width_coefficient=1.0, depth_coefficient=1.0, dropout_rate=0.2, num_classes=num_classes)
def efficientnet_b1(num_classes=1000):
return EfficientNet(width_coefficient=1.0, depth_coefficient=1.1, dropout_rate=0.2, num_classes=num_classes)
def efficientnet_b2(num_classes=1000):
return EfficientNet(width_coefficient=1.1, depth_coefficient=1.2, dropout_rate=0.3, num_classes=num_classes)
def efficientnet_b3(num_classes=1000):
return EfficientNet(width_coefficient=1.2, depth_coefficient=1.4, dropout_rate=0.3, num_classes=num_classes)
def efficientnet_b4(num_classes=1000):
return EfficientNet(width_coefficient=1.4, depth_coefficient=1.8, dropout_rate=0.4, num_classes=num_classes)
def efficientnet_b5(num_classes=1000):
return EfficientNet(width_coefficient=1.6, depth_coefficient=2.2, dropout_rate=0.4, num_classes=num_classes)
def efficientnet_b6(num_classes=1000):
return EfficientNet(width_coefficient=1.8, depth_coefficient=2.6, dropout_rate=0.5, num_classes=num_classes)
def efficientnet_b7(num_classes=1000):
return EfficientNet(width_coefficient=2.0, depth_coefficient=3.1, dropout_rate=0.5, num_classes=num_classes)
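A quick shape check for the backbone above; this assumes the same package layout as task_garbage.py, where the file is imported as checkpoints.efficientnet.

import torch
from checkpoints import efficientnet  # same import path used in task_garbage.py

net = efficientnet.efficientnet_b5(num_classes=24).eval()
x = torch.randn(2, 3, 256, 256)  # picture_size used during training
with torch.no_grad():
    out = net(x)
print(out.shape)  # torch.Size([2, 24])
# For B5 the top conv has _make_divisible(1280 * 1.6) = 2048 output channels, which is why
# task_garbage.py replaces net.classifier with nn.Linear(2048, train_class_num).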
openmax.py
import numpy as np
import scipy.spatial.distance as spd
import torch
import libmr
def calc_distance(query_score, mcv, eu_weight, distance_type='eucos'):
if distance_type == 'eucos':
query_distance = spd.euclidean(mcv, query_score) * eu_weight + \
spd.cosine(mcv, query_score)
elif distance_type == 'euclidean':
query_distance = spd.euclidean(mcv, query_score)
elif distance_type == 'cosine':
query_distance = spd.cosine(mcv, query_score)
else:
raise ValueError("distance type not known: enter one of eucos, euclidean or cosine")
return query_distance
def fit_weibull(means, dists, categories, tailsize=20, distance_type='eucos'):
"""
Input:
means (C, channel, C)
dists (N_c, channel, C) * C
Output:
weibull_model : Perform EVT based analysis using tails of distances and save
weibull model parameters for re-adjusting softmax scores
"""
weibull_model = {}
for mean, dist, category_name in zip(means, dists, categories):
weibull_model[category_name] = {}
weibull_model[category_name]['distances_{}'.format(distance_type)] = dist[distance_type]
weibull_model[category_name]['mean_vec'] = mean
weibull_model[category_name]['weibull_model'] = []
for channel in range(mean.shape[0]):
mr = libmr.MR()
tailtofit = np.sort(dist[distance_type][channel, :])[-tailsize:]
mr.fit_high(tailtofit, len(tailtofit))
weibull_model[category_name]['weibull_model'].append(mr)
return weibull_model
def query_weibull(category_name, weibull_model, distance_type='eucos'):
return [weibull_model[category_name]['mean_vec'],
weibull_model[category_name]['distances_{}'.format(distance_type)],
weibull_model[category_name]['weibull_model']]
def compute_openmax_prob(scores, scores_u):
prob_scores, prob_unknowns = [], []
for s, su in zip(scores, scores_u):
channel_scores = np.exp(s)
channel_unknown = np.exp(np.sum(su))
total_denom = np.sum(channel_scores) + channel_unknown
prob_scores.append(channel_scores / total_denom)
prob_unknowns.append(channel_unknown / total_denom)
# Take channel mean
scores = np.mean(prob_scores, axis=0)
unknowns = np.mean(prob_unknowns, axis=0)
modified_scores = scores.tolist() + [unknowns]
return modified_scores
def softmax(x):
e_x = np.exp(x - np.max(x))
return e_x / e_x.sum()
def openmax(weibull_model, categories, input_score, eu_weight, alpha=10, distance_type='eucos'):
"""Re-calibrate scores via OpenMax layer
Output:
openmax probability and softmax probability
"""
nb_classes = len(categories)
ranked_list = input_score.argsort().ravel()[::-1][:alpha]
alpha_weights = [((alpha + 1) - i) / float(alpha) for i in range(1, alpha + 1)]
omega = np.zeros(nb_classes)
omega[ranked_list] = alpha_weights
scores, scores_u = [], []
for channel, input_score_channel in enumerate(input_score):
score_channel, score_channel_u = [], []
for c, category_name in enumerate(categories):
mav, dist, model = query_weibull(category_name, weibull_model, distance_type)
channel_dist = calc_distance(input_score_channel, mav[channel], eu_weight, distance_type)
wscore = model[channel].w_score(channel_dist)
modified_score = input_score_channel[c] * (1 - wscore * omega[c])  # v_hat_i(x) = v_i(x) * (1 - w_i(x) * omega_i)
score_channel.append(modified_score)
score_channel_u.append(input_score_channel[c] - modified_score)  # the removed mass contributes to the unknown score v_hat_0(x)
scores.append(score_channel)
scores_u.append(score_channel_u)
scores = np.asarray(scores)
scores_u = np.asarray(scores_u)
openmax_prob = np.array(compute_openmax_prob(scores, scores_u))
softmax_prob = softmax(np.array(input_score.ravel()))
return openmax_prob, softmax_prob
def compute_channel_distances(mavs, features, eu_weight=0.5):
"""
Input:
mavs (channel, C)
features: (N, channel, C)
Output:
channel_distances: dict of distance distribution from MAV for each channel.
"""
eucos_dists, eu_dists, cos_dists = [], [], []
for channel, mcv in enumerate(mavs): # Compute channel specific distances
eu_dists.append([spd.euclidean(mcv, feat[channel]) for feat in features])
cos_dists.append([spd.cosine(mcv, feat[channel]) for feat in features])
eucos_dists.append([spd.euclidean(mcv, feat[channel]) * eu_weight +
spd.cosine(mcv, feat[channel]) for feat in features])
return {'eucos': np.array(eucos_dists), 'cosine': np.array(cos_dists), 'euclidean': np.array(eu_dists)}
def compute_train_score_and_mavs_and_dists(train_class_num,trainloader, device, net, test_classes):
scores = [[] for _ in range(train_class_num)]
with torch.no_grad():
for batch_idx, (inputs, targets) in enumerate(trainloader):
onehot_targets_index = [test_classes.index(i) for i in targets]
targets = torch.LongTensor(onehot_targets_index)
inputs, targets = inputs.to(device), targets.to(device)
# this must cause error for cifar10
outputs = net(inputs)
for score, t in zip(outputs, targets):
# print(f"torch.argmax(score) is {torch.argmax(score)}, t is {t}")
if torch.argmax(score) == t:
scores[t].append(score.unsqueeze(dim=0).unsqueeze(dim=0))
scores = [torch.cat(x).cpu().numpy() for x in scores] # (N_c, 1, C) * C
mavs = np.array([np.mean(x, axis=0) for x in scores]) # (C, 1, C)
dists = [compute_channel_distances(mcv, score) for mcv, score in zip(mavs, scores)]
return scores, mavs, dists
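To see what compute_openmax_prob does, here is a toy recalibration with made-up numbers: part of each top-ranked activation is removed (in the real pipeline the removal weight comes from the fitted Weibull model and the alpha ranking inside openmax()), and the removed mass becomes an extra unknown class.

import numpy as np
from openmax import compute_openmax_prob, softmax  # functions defined above

raw = np.array([4.0, 1.0, 0.5])   # hypothetical activation vector for 3 known classes
w = np.array([0.6, 0.0, 0.0])     # hypothetical rejection weights (Weibull w_score * omega)
modified = raw * (1 - w)          # revised per-class scores, as in openmax()
unknown_mass = raw - modified     # the removed part feeds the unknown class

openmax_prob = compute_openmax_prob([modified], [unknown_mass])  # a single "channel"
print(np.round(openmax_prob, 3))  # 4 probabilities: 3 known classes + unknown
print(np.round(softmax(raw), 3))  # plain softmax over the 3 known classes, for comparison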
evaluation.py
import numpy as np
import matplotlib.pyplot as plt
from sklearn.metrics import confusion_matrix, f1_score, \
classification_report, precision_recall_fscore_support, roc_auc_score
from sklearn.preprocessing import OneHotEncoder
# import sklearn.metrics.ConfusionMatrixDisplay
class Evaluation(object):
"""Evaluation class based on python list"""
def __init__(self, predict, label,prediction_scores = None):
self.predict = predict
self.label = label
self.prediction_scores = prediction_scores
self.accuracy = self._accuracy()
self.f1_measure = self._f1_measure()
self.f1_macro = self._f1_macro()
self.f1_macro_weighted = self._f1_macro_weighted()
self.precision, self.recall = self._precision_recall(average='micro')
self.precision_macro, self.recall_macro = self._precision_recall(average='macro')
self.precision_weighted, self.recall_weighted = self._precision_recall(average='weighted')
self.confusion_matrix = self._confusion_matrix()
if self.prediction_scores is not None:
self.area_under_roc = self._area_under_roc(prediction_scores)
pass
def _accuracy(self) -> float:
"""
Returns the accuracy score of the labels and predictions.
:return: float
"""
assert len(self.predict) == len(self.label)
correct = (np.array(self.predict) == np.array(self.label)).sum()
return float(correct)/float(len(self.predict))
def _f1_measure(self) -> float:
"""
Returns the F1-measure with a micro average of the labels and predictions.
:return: float
"""
assert len(self.predict) == len(self.label)
return f1_score(self.label, self.predict, average='micro')
def _f1_macro(self) -> float:
"""
Returns the F1-measure with a macro average of the labels and predictions.
:return: float
"""
assert len(self.predict) == len(self.label)
return f1_score(self.label, self.predict, average='macro')
def _f1_macro_weighted(self) -> float:
"""
Returns the F1-measure with a weighted macro average of the labels and predictions.
:return: float
"""
assert len(self.predict) == len(self.label)
return f1_score(self.label, self.predict, average='weighted')
def _precision_recall(self, average) -> (float, float):
"""
Returns the precision and recall scores for the label and predictions. Observes the average type.
:param average: string, [None (default), ‘micro’, ‘macro’, ‘samples’, ‘weighted’].
For explanations of each type of average see the documentation for
`sklearn.metrics.precision_recall_fscore_support`
:return: float, float: representing the precision and recall scores respectively
"""
assert len(self.predict) == len(self.label)
precision, recall, _, _ = precision_recall_fscore_support(self.label, self.predict, average=average)
return precision, recall
def _area_under_roc(self, prediction_scores: np.array = None, multi_class='ovo') -> float:
"""
Area Under Receiver Operating Characteristic Curve
:param prediction_scores: array-like of shape (n_samples, n_classes). The multi-class ROC curve requires
prediction scores for each class. If not specified, will generate its own prediction scores that assume
100% confidence in selected prediction.
:param multi_class: {'ovo', 'ovr'}, default='ovo'
'ovo' computes the average AUC of all possible pairwise combinations of classes.
'ovr' Computes the AUC of each class against the rest.
:return: float representing the area under the ROC curve
"""
label, predict = self.label, self.predict
one_hot_encoder = OneHotEncoder(sparse=False, handle_unknown='ignore')
one_hot_encoder.fit(np.array(label).reshape(-1, 1))
true_scores = one_hot_encoder.transform(np.array(label).reshape(-1, 1))
if prediction_scores is None:
prediction_scores = one_hot_encoder.transform(np.array(predict).reshape(-1, 1))
# assert prediction_scores.shape == true_scores.shape
# return roc_auc_score(true_scores, prediction_scores, multi_class=multi_class)
return roc_auc_score(true_scores, prediction_scores)
def _confusion_matrix(self, normalize=None) -> np.array:
"""
Returns the confusion matrix corresponding to the labels and predictions.
:param normalize: {‘true’, ‘pred’, ‘all’}, default=None.
Normalizes confusion matrix over the true (rows), predicted (columns) conditions or all the population.
If None, confusion matrix will not be normalized.
:return:
"""
assert len(self.predict) == len(self.label)
# return confusion_matrix(self.label, self.predict, normalize=normalize)
return confusion_matrix(self.label, self.predict)
def plot_confusion_matrix(self, labels: [str] = None, normalize=None, ax=None, savepath=None) -> None:
"""
:param labels: [str]: label names
:param normalize: {‘true’, ‘pred’, ‘all’}, default=None.
Normalizes confusion matrix over the true (rows), predicted (columns) conditions or all the population.
If None, confusion matrix will not be normalized.
:param ax: matplotlib.pyplot axes to draw the confusion matrix on. Will generate new figure/axes if None.
:return:
"""
conf_matrix = self._confusion_matrix(normalize) # Evaluate the confusion matrix
# display = ConfusionMatrixDisplay(conf_matrix, display_labels=labels) # Generate the confusion matrix display
# Formatting for the plot
if labels:
xticks_rotation = 'vertical'
else:
xticks_rotation = 'horizontal'
# display.plot(include_values=True, cmap=plt.cm.get_cmap('Blues'), xticks_rotation=xticks_rotation, ax=ax)
if savepath is None:
plt.show()
else:
plt.savefig(savepath, bbox_inches='tight', dpi=200)
plt.close()
if __name__ == '__main__':
predict = [1, 2, 3, 4, 5, 3, 3, 2, 2, 5, 6, 6, 4, 3, 2, 4, 5, 6, 6, 3, 2]
label = [2, 5, 3, 4, 5, 3, 2, 2, 4, 6, 6, 6, 3, 3, 2, 5, 5, 6, 6, 3, 3]
eval = Evaluation(predict, label)
print('Accuracy:', f"%.3f" % eval.accuracy)
print('F1-measure:', f'{eval.f1_measure:.3f}')
print('F1-macro:', f'{eval.f1_macro:.3f}')
print('F1-macro (weighted):', f'{eval.f1_macro_weighted:.3f}')
print('precision:', f'{eval.precision:.3f}')
print('precision (macro):', f'{eval.precision_macro:.3f}')
print('precision (weighted):', f'{eval.precision_weighted:.3f}')
print('recall:', f'{eval.recall:.3f}')
print('recall (macro):', f'{eval.recall_macro:.3f}')
print('recall (weighted):', f'{eval.recall_weighted:.3f}')
# Generate "random prediction score" to test feeding in prediction score from NN
test_one_hot_encoder = OneHotEncoder(sparse=False, handle_unknown='ignore')
test_one_hot_encoder.fit(np.array(label).reshape(-1, 1))
rand_prediction_scores = 2 * test_one_hot_encoder.transform(np.array(predict).reshape(-1, 1)) # One hot
rand_prediction_scores += np.random.rand(*rand_prediction_scores.shape)
# rand_prediction_scores /= rand_prediction_scores.sum(axis=1)[:, None]
# print('Area under ROC curve (with 100% confidence in prediction):', f'{eval.area_under_roc():.3f}')
# print('Area under ROC curve (variable probability across classes):',
# f'{eval.area_under_roc(prediction_scores=rand_prediction_scores):.3f}')
# print(eval.confusion_matrix)
label_names = ["bird","bog","perople","horse","cat", "unknown"]
eval.plot_confusion_matrix(normalize="true",labels=label_names)
# print("运行到这了")
print(classification_report(label, predict, digits=3))
cifarutils.py
'''Some helper functions for PyTorch, including:
- get_mean_and_std: calculate the mean and std value of dataset.
- msr_init: net parameter initialization.
- progress_bar: progress bar mimic xlua.progress.
'''
import os
import sys
import time
import errno
import shutil
import torch
import torch.nn as nn
import torch.nn.init as init
import torchvision.utils as vutils
__all__=["get_mean_and_std","progress_bar","format_time",
'adjust_learning_rate', 'AverageMeter','Logger','mkdir_p', 'save_binary_img', 'save_model']
def get_mean_and_std(dataset):
'''Compute the mean and std value of dataset.'''
dataloader = torch.utils.data.DataLoader(dataset, batch_size=1, shuffle=True, num_workers=2)
mean = torch.zeros(3)
std = torch.zeros(3)
print('==> Computing mean and std..')
for inputs, targets in dataloader:
for i in range(3):
mean[i] += inputs[:,i,:,:].mean()
std[i] += inputs[:,i,:,:].std()
mean.div_(len(dataset))
std.div_(len(dataset))
return mean, std
def init_params(net):
'''Init layer parameters.'''
for m in net.modules():
if isinstance(m, nn.Conv2d):
init.kaiming_normal_(m.weight, mode='fan_out')
if m.bias is not None:
init.constant_(m.bias, 0)
elif isinstance(m, nn.BatchNorm2d):
init.constant_(m.weight, 1)
init.constant_(m.bias, 0)
elif isinstance(m, nn.Linear):
init.normal_(m.weight, std=1e-3)
if m.bias is not None:
init.constant_(m.bias, 0)
# _, term_width = os.popen('stty size', 'r').read().split()
# term_width = int(term_width)
TOTAL_BAR_LENGTH = 65.
last_time = time.time()
begin_time = last_time
def progress_bar(current, total, msg=None):
global last_time, begin_time
if current == 0:
begin_time = time.time() # Reset for new bar.
cur_len = int(TOTAL_BAR_LENGTH*current/total)
rest_len = int(TOTAL_BAR_LENGTH - cur_len) - 1
sys.stdout.write(' [')
for i in range(cur_len):
sys.stdout.write('=')
sys.stdout.write('>')
for i in range(rest_len):
sys.stdout.write('.')
sys.stdout.write(']')
cur_time = time.time()
step_time = cur_time - last_time
last_time = cur_time
tot_time = cur_time - begin_time
L = []
L.append(' Step: %s' % format_time(step_time))
L.append(' | Tot: %s' % format_time(tot_time))
if msg:
L.append(' | ' + msg)
msg = ''.join(L)
sys.stdout.write(msg)
# for i in range(term_width-int(TOTAL_BAR_LENGTH)-len(msg)-3):
# sys.stdout.write(' ')
# Go back to the center of the bar.
# for i in range(term_width-int(TOTAL_BAR_LENGTH/2)+2):
# sys.stdout.write('\b')
sys.stdout.write(' %d/%d ' % (current+1, total))
if current < total-1:
sys.stdout.write('\r')
else:
sys.stdout.write('\n')
sys.stdout.flush()
def format_time(seconds):
days = int(seconds / 3600/24)
seconds = seconds - days*3600*24
hours = int(seconds / 3600)
seconds = seconds - hours*3600
minutes = int(seconds / 60)
seconds = seconds - minutes*60
secondsf = int(seconds)
seconds = seconds - secondsf
millis = int(seconds*1000)
f = ''
i = 1
if days > 0:
f += str(days) + 'D'
i += 1
if hours > 0 and i <= 2:
f += str(hours) + 'h'
i += 1
if minutes > 0 and i <= 2:
f += str(minutes) + 'm'
i += 1
if secondsf > 0 and i <= 2:
f += str(secondsf) + 's'
i += 1
if millis > 0 and i <= 2:
f += str(millis) + 'ms'
i += 1
if f == '':
f = '0ms'
return f
def write_record(file_path,str):
if not os.path.exists(file_path):
# os.makedirs(file_path)
os.system(r"touch {}".format(file_path))
f = open(file_path, 'a')
f.write(str)
f.close()
def count_parameters(model,all=True):
# If all=False, only the trainable parameters are counted; tested
return sum(p.numel() for p in model.parameters() if p.requires_grad or all)
def adjust_learning_rate(optimizer, epoch, lr,factor=0.1, step=30):
"""Sets the learning rate to the initial LR decayed by factor every step epochs"""
lr = lr * (factor ** (epoch // step))
for param_group in optimizer.param_groups:
param_group['lr'] = lr
class ProgressMeter(object):
def __init__(self, num_batches, meters, prefix=""):
self.batch_fmtstr = self._get_batch_fmtstr(num_batches)
self.meters = meters
self.prefix = prefix
def display(self, batch):
entries = [self.prefix + self.batch_fmtstr.format(batch)]
entries += [str(meter) for meter in self.meters]
print('\t'.join(entries))
def _get_batch_fmtstr(self, num_batches):
num_digits = len(str(num_batches // 1))
fmt = '{:' + str(num_digits) + 'd}'
return '[' + fmt + '/' + fmt.format(num_batches) + ']'
def accuracy(output, target, topk=(1,)):
"""Computes the accuracy over the k top predictions for the specified values of k"""
with torch.no_grad():
maxk = max(topk)
batch_size = target.size(0)
_, pred = output.topk(maxk, 1, True, True)
pred = pred.t()
correct = pred.eq(target.view(1, -1).expand_as(pred))
res = []
for k in topk:
correct_k = correct[:k].view(-1).float().sum(0, keepdim=True)
res.append(correct_k.mul_(100.0 / batch_size))
return res
def save_checkpoint(state, is_best, netName):
torch.save(state, './checkpoint/ckpt_imagenet32_' + netName + '_last.t7')
if is_best:
shutil.copyfile('./checkpoint/ckpt_imagenet32_' + netName + '_last.t7',
'./checkpoint/ckpt_imagenet32_' + netName + '_best.t7')
class AverageMeter(object):
"""Computes and stores the average and current value"""
def __init__(self, name, fmt=':f'):
self.name = name
self.fmt = fmt
self.reset()
def reset(self):
self.val = 0
self.avg = 0
self.sum = 0
self.count = 0
def update(self, val, n=1):
self.val = val
self.sum += val * n
self.count += n
self.avg = self.sum / self.count
def __str__(self):
fmtstr = '{name} {val' + self.fmt + '} ({avg' + self.fmt + '})'
return fmtstr.format(**self.__dict__)
class Logger(object):
'''Save training process to log file with simple plot function.'''
def __init__(self, fpath, title=None, resume=False):
self.file = None
self.resume = resume
self.title = '' if title == None else title
if fpath is not None:
if resume:
self.file = open(fpath, 'r')
name = self.file.readline()
self.names = name.rstrip().split('\t')
self.numbers = {}
for _, name in enumerate(self.names):
self.numbers[name] = []
for numbers in self.file:
numbers = numbers.rstrip().split('\t')
for i in range(0, len(numbers)):
self.numbers[self.names[i]].append(numbers[i])
self.file.close()
self.file = open(fpath, 'a')
else:
self.file = open(fpath, 'w')
def set_names(self, names):
if self.resume:
pass
# initialize numbers as empty list
self.numbers = {}
self.names = names
for _, name in enumerate(self.names):
self.file.write(name)
self.file.write('\t')
self.numbers[name] = []
self.file.write('\n')
self.file.flush()
def append(self, numbers):
assert len(self.names) == len(numbers), 'Numbers do not match names'
for index, num in enumerate(numbers):
self.file.write("{0:.6f}".format(num))
self.file.write('\t')
self.numbers[self.names[index]].append(num)
self.file.write('\n')
self.file.flush()
def close(self):
if self.file is not None:
self.file.close()
def mkdir_p(path):
'''make dir if not exist'''
try:
os.makedirs(path)
except OSError as exc: # Python >2.5
if exc.errno == errno.EEXIST and os.path.isdir(path):
pass
else:
raise
def save_model(net, optimizer, epoch, path, **kwargs):
state = {
'net': net.state_dict(),
'optimizer': optimizer.state_dict(),
'epoch': epoch
}
for key, value in kwargs.items():
state[key] = value
torch.save(state, path)
def save_binary_img(tensor, file_path="./val.png", nrow=8, binary=False):
# tensor [b,1,w,h]
predicted = tensor
if binary:
predicted = torch.sigmoid(tensor) > 0.5
vutils.save_image(predicted.float(), file_path,nrow=nrow)
garbage.py
'''
@File :garbage.py
@Author:cjh
@Date :2022/1/16 15:09
@Desc :
'''
import pickle
import torch.nn.functional as F
import torch
import torch.nn as nn
from torch.autograd import Variable
import torchvision.models as models
from torchvision import transforms, utils
from torch.utils.data import Dataset, DataLoader
from PIL import Image
import numpy as np
import torch.optim as optim
import os
import random
import cv2
from torchvision.datasets.vision import VisionDataset
unknown_class_index=999
class GARBAGE40_Dataset(VisionDataset):
training_file='/train.txt'
validating_file='/validate.txt'
testing_file='/test.txt'
classes = ['0','1','2','3','4','5','6','7','8','9',
'10','11','12','13','14','15','16','17','18','19',
'20','21','22','23','24','25','26','27','28','29',
'30', '31', '32', '33', '34', '35', '36', '37', '38', '39']
# def get_root(self):
# return os.getcwd()
def __init__(self, root, train=True, transform=None, target_transform=None,
train_class_num=24, test_class_num=40, includes_all_train_class=True,train_classes=None):
super(GARBAGE40_Dataset, self).__init__(root,transform=transform,
target_transform=target_transform)
self.train=train
if self.train:
data_file=self.training_file
else:
data_file=self.testing_file
self.ori_data,self.ori_targets=[],[]
self.init_data(txt=root+data_file)
self.ori_data, self.ori_targets=np.array(self.ori_data),np.array(self.ori_targets)
self._update_open_set(train_class_num, test_class_num, includes_all_train_class,train_classes)
def _update_open_set(self, train_class_num=24, test_class_num=40, includes_all_train_class=False,train_classes=None):
assert train_class_num > 0 and train_class_num <= 40  # at most 40 classes are available
if includes_all_train_class:
assert test_class_num >= train_class_num  # test classes must at least cover the training classes
class_list = list(range(len(self.classes))) #[0...39]
# train_classes = list(range(train_class_num))#[0...23]
if includes_all_train_class:
rnd = np.random.RandomState(42)
# unknown_list = list(range(train_class_num, 10))
unknown_list=[idx for idx in range(40) if idx not in train_classes]
test_classes = rnd.choice(unknown_list, test_class_num - train_class_num, replace=False).tolist()  # randomly pick (test_class_num - train_class_num) extra classes from the unknown list
test_classes = train_classes + test_classes
else:
rnd = np.random.RandomState(42)
test_classes = rnd.choice(class_list, test_class_num, replace=False).tolist()
# Update self.classes
selected_elements = [self.classes[index] for index in train_classes]
selected_elements.append(str(unknown_class_index) + '-unknown')
self.classes = selected_elements
# self.classes = test_classes
# update self.class_to_idx
# Ignore: due to the class_to_idx property
# self.class_to_idx = {_class: i for i, _class in enumerate(self.classes)}
# Processing data
if self.train:
indexes = [i for i, x in enumerate(self.ori_targets) if x in train_classes]
self.data = self.ori_data[indexes]
self.targets = [self.ori_targets[i]for i in indexes]
print(f"\tTraining data includes {train_class_num} classes, {len(self.targets)} samples.")
else:
indexes = [i for i, x in enumerate(self.ori_targets) if x in test_classes]
self.data = self.ori_data[indexes]
temp_test_classes = [x for x in test_classes if x not in train_classes]
train_and_test_classes = train_classes + temp_test_classes
self.targets = [self.ori_targets[i] for i in indexes]
for i in range(len(self.targets)):
if self.targets[i] in temp_test_classes:
self.targets[i] = unknown_class_index
print(f"\tTesting data includes {train_class_num + 1} classes (Original {test_class_num} classes),"
f" {len(self.targets)} samples.")
CTR=train_class_num
CTU=len(temp_test_classes)
CTA = CTR+CTU
self.openness = 1-np.sqrt(2*CTR/(CTR+CTA))
print(f"\tDuring testing, openness is {self.openness}.")
# how a single image is loaded given its path entry
def loader(self,fn):
path = self.root+'/'.join(fn[1:].split("/"))
return Image.open(path).convert('RGB')
def init_data(self,txt):
fh = open(txt, 'r')
for line in fh:  # iterate over the annotation file line by line
line = line.strip('\n')
line = line.rstrip('\n')  # remove any trailing newline characters
words = line.split()  # split on whitespace: image path and integer label
self.ori_data.append(words[0])
self.ori_targets.append(int(words[1]))
def __getitem__(self, index):
"""
Args:
index (int): Index
Returns:
tuple: (image, target) where target is index of the target class.
"""
fn, target = self.data[index],int(self.targets[index])
img = self.loader(fn)  # load the image from its path
if self.transform is not None:
img = self.transform(img)  # apply the transform pipeline (the image ends up as a Tensor)
if self.target_transform is not None:
target = self.target_transform(target)
return img, target
def __len__(self):
return len(self.data)
if __name__=="__main__":
import time
start1 = time.perf_counter()
# train_transforms = transforms.Compose([
# transforms.Resize(224),
# transforms.RandomResizedCrop(224, scale=(0.8, 1.0)),
# transforms.RandomHorizontalFlip(0.5),
# transforms.RandomRotation(10),
# transforms.ToTensor(),
# transforms.Normalize([0.5071, 0.4865, 0.4409], [0.2673, 0.2564, 0.2762]),
# ])
# test_transforms = transforms.Compose([
# transforms.Resize(224),
# transforms.RandomResizedCrop(224, scale=(0.8, 1.0)),
# transforms.RandomHorizontalFlip(0.5),
# transforms.RandomRotation(10),
# transforms.ToTensor(),
# transforms.Normalize([0.5071, 0.4865, 0.4409], [0.2673, 0.2564, 0.2762]),
# ])
train_transforms = transforms.Compose([
transforms.Resize(256),
transforms.CenterCrop(256),
transforms.RandomAffine(degrees=0, translate=(0.05, 0.05)),
transforms.RandomHorizontalFlip(),
transforms.ToTensor(),
transforms.Normalize(mean=[0.485, 0.456, 0.406], std=[0.229, 0.224, 0.225]),
])
test_transforms = transforms.Compose([
transforms.Resize(256),
transforms.CenterCrop(256),
transforms.ToTensor(),
transforms.Normalize(mean=[0.485, 0.456, 0.406], std=[0.229, 0.224, 0.225])
])
train_class_num=24
random.seed(42)
train_classes = random.sample(range(0, 40), train_class_num)
trainset = GARBAGE40_Dataset(root='../data/garbage', train=True,
transform=test_transforms,
train_class_num=train_class_num, test_class_num=40,
includes_all_train_class=True, train_classes=train_classes)
# testset=GARBAGE40_Dataset(root='../data/garbage', train=False,
# transform=test_transforms,
# train_class_num=40, test_class_num=40,
# includes_all_train_class=True,train_classes=train_classes)
trainloader=torch.utils.data.DataLoader(trainset, batch_size=128, shuffle=True, num_workers=4)
# testloader = torch.utils.data.DataLoader(testset, batch_size=128, shuffle=False, num_workers=4)
for i, (data, target) in enumerate(trainloader):
print()
end1 = time.perf_counter()
print("final is in : %s Seconds " % (end1 - start1))
garbage_transform.py
'''
@File :garbage_transform.py
@Author:cjh
@Date :2022/2/8 12:38
@Desc :
'''
import random
import math
import torch
from PIL import Image, ImageOps, ImageFilter
from torchvision import transforms
class Resize(object):
def __init__(self, size, interpolation=Image.BILINEAR):
self.size = size
self.interpolation = interpolation
def __call__(self, img):
# padding
ratio = self.size[0] / self.size[1]
w, h = img.size
if w / h < ratio:
t = int(h * ratio)
w_padding = (t - w) // 2
img = img.crop((-w_padding, 0, w+w_padding, h))
else:
t = int(w / ratio)
h_padding = (t - h) // 2
img = img.crop((0, -h_padding, w, h+h_padding))
img = img.resize(self.size, self.interpolation)
return img
class RandomRotate(object):
def __init__(self, degree, p=0.5):
self.degree = degree
self.p = p
def __call__(self, img):
if random.random() < self.p:
rotate_degree = random.uniform(-1*self.degree, self.degree)
img = img.rotate(rotate_degree, Image.BILINEAR)
return img
class RandomGaussianBlur(object):
def __init__(self, p=0.5):
self.p = p
def __call__(self, img):
if random.random() < self.p:
img = img.filter(ImageFilter.GaussianBlur(
radius=random.random()))
return img
class Cutout(object):
def __init__(self, probability=0.5, size=64, mean=[0.4914, 0.4822, 0.4465]):
self.probability = probability
self.mean = mean
self.size = size
def __call__(self, img):
if random.uniform(0, 1) > self.probability:
return img
h = self.size
w = self.size
for attempt in range(100):
area = img.size()[1] * img.size()[2]
if w < img.size()[2] and h < img.size()[1]:
x1 = random.randint(0, img.size()[1] - h)
y1 = random.randint(0, img.size()[2] - w)
if img.size()[0] == 3:
img[0, x1:x1 + h, y1:y1 + w] = self.mean[0]
img[1, x1:x1 + h, y1:y1 + w] = self.mean[1]
img[2, x1:x1 + h, y1:y1 + w] = self.mean[2]
else:
img[0, x1:x1 + h, y1:y1 + w] = self.mean[0]
return img
return img
class RandomErasing(object):
""" Randomly selects a rectangle region in an image and erases its pixels.
'Random Erasing Data Augmentation' by Zhong et al.
See https://arxiv.org/pdf/1708.04896.pdf
Args:
probability: The probability that the Random Erasing operation will be performed.
sl: Minimum proportion of erased area against input image.
sh: Maximum proportion of erased area against input image.
r1: Minimum aspect ratio of erased area.
mean: Erasing value.
"""
def __init__(self, probability=0.5, sl=0.02, sh=0.4, r1=0.3, mean=[0.4914, 0.4822, 0.4465]):
self.probability = probability
self.mean = mean
self.sl = sl
self.sh = sh
self.r1 = r1
def __call__(self, img):
if random.uniform(0, 1) > self.probability:
return img
for attempt in range(100):
area = img.size()[1] * img.size()[2]
target_area = random.uniform(self.sl, self.sh) * area
aspect_ratio = random.uniform(self.r1, 1 / self.r1)
h = int(round(math.sqrt(target_area * aspect_ratio)))
w = int(round(math.sqrt(target_area / aspect_ratio)))
if w < img.size()[2] and h < img.size()[1]:
x1 = random.randint(0, img.size()[1] - h)
y1 = random.randint(0, img.size()[2] - w)
if img.size()[0] == 3:
img[0, x1:x1 + h, y1:y1 + w] = self.mean[0]
img[1, x1:x1 + h, y1:y1 + w] = self.mean[1]
img[2, x1:x1 + h, y1:y1 + w] = self.mean[2]
else:
img[0, x1:x1 + h, y1:y1 + w] = self.mean[0]
return img
return img
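One placement note for these transforms: Resize operates on a PIL image, while Cutout and RandomErasing index into a CHW tensor, which is why they come after ToTensor() in the train_transforms of task_garbage.py. A minimal sketch (Cutout probability forced to 1.0 so the erase always fires):

from PIL import Image
from torchvision import transforms
from garbage_transform import Resize, Cutout  # classes defined above

pipeline = transforms.Compose([
    Resize((256, 256)),                                      # PIL in, PIL out
    transforms.ToTensor(),                                   # PIL -> CHW tensor
    Cutout(probability=1.0, size=64, mean=[0.0, 0.0, 0.0]),  # tensor in, tensor out
])
img = Image.new('RGB', (300, 200), color=(128, 128, 128))
out = pipeline(img)
print(out.shape, float(out.min()))  # torch.Size([3, 256, 256]) 0.0 inside the erased square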