kezunlin

使用TensorRT对caffe和pytorch onnx模型进行fp32和fp16推理

本文首发于个人博客https://kezunlin.me/post/bcdfb73c/，欢迎阅读最新内容！

TensorRT FP32/FP16 inference tutorial with Caffe and PyTorch (ONNX) MNIST models

Series

Part 1: install and configure tensorrt 4 on ubuntu 16.04
Part 2: tensorrt fp32 fp16 tutorial
Part 3: tensorrt int8 tutorial

Code Example

include headers

#include <algorithm>
#include <cassert>
#include <cmath>
#include <cstdint>
#include <cstdio>
#include <cstdlib>
#include <fstream>
#include <iomanip>
#include <iostream>
#include <memory>
#include <string>
#include <vector>

#include <cuda_runtime_api.h>

#include "NvCaffeParser.h"
#include "NvOnnxConfig.h"
#include "NvOnnxParser.h"
#include "NvInfer.h"
#include "common.h"

// Pull the TensorRT core and Caffe-parser namespaces into file scope so the
// sample can refer to IBuilder, ICudaEngine, ICaffeParser, etc. unqualified.
using namespace nvinfer1;
using namespace nvcaffeparser1;

// Logger instance handed to the TensorRT builder and runtime factory
// functions below and used to report ONNX parsing errors.
// (The Logger type is not defined in this file; presumably it comes from
// common.h -- TODO confirm.)
static Logger gLogger;

// Attributes of MNIST Caffe model
static const int INPUT_H = 28;      // input image height, in pixels
static const int INPUT_W = 28;      // input image width, in pixels
static const int OUTPUT_SIZE = 10;  // number of floats in the output buffer
// Input binding lookup by name is disabled; doInference() discovers the
// input/output bindings by iterating over the engine instead.
//const char* INPUT_BLOB_NAME = "data";
// Name of the Caffe blob that is marked as the network output.
const char* OUTPUT_BLOB_NAME = "prob";
// Directory prefix (with trailing slash) for the model files loaded below.
const std::string mnist_data_dir = "data/mnist/";


// Simple PGM (portable greyscale map) reader.
//
// Convenience overload that fixes the image dimensions to INPUT_H x INPUT_W
// and forwards to the four-argument readPGMFile overload. That overload is
// not defined in this file; presumably it is provided by common.h -- TODO
// confirm.
//
// fileName: path of the PGM file to read.
// buffer:   destination for the pixel data; the declared size is
//           INPUT_H * INPUT_W bytes.
void readPGMFile(const std::string& fileName, uint8_t buffer[INPUT_H * INPUT_W])
{
    readPGMFile(fileName, buffer, INPUT_H, INPUT_W);
}

caffe model to tensorrt

void caffeToTRTModel(const std::string& deployFilepath,       // Path of Caffe prototxt file
                     const std::string& modelFilepath,        // Path of Caffe model file
                     const std::vector& outputs, // Names of network outputs
                     unsigned int maxBatchSize,               // Note: Must be at least as large as the batch we want to run with
                     IHostMemory*& trtModelStream)            // Output buffer for the TRT model
{
    // Create builder
    IBuilder* builder = createInferBuilder(gLogger);

    // Parse caffe model to populate network, then set the outputs
    std::cout << "Reading Caffe prototxt: " << deployFilepath << "\n";
    std::cout << "Reading Caffe model: " << modelFilepath << "\n";
    INetworkDefinition* network = builder->createNetwork();
    ICaffeParser* parser = createCaffeParser();

    bool useFp16 = builder->platformHasFastFp16();
    std::cout << "platformHasFastFp16: " << useFp16 << "\n";

    bool useInt8 = builder->platformHasFastInt8();
    std::cout << "platformHasFastInt8: " << useInt8 << "\n";

    // create a 16-bit model if it's natively supported
    DataType modelDataType = useFp16 ? DataType::kHALF : DataType::kFLOAT; 
    
    const IBlobNameToTensor* blobNameToTensor = parser->parse(deployFilepath.c_str(),
                                                              modelFilepath.c_str(),
                                                              *network,
                                                              modelDataType);
    // Specify output tensors of network
    // ERROR: Network must have at least one output
    for (auto& s : outputs){
        std::cout<<"output = "<< s.c_str() << std::endl;
        network->markOutput(*blobNameToTensor->find(s.c_str())); // prob
    } 

    builder->setMaxBatchSize(maxBatchSize);
    builder->setMaxWorkspaceSize(1 << 20);

    // set up the network for paired-fp16 format if available
    if(useFp16)
        builder->setFp16Mode(true);

    // Build engine
    ICudaEngine* engine = builder->buildCudaEngine(*network);
    assert(engine);

    // Destroy parser and network
    network->destroy();
    parser->destroy();

    // Serialize engine and destroy it
    trtModelStream = engine->serialize();
    engine->destroy();
    builder->destroy();

    //shutdownProtobufLibrary();
}

pytorch onnx to tensorrt

// Builds a TensorRT engine from an ONNX model file (e.g. exported from
// PyTorch) and returns it serialized.
//
// The model is parsed as FP32. Any failure (parse error, conversion error,
// engine build failure) is logged through gLogger and terminates the process
// with EXIT_FAILURE.
//
// On success the caller owns trtModelStream and must call destroy() on it.
void onnxToTRTModel( const std::string& modelFilepath,        // name of the onnx model 
                     unsigned int maxBatchSize,            // batch size - NB must be at least as large as the batch we want to run with
                     IHostMemory *&trtModelStream)      // output buffer for the TensorRT model
{
    // create the builder
    IBuilder* builder = createInferBuilder(gLogger);

    nvonnxparser::IOnnxConfig* config = nvonnxparser::createONNXConfig();
    config->setModelFileName(modelFilepath.c_str());

    nvonnxparser::IONNXParser* parser = nvonnxparser::createONNXParser(*config);

    //Optional - uncomment below lines to view network layer information
    //config->setPrintLayerInfo(true);
    //parser->reportParsingInfo();

    if (!parser->parse(modelFilepath.c_str(), DataType::kFLOAT))
    {
        const std::string msg("failed to parse onnx file");
        gLogger.log(nvinfer1::ILogger::Severity::kERROR, msg.c_str());
        exit(EXIT_FAILURE);
    }

    if (!parser->convertToTRTNetwork())
    {
        const std::string msg("ERROR, failed to convert onnx network into TRT network");
        gLogger.log(nvinfer1::ILogger::Severity::kERROR, msg.c_str());
        exit(EXIT_FAILURE);
    }
    nvinfer1::INetworkDefinition* network = parser->getTRTNetwork();

    // Build the engine
    builder->setMaxBatchSize(maxBatchSize);
    builder->setMaxWorkspaceSize(1 << 20);

    // An explicit check is used instead of assert() so that a failed build is
    // still caught when NDEBUG disables assertions.
    ICudaEngine* engine = builder->buildCudaEngine(*network);
    if (engine == nullptr)
    {
        const std::string msg("failed to build engine from onnx model");
        gLogger.log(nvinfer1::ILogger::Severity::kERROR, msg.c_str());
        exit(EXIT_FAILURE);
    }

    // we don't need the network any more, and we can destroy the parser;
    // the config is released after the parser that was created from it.
    network->destroy();
    parser->destroy();
    config->destroy();

    // serialize the engine, then close everything down
    trtModelStream = engine->serialize();
    engine->destroy();
    builder->destroy();

    //shutdownProtobufLibrary();
}

do inference

// Runs one batch through the engine behind `context`.
//
// input:     host buffer holding batchSize * INPUT_H * INPUT_W floats.
// output:    host buffer receiving batchSize * OUTPUT_SIZE floats.
// batchSize: number of images in the batch.
//
// The engine must expose exactly two bindings, one input and one output; they
// are located by iterating over the bindings rather than by blob name. Device
// buffers and the CUDA stream are created and released on every call.
void doInference(IExecutionContext& context, float* input, float* output, int batchSize)
{
    const ICudaEngine& engine = context.getEngine();
    // Pointers to input and output device buffers to pass to engine.
    // Engine requires exactly IEngine::getNbBindings() number of buffers.
    assert(engine.getNbBindings() == 2);
    void* buffers[2];

    // Start from an invalid index so a missing input or output binding is
    // detected instead of indexing `buffers` with an uninitialized value.
    int inputIndex = -1;
    int outputIndex = -1;

    printf("Bindings after deserializing:\n");
    for (int bi = 0; bi < engine.getNbBindings(); ++bi)
    {
        if (engine.bindingIsInput(bi))
        {
            inputIndex = bi;
            printf("Binding %d (%s): Input.\n",  bi, engine.getBindingName(bi));
        }
        else
        {
            outputIndex = bi;
            printf("Binding %d (%s): Output.\n", bi, engine.getBindingName(bi));
        }
    }

    //const int inputIndex = engine.getBindingIndex(INPUT_BLOB_NAME);
    //const int outputIndex = engine.getBindingIndex(OUTPUT_BLOB_NAME);

    std::cout<<"inputIndex = "<< inputIndex << std::endl; // 0   data
    std::cout<<"outputIndex = "<< outputIndex << std::endl; // 1  prob

    if (inputIndex < 0 || outputIndex < 0)
    {
        fprintf(stderr, "engine must have one input and one output binding\n");
        exit(EXIT_FAILURE);
    }

    const size_t inputBytes = batchSize * INPUT_H * INPUT_W * sizeof(float);
    const size_t outputBytes = batchSize * OUTPUT_SIZE * sizeof(float);

    // Create GPU buffers on device
    CHECK(cudaMalloc(&buffers[inputIndex], inputBytes));
    CHECK(cudaMalloc(&buffers[outputIndex], outputBytes));

    // Create stream
    cudaStream_t stream;
    CHECK(cudaStreamCreate(&stream));

    // DMA input batch data to device, infer on the batch asynchronously, and DMA output back to host
    CHECK(cudaMemcpyAsync(buffers[inputIndex], input, inputBytes, cudaMemcpyHostToDevice, stream));
    if (!context.enqueue(batchSize, buffers, stream, nullptr))
    {
        fprintf(stderr, "failed to enqueue inference batch\n");
    }
    CHECK(cudaMemcpyAsync(output, buffers[outputIndex], outputBytes, cudaMemcpyDeviceToHost, stream));
    // The host output buffer is only valid once the stream has drained.
    CHECK(cudaStreamSynchronize(stream));

    // Release stream and buffers
    CHECK(cudaStreamDestroy(stream));
    CHECK(cudaFree(buffers[inputIndex]));
    CHECK(cudaFree(buffers[outputIndex]));
}

save and load engine

// Writes a serialized TensorRT engine to `engine_filepath` as a binary file.
//
// trtModelStream:  serialized engine (as produced by ICudaEngine::serialize()).
// engine_filepath: destination path; an existing file is overwritten.
//
// The function returns void, so failures to create or write the file are
// reported on std::cerr only.
void SaveEngine(const nvinfer1::IHostMemory& trtModelStream, const std::string& engine_filepath)
{
    std::ofstream file(engine_filepath, std::ios::binary | std::ios::out);
    if (!file.is_open())
    {
        std::cerr << "create engine file " << engine_filepath << " failed" << std::endl;
        return;
    }

    file.write(static_cast<const char*>(trtModelStream.data()),
               static_cast<std::streamsize>(trtModelStream.size()));
    file.close();

    // close() flushes the buffer, so a short or failed write shows up here.
    if (!file)
    {
        std::cerr << "write engine file " << engine_filepath << " failed" << std::endl;
    }
}


// Reads a serialized engine from `engine_filepath` and deserializes it with
// `runtime`.
//
// Returns the deserialized engine, which the caller must destroy(). Returns
// nullptr, after printing a message to std::cerr, when the file cannot be
// opened, is empty, or cannot be read completely.
ICudaEngine* LoadEngine(IRuntime& runtime, const std::string& engine_filepath)
{
    // Open positioned at the end so tellg() yields the file size directly.
    std::ifstream file(engine_filepath, std::ios::binary | std::ios::in | std::ios::ate);
    if (!file.is_open())
    {
        std::cerr << "open engine file " << engine_filepath << " failed" << std::endl;
        return nullptr;
    }

    const std::streamsize length = static_cast<std::streamsize>(file.tellg());
    if (length <= 0)
    {
        // tellg() reports -1 on failure; a negative size must never reach the allocation.
        std::cerr << "engine file " << engine_filepath << " is empty or unreadable" << std::endl;
        return nullptr;
    }
    file.seekg(0, std::ios::beg);

    std::vector<char> data(static_cast<std::size_t>(length));
    if (!file.read(data.data(), length))
    {
        std::cerr << "read engine file " << engine_filepath << " failed" << std::endl;
        return nullptr;
    }
    file.close();

    // runtime->deserializeCudaEngine(trtModelStream->data(), trtModelStream->size(), nullptr);
    ICudaEngine* engine = runtime.deserializeCudaEngine(data.data(), data.size(), nullptr);
    assert(engine != nullptr);
    return engine;
}

example

void demo_save_caffe_to_trt(const std::string& engine_filepath)
{
    std::string deploy_filepath = mnist_data_dir   "mnist.prototxt";
    std::string model_filepath = mnist_data_dir   "mnist.caffemodel";
    
     // Create TRT model from caffe model and serialize it to a stream
    IHostMemory* trtModelStream{nullptr};
    caffeToTRTModel(deploy_filepath, model_filepath, std::vector{OUTPUT_BLOB_NAME}, 1, trtModelStream);
    assert(trtModelStream != nullptr);

    SaveEngine(*trtModelStream, engine_filepath);

    // destroy stream
    trtModelStream->destroy();
}


// Converts the MNIST ONNX model found under mnist_data_dir into a TensorRT
// engine (max batch size 1) and saves the serialized engine to
// `engine_filepath`.
void demo_save_onnx_to_trt(const std::string& engine_filepath)
{
    const std::string onnx_filepath = mnist_data_dir + "mnist.onnx";

    // Create TRT model from onnx model and serialize it to a stream
    IHostMemory* trtModelStream{nullptr};
    onnxToTRTModel(onnx_filepath, 1, trtModelStream);
    assert(trtModelStream != nullptr);

    SaveEngine(*trtModelStream, engine_filepath);

    // destroy stream
    trtModelStream->destroy();
}


int mnist_demo()
{
    bool use_caffe = false; 
    std::string engine_filepath;
    if (use_caffe){
        engine_filepath = "cfg/mnist/caffe_minist_fp32.trt";
        demo_save_caffe_to_trt(engine_filepath);
    } else {
        engine_filepath = "cfg/mnist/onnx_minist_fp32.trt";
        demo_save_onnx_to_trt(engine_filepath);
    }
    std::cout<<"[API] Save engine to "<< engine_filepath <parseBinaryProto(mean_filepath.c_str());
        parser->destroy();

        // Subtract mean from image
        const float* meanData = reinterpret_cast(meanBlob->getData()); // size 786

        for (int i = 0; i < INPUT_H * INPUT_W; i  )
            data[i] = float(fileData[i]) - meanData[i];
        
        meanBlob->destroy();
    } else {

        for (int i = 0; i < INPUT_H * INPUT_W; i  )
            data[i] = 1.0 - float(fileData[i]/255.0);
    }
    

    // Deserialize engine we serialized earlier
    IRuntime* runtime = createInferRuntime(gLogger);
    assert(runtime != nullptr);

    std::cout<<"[API] Load engine from "<< engine_filepath <createExecutionContext();
    assert(context != nullptr);

    // Run inference on input data
    float prob[OUTPUT_SIZE];
    doInference(*context, data, prob, 1);

    // Destroy the engine
    context->destroy();
    engine->destroy();
    runtime->destroy();

    // Print histogram of the output distribution
    std::cout << "\nOutput:\n\n";

    // for onnx,we get z as output, we need to use softmax to get probs
    if ( !use_caffe){

        //Calculate Softmax
        float sum{0.0f};
        for(int i = 0; i < OUTPUT_SIZE; i  )
        {
            prob[i] = exp(prob[i]);
            sum  = prob[i];
        }
        for(int i = 0; i < OUTPUT_SIZE; i  )
        {
            prob[i] /= sum;
        }
    }
    
    // find max probs
    float val{0.0f};
    int idx{0};
    for (unsigned int i = 0; i < 10; i  )
    {
        val = std::max(val, prob[i]);
        if (val == prob[i]) {
            idx = i;
        }
        cout << " Prob " << i << "  "<< std::fixed << std::setw(5) << std::setprecision(4) << prob[i];
        std::cout << i << ": " << std::string(int(std::floor(prob[i] * 10   0.5f)), '*') << "\n";
    }
    std::cout << std::endl;

    return (idx == num && val > 0.9f) ? EXIT_SUCCESS : EXIT_FAILURE;
}


// Program entry point: runs the MNIST demo and uses its status as the process
// exit code, so a wrong or low-confidence prediction is visible to the caller.
// Command-line arguments are not used.
int main(int argc, char** argv)
{
    (void)argc;
    (void)argv;
    return mnist_demo();
}

results

./bin/sample_mnist 
[API] Save engine to cfg/mnist/onnx_minist_fp32.trt
[API] Load engine from cfg/mnist/onnx_minist_fp32.trt
Bindings after deserializing:
Binding 0 (Input3): Input.
Binding 1 (Plus214_Output_0): Output.
inputIndex = 0
outputIndex = 1

Output:

 Prob 0  0.00000: 
 Prob 1  0.00001: 
 Prob 2  0.00002: 
 Prob 3  0.00003: 
 Prob 4  0.00004: 
 Prob 5  0.00005: 
 Prob 6  1.00006: **********
 Prob 7  0.00007: 
 Prob 8  0.00008: 
 Prob 9  0.00009:

Reference

tensorrt-api

History

20190422 created.

Copyright

Post author: kezunlin
Post link: https://kezunlin.me/post/bcdfb73c/
Copyright Notice: All articles in this blog are licensed under CC BY-NC-SA 3.0 unless stating additionally.

Windows 10上源码编译glog和gflags 编写glog-config.cmake和gflags-config.cmake kezunlin kezunlin.me
本文首发于个人博客https://kezunlin.me/post/bb64e398/，欢迎阅读!compileglogv0.3.5andglagsonwindowsfromsource.Seriescompileglogandglagsonwindowscompileglogandglagsonubuntu16.04Guideversionglog:v0.3.5https://github.co
ubuntu 16.04上源码编译glog和gflags 编写glog-config.cmake和gflags-config.cmake kezunlin kezunlin.me
本文首发于个人博客https://kezunlin.me/post/977f5125/，欢迎阅读!compileglogandglagsonubuntu16.04Seriescompileglogandglagsonwindowscompileglogandglagsonubuntu16.04Guideversionwgethttps://github.com/schuhschuh/gflags/
ubuntu 16.04源码编译OpenCV教程 | compile opencv on ubuntu 16.04 kezunlin kezunlin.me
本文首发于个人博客https://kezunlin.me/post/15f5c3e8/，欢迎阅读!compileopencvonubuntu16.04SeriesPart1:compileopencvonubuntu16.04Part2:compileopencvwithCUDAsupportonwindows10Part3:opencvmatforloopPart4:speedupopencvi
Ubuntu 16.04源码编译boost库编写CMakeLists.txt | compile boost 1.66.0 from source on ubuntu 16.04 kezunlin kezunlin.me
本文首发于个人博客https://kezunlin.me/post/d5d4a460/，欢迎阅读!compileboost1.66.0fromsourceonubuntu16.04Guideapt-get#1.58forubuntu16.04sudoapt-getinstalllibboost-all-devcompilefromsourcesudoapt-get-ypurgelibboost-a
windows 10使用vscode进行远程代码开发 | tutorial to use vscode for remote development using ssh on windows kezunlin kezunlin.me
本文首发于个人博客https://kezunlin.me/post/c93b6ba6/，欢迎阅读最新内容！tutorialtousevscodeforremotedevelopmentusingsshonwindowsGuideserversudoapt-getinstallopenssh-serverlocalinstallssh-clientonlocalmachine.downloadVSC
Ubuntu 16.04安装ROS Kinetic详细教程 | Tutorial to Install ROS Kinetic on Ubuntu 16.04 kezunlin kezunlin.me ros
本文首发于个人博客https://kezunlin.me/post/e2780b93/，欢迎阅读!TutorialtoInstallandConfigureROSKineticonUbuntu16.04.ROSreleaseROSversionUbuntuversion2016.3ROSKineticKameUbuntu16.04(Xenial)/Ubuntu15.10InstallGuidequ
使用TensorRT对caffe和pytorch onnx模型进行fp32和fp16推理 kezunlin kezunlin.me
本文首发于个人博客https://kezunlin.me/post/bcdfb73c/，欢迎阅读最新内容！tensorrtfp32fp16tutorialwithcaffepytorchministmodelSeriesPart1:installandconfiguretensorrt4onubuntu16.04Part2:tensorrtfp32fp16tutorialPart3:tensorr
keras EfficientNet介绍，在ImageNet任务上涨点明显 | keras efficientnet introduction kezunlin kezunlin.me
本文首发于个人博客https://kezunlin.me/post/88fbc049/，欢迎阅读最新内容！kerasefficientnetintroductionGuideAboutEfficientNetModelscomparedwithresnet50,EfficientNet-B4improvesthetop-1accuracyfrom76.3%ofResNet-50to82.6%(6.
C 中自定义类2种自增运算的代码实现和区别 kezunlin kezunlin.me
本文首发于个人博客https://kezunlin.me/post/caef83a3/，欢迎阅读最新内容！cppivsiforuserdefinedclassGuidecode#include#include#include#include#includeusingnamespacestd;classInteger{public:Integer(intvalue):v(value){cout<<"
如何使用resty命令行客户端和http rest服务进行交互 kezunlin kezunlin.me
本文首发于个人博客https://kezunlin.me/post/4f5f98b9/，欢迎阅读最新内容！howtoinstallanduserestycommandlineclientforinteractingwithrestservicesGuideinstallYouhavecurl,right?Okay.curl-Lhttps://raw.githubusercontent.com/mi
python有用代码合集旋转图像/base64图像编码/json序列化/request爬取网页等 kezunlin kezunlin.me
本文首发于个人博客https://kezunlin.me/post/77697d8d/，欢迎阅读最新内容！pythonusefultoolsandcodesnippetsGuideflipimportcv2image=cv2.imread("demo.jpg")#FlippedHorizontally水平翻转h_flip=cv2.flip(image,1)cv2.imwrite("demo-h.j
C 中如何使用CUDA进行高性能大规模矩阵乘法运算？ kezunlin kezunlin.me
本文首发于个人博客https://kezunlin.me/post/ad5c5bd9/，欢迎阅读最新内容！cublasSgemmforlargematrixmultiplicationongpuinCGuidePart1:cppcudaprogrammingtutorialPart2:cudaactivationkernelsPart3:cublasSgemmforlargematrixmulti
ubuntu 16.04 上使用pybind11进行C 和Python代码相互调用 | Interfacing C and Python kezunlin kezunlin.me
本文首发于个人博客https://kezunlin.me/post/a41adc1/，欢迎阅读!InterfacingCandPythonwithpybind11onubuntu16.04SeriesPart1:InterfacingCandPythonwithpybind11onwindows10Part2:InterfacingCandPythonwithpybind11onubuntu16.
C 中如何使用CUDA自己实现常用的深度学习激活函数？ kezunlin kezunlin.me
本文首发于个人博客https://kezunlin.me/post/ee123cac/，欢迎阅读最新内容！howtoimplementdeeplearningactivationkernelswithcudaincGuidePart1:cppcudaprogrammingtutorialPart2:cudaactivationkernelsPart3:cublasSgemmforlargematr
ubuntu 16.04上源码编译和安装cgal并编写CMakeLists.txt | compile and install cgal on ubuntu 16.04 kezunlin kezunlin.me
本文首发于个人博客https://kezunlin.me/post/39ab7ed9/，欢迎阅读最新内容！compileandinstallcgalonubuntu16.04Guideversion:4.13.1installwgethttps://github.com/CGAL/cgal/releases/download/releases/CGAL-4.13.1/CGAL-4.13.1.zip
Ubuntu 16.04上源码编译和安装pytorch教程，并编写C Demo CMakeLists.txt kezunlin kezunlin.me
本文首发于个人博客https://kezunlin.me/post/54e7a3d8/，欢迎阅读最新内容！tutorialtocompileandusepytorchonubuntu16.04PyTorchforPythoninstallpytorchfromanacondacondainfo--envscondaactivatepy35#newestversion#1.1.0pytorch/0.
keras RAdam优化器使用教程， keras加载模型包含自定义优化器报错如何解决？ kezunlin kezunlin.me
本文首发于个人博客https://kezunlin.me/post/c691f02b/，欢迎阅读最新内容！pythonkerasRAdamtutorialandloadcustomoptimizerwithCustomObjectScopeRAdamusageimportkerasimportnumpyasnpfromkeras_radamimportRAdam#Buildtoymodelwith
Ubuntu网络network eth0配置 | ubuntu network configuration kezunlin kezunlin.me
本文首发于个人博客https://kezunlin.me/post/5076bc45/，欢迎阅读!ubuntunetworkconfigurationGuidenetworkproxySystemwide:Network--->None/Manualchrome:cannotsetfirefox:about:preferences--->NetworkProxyeth0configrenamexx
keras对图像数据进行增强 | keras data augmentation kezunlin kezunlin.me
本文首发于个人博客https://kezunlin.me/post/8db507ff/，欢迎阅读最新内容！kerasdataaugmentationGuidecode#importthenecessarypackagesfromkeras.preprocessing.imageimportImageDataGeneratorfromkeras.preprocessing.imageimportim
如何编译和使用自定义Qt动态链接库 | how to build and use user-defined qt library kezunlin
本文首发于个人博客https://kezunlin.me/post/cf628dd8/，欢迎阅读!guidetobuildqtlibraryanduseinanotherprojectGuidebuildqtlibraryQObjectclassclassSHARED_EXPORTCameraGrabber:publicQObject{Q_OBJECTsignals:voidsendFrameTr
C++中如何使用CUDA进行高性能大规模矩阵乘法运算 kezunlin c++
本文首发于个人博客https://kezunlin.me/post/ad5c5bd9/，欢迎阅读最新内容！cublasSgemmforlargematrixmultiplicationongpuinC++GuidePart1:cppcudaprogrammingtutorialPart2:cudaactivationkernelsPart3:cublasSgemmforlargematrixmul
C++中如何使用CUDA自己实现常用的深度学习激活函数？ kezunlin c++
本文首发于个人博客https://kezunlin.me/post/ee123cac/，欢迎阅读最新内容！howtoimplementdeeplearningactivationkernelswithcudainc++GuidePart1:cppcudaprogrammingtutorialPart2:cudaactivationkernelsPart3:cublasSgemmforlargema
caffe和pytorch如何从文件file和流stream中导入模型? kezunlin 深度学习
本文首发于个人博客https://kezunlin.me/post/5898412/，欢迎阅读最新内容！loadmodelfromfileandstreamforcaffeandpytorchGuidecaffeloadfromfileenumcaffe::Phasephase=caffe::Phase::TEST;std::stringproto_filepath="yolov3.prototx
如何在动态链接库dll/so中导出自定义的模板类template class kezunlin c++
本文首发于个人博客https://kezunlin.me/post/4ec4ae49/，欢迎阅读最新内容！howtoimplementatemplateclasswithc++andexportindll/soGuidequestions模板类必须在header中实现，而不能在cpp中实现，否则作为dll调用进行链接的时候回出错。commonsolutions(Recommend)implemen
5种智能指针指向数组的方法 kezunlin c++
本文首发于个人博客https://kezunlin.me/post/b82753fc/，欢迎阅读最新内容！5methodsforc++shared_ptrpointtoanarrayGuideshared_ptrPriortoC++17,shared_ptrcouldnotbeusedtomanagedynamicallyallocatedarrays.Bydefault,shared_ptrwi
nlohmann 最优秀的C++序列化工具库详细入门教程 kezunlin c++
本文首发于个人博客https://kezunlin.me/post/f3c3eb8/，欢迎阅读最新内容！tutorialtousenlohmannjsonforserializingdatawithmoderncppGuideinclude#include//forconvenienceusingjson=nlohmann::json;compilewith-std=c++11CMakeLists
C++ 如何用百行代码实现线程安全的并发队列 | concurrent queue kezunlin c++
本文首发于个人博客https://kezunlin.me/post/cabccf5c/，欢迎阅读最新内容！concurrentqueueorblockingqueueimplementedincppGuideintroductionWhereproduce-consumerpatternispresentitisoftenthecasethatoneisfasterthattheother:apa
你的首个golang语言详细入门教程 | your first golang tutorial kezunlin golang
本文首发于个人博客https://kezunlin.me/post/a0fb7f06/，欢迎阅读最新内容！yourfirstgolangtutorialgotutorialversions:go:1.13.1installwgethttps://dl.google.com/go/go1.13.1.linux-amd64.tar.gzsudotar-C/usr/local-xzfgo1.13.1.l
如何使用1行代码让你的C++程序控制台输出彩色log信息 kezunlin c++
本文首发于个人博客https://kezunlin.me/post/a201e11b/，欢迎阅读最新内容！colorwheelforcoloredprintandtraceforcppprogramsGuideinstallsudowget-O/usr/include/colorwheel.hhttps://raw.githubusercontent.com/Totoditoto/colorwhe
C++如何使用宏定义来简化代码性能测试 kezunlin c++
本文首发于个人博客https://kezunlin.me/post/65dc693d/，欢迎阅读最新内容！cppmacrolikefunctiontoimplementaperformanceprofilerGuidemacroexpansionsname===>quoteasstrings"xxx"name,name===>xxxa##b===>concatenatetheprecedingan
Js函数返回值 _wy_ js return
一、返回控制与函数结果，语法为：return 表达式;作用: 结束函数执行，返回调用函数，而且把表达式的值作为函数的结果二、返回控制语法为：return;作用: 结束函数执行，返回调用函数，而且把undefined作为函数的结果在大多数情况下,为事件处理函数返回false,可以防止默认的事件行为.例如,默认情况下点击一个<a>元素,页面会跳转到该元素href属性
MySQL 的 char 与 varchar bylijinnan mysql
今天发现，create table 时，MySQL 4.1有时会把 char 自动转换成 varchar 测试举例： CREATE TABLE `varcharLessThan4` ( `lastName` varchar(3) ) ; mysql> desc varcharLessThan4; +----------+---------+------+-
Quartz——TriggerListener和JobListener eksliang TriggerListener JobListener quartz
转载请出自出处：http://eksliang.iteye.com/blog/2208624 一.概述 listener是一个监听器对象，用于监听scheduler中发生的事件，然后执行相应的操作；你可能已经猜到了，TriggerListeners接受与trigger相关的事件，JobListeners接受与jobs相关的事件。二.JobListener监听器 j
oracle层次查询 18289753290 oracle；层次查询；树查询
.oracle层次查询(connect by) oracle的emp表中包含了一列mgr指出谁是雇员的经理，由于经理也是雇员，所以经理的信息也存储在emp表中。这样emp表就是一个自引用表，表中的mgr列是一个自引用列，它指向emp表中的empno列，mgr表示一个员工的管理者， select empno,mgr,ename,sal from e
通过反射把map中的属性赋值到实体类bean对象中酷的飞上天空 javaee 泛型类型转换
使用过struts2后感觉最方便的就是这个框架能自动把表单的参数赋值到action里面的对象中但现在主要使用Spring框架的MVC，虽然也有@ModelAttribute可以使用但是明显感觉不方便。好吧，那就自己再造一个轮子吧。原理都知道，就是利用反射进行字段的赋值，下面贴代码主要类如下： import java.lang.reflect.Field; imp
SAP HANA数据存储：传统硬盘的瓶颈问题蓝儿唯美 HANA
SAPHANA平台有各种各样的应用场景，这也意味着客户的实施方法有许多种选择，关键是如何挑选最适合他们需求的实施方案。在《Implementing SAP HANA》这本书中，介绍了SAP平台在现实场景中的运作原理，并给出了实施建议和成功案例供参考。本系列文章节选自《Implementing SAP HANA》，介绍了行存储和列存储的各自特点，以及SAP HANA的数据存储方式如何提升空间压
Java Socket 多线程实现文件传输随便小屋 java socket
高级操作系统作业，让用Socket实现文件传输，有些代码也是在网上找的，写的不好，如果大家能用就用上。客户端类： package edu.logic.client; import java.io.BufferedInputStream; import java.io.Buffered
java初学者路径 aijuans java
学习Java有没有什么捷径?要想学好Java，首先要知道Java的大致分类。自从Sun推出Java以来，就力图使之无所不包，所以Java发展到现在，按应用来分主要分为三大块：J2SE,J2ME和J2EE,这也就是Sun ONE(Open Net Environment)体系。J2SE就是Java2的标准版，主要用于桌面应用软件的编程；J2ME主要应用于嵌入是系统开发，如手机和PDA的编程；J2EE
APP推广 aoyouzi APP 推广
一，免费篇 1，APP推荐类网站自主推荐最美应用、酷安网、DEMO8、木蚂蚁发现频道等,如果产品独特新颖，还能获取最美应用的评测推荐。PS：推荐简单。只要产品有趣好玩，用户会自主分享传播。例如足迹APP在最美应用推荐一次，几天用户暴增将服务器击垮。 2，各大应用商店首发合作老实盯着排期，多给应用市场官方负责人献殷勤。 3，论坛贴吧推广百度知道，百度贴吧，猫扑论坛，天涯社区，豆瓣（
JSP转发与重定向百合不是茶 jsp servlet Java Web jsp转发
在servlet和jsp中我们经常需要请求,这时就需要用到转发和重定向; 转发包括;forward和include 例子;forwrad转发; 将请求装法给reg.html页面关键代码; req.getRequestDispatcher("reg.html
web.xml之jsp-config bijian1013 java web.xml servlet jsp-config
1.作用：主要用于设定JSP页面的相关配置。 2.常见定义： <jsp-config> <taglib> <taglib-uri>URI(定义TLD文件的URI,JSP页面的tablib命令可以经由此URI获取到TLD文件)</tablib-uri> <taglib-location> TLD文件所在的位置
JSF2.2 ViewScoped Using CDI sunjing CDI JSF 2.2 ViewScoped
JSF 2.0 introduced annotation @ViewScoped; A bean annotated with this scope maintained its state as long as the user stays on the same view(reloads or navigation - no intervening views). One problem w
【分布式数据一致性二】Zookeeper数据读写一致性 bit1129 zookeeper
很多文档说Zookeeper是强一致性保证，事实不然。关于一致性模型请参考http://bit1129.iteye.com/blog/2155336 Zookeeper的数据同步协议 Zookeeper采用称为Quorum Based Protocol的数据同步协议。假如Zookeeper集群有N台Zookeeper服务器(N通常取奇数，3台能够满足数据可靠性同时
Java开发笔记白糖_ java开发
1、Map<key,value>的remove方法只能识别相同类型的key值 Map<Integer,String> map = new HashMap<Integer,String>(); map.put(1,"a"); map.put(2,"b"); map.put(3,"c"
图片黑色阴影 bozch 图片
.event{ padding:0; width:460px; min-width: 460px; border:0px solid #e4e4e4; height: 350px; min-heig
编程之美-饮料供货-动态规划 bylijinnan 动态规划
import java.util.Arrays; import java.util.Random; public class BeverageSupply { /** * 编程之美饮料供货 * 设Opt（V’，i）表示从i到n-1种饮料中，总容量为V’的方案中，满意度之和的最大值。 * 那么递归式就应该是：Opt（V’，i）=max{ k * Hi+Op
ajax大参数（大数据）提交性能分析 chenbowen00 Web Ajax 框架浏览器 prototype
近期在项目中发现如下一个问题项目中有个提交现场事件的功能，该功能主要是在web客户端保存现场数据（主要有截屏，终端日志等信息）然后提交到服务器上方便我们分析定位问题。客户在使用该功能的过程中反应点击提交后反应很慢，大概要等10到20秒的时间浏览器才能操作，期间页面不响应事件。根据客户描述分析了下的代码流程，很简单，主要通过OCX控件截屏，在将前端的日志等文件使用OCX控件打包，在将之转换为
[宇宙与天文]在太空采矿,在太空建造 comsci
我们在太空进行工业活动...但是不太可能把太空工业产品又运回到地面上进行加工,而一般是在哪里开采,就在哪里加工,太空的微重力环境,可能会使我们的工业产品的制造尺度非常巨大.... 地球上制造的最大工业机器是超级油轮和航空母舰,再大些就会遇到困难了,但是在空间船坞中,制造的最大工业机器,可能就没
ORACLE中CONSTRAINT的四对属性 daizj oracle CONSTRAINT
ORACLE中CONSTRAINT的四对属性 summary:在data migrate时,某些表的约束总是困扰着我们,让我们的migratet举步维艰,如何利用约束本身的属性来处理这些问题呢?本文详细介绍了约束的四对属性: Deferrable/not deferrable, Deferred/immediate, enalbe/disable, validate/novalidate,以及如
Gradle入门教程 dengkane gradle
一、寻找gradle的历程一开始的时候，我们只有一个工程，所有要用到的jar包都放到工程目录下面，时间长了，工程越来越大，使用到的jar包也越来越多，难以理解jar之间的依赖关系。再后来我们把旧的工程拆分到不同的工程里，靠ide来管理工程之间的依赖关系，各工程下的jar包依赖是杂乱的。一段时间后，我们发现用ide来管理项程很不方便，比如不方便脱离ide自动构建，于是我们写自己的ant脚本。再后
C语言简单循环示例 dcj3sjt126com c
# include <stdio.h> int main(void) { int i; int count = 0; int sum = 0; float avg; for (i=1; i<=100; i++) { if (i%2==0) { count++; sum += i; } } avg
presentModalViewController 的动画效果 dcj3sjt126com controller
系统自带(四种效果)： presentModalViewController模态的动画效果设置： [cpp] view plain copy UIViewController *detailViewController = [[UIViewController al
java 二分查找 shuizhaosi888 二分查找 java二分查找
需求：在排好顺序的一串数字中，找到数字T 一般解法：从左到右扫描数据，其运行花费线性时间O(N)。然而这个算法并没有用到该表已经排序的事实。 /** * * @param array * 顺序数组 * @param t * 要查找对象 * @return */ public stati
Spring Security（07）——缓存UserDetails 234390216 ehcache 缓存 Spring Security
Spring Security提供了一个实现了可以缓存UserDetails的UserDetailsService实现类，CachingUserDetailsService。该类的构造接收一个用于真正加载UserDetails的UserDetailsService实现类。当需要加载UserDetails时，其首先会从缓存中获取，如果缓存中没
Dozer 深层次复制 jayluns VO maven po
最近在做项目上遇到了一些小问题，因为架构在做设计的时候web前段展示用到了vo层，而在后台进行与数据库层操作的时候用到的是Po层。这样在业务层返回vo到控制层，每一次都需要从po-->转化到vo层，用到BeanUtils.copyProperties(source, target)只能复制简单的属性，因为实体类都配置了hibernate那些关联关系，所以它满足不了现在的需求，但后发现还有个很
CSS规范整理（摘自懒人图库） a409435341 html UI css 浏览器
刚没事闲着在网上瞎逛，找了一篇CSS规范整理，粗略看了一下后还蛮有一定的道理，并自问是否有这样的规范，这也是初入前端开发的人一个很好的规范吧。一、文件规范 1、文件均归档至约定的目录中。具体要求通过豆瓣的CSS规范进行讲解：所有的CSS分为两大类：通用类和业务类。通用的CSS文件，放在如下目录中：基本样式库 /css/core
C++动态链接库创建与使用你不认识的休道人 C++dll
一、创建动态链接库 1.新建工程test中选择”MFC [dll]”dll类型选择第二项"Regular DLL With MFC shared linked"，完成 2.在test.h中添加 extern “C” 返回类型 _declspec(dllexport)函数名(参数列表); 3.在test.cpp中最后写 extern “C” 返回类型 _decls
Android代码混淆之ProGuard rensanning ProGuard
Android应用的Java代码，通过反编译apk文件（dex2jar、apktool）很容易得到源代码，所以在release版本的apk中一定要混淆一下一些关键的Java源码。 ProGuard是一个开源的Java代码混淆器（obfuscation）。ADT r8开始它被默认集成到了Android SDK中。官网： http://proguard.sourceforge.net/
程序员在编程中遇到的奇葩弱智问题 tomcat_oracle jquery 编程 ide
　　现在收集一下：　　排名不分先后，按照发言顺序来的。 1、Jquery插件一个通用函数一直报错，尤其是很明显是存在的函数，很有可能就是你没有引入jquery。。。或者版本不对 2、调试半天没变化：不在同一个文件中调试。这个很可怕，我们很多时候会备份好几个项目，改完发现改错了。有个群友说的好：在汤匙
解决maven-dependency-plugin (goals "copy-dependencies","unpack") is not supported xp9802 dependency
解决办法：在plugins之前添加如下pluginManagement，二者前后顺序如下： [html] view plain copy <build> <pluginManagement

使用TensorRT对caffe和pytorch onnx模型进行fp32和fp16推理

Series

Code Example

include headers

caffe model to tensorrt

pytorch onnx to tensorrt

do inference

save and load engine

example

results

Reference

History

Copyright

你可能感兴趣的:(kezunlin.me)