当前位置：首页 > 编程日记 > 正文

TensorRT Samples: GoogleNet

编程日记 2024-12-20 13:50:00

关于TensorRT的介绍可以参考： http://blog.csdn.net/fengbingchun/article/details/78469551

以下是参考TensorRT 2.1.2中的sampleGoogleNet.cpp文件改写的测试代码，文件(googlenet.cpp)内容如下：

#include <iostream>
#include <tuple>
#include <string>
#include <vector>
#include <algorithm>#include <cuda_runtime_api.h>
#include <NvInfer.h>
#include <NvCaffeParser.h>#include "common.hpp"// reference: TensorRT-2.1.2/samples/sampleMNIST/sampleGoogleNet.cppnamespace {
// batch size, timing iterations, input blob name, output blob name, deploy file, model file
typedef std::tuple<int, int, std::string, std::string, std::string , std::string> DATA_INFO;  struct Profiler : public nvinfer1::IProfiler {typedef std::pair<std::string, float> Record;std::vector<Record> mProfile;int timing_iterations {1};void setTimeIterations(int iteration){timing_iterations = iteration;}virtual void reportLayerTime(const char* layerName, float ms){auto record = std::find_if(mProfile.begin(), mProfile.end(), [&](const Record& r){ return r.first == layerName; });if (record == mProfile.end())mProfile.push_back(std::make_pair(layerName, ms));elserecord->second += ms;}void printLayerTimes(){float totalTime = 0;for (size_t i = 0; i < mProfile.size(); ++i) {fprintf(stdout, "%s %4.3fms\n", mProfile[i].first.c_str(), mProfile[i].second / timing_iterations);totalTime += mProfile[i].second;}fprintf(stdout, "Time over all layers: %4.3f\n", totalTime / timing_iterations);}};int caffeToGIEModel(const std::string& deployFile,		// name for caffe prototxtconst std::string& modelFile,				// name for model const std::vector<std::string>& outputs,   // network outputsunsigned int maxBatchSize,					// batch size - NB must be at least as large as the batch we want to run with)nvinfer1::IHostMemory *&gieModelStream, Logger logger)
{// create API root class - must span the lifetime of the engine usagenvinfer1::IBuilder* builder = nvinfer1::createInferBuilder(logger);nvinfer1::INetworkDefinition* network = builder->createNetwork();// parse the caffe model to populate the network, then set the outputsnvcaffeparser1::ICaffeParser* parser = nvcaffeparser1::createCaffeParser();bool useFp16 = builder->platformHasFastFp16();nvinfer1::DataType modelDataType = useFp16 ? nvinfer1::DataType::kHALF : nvinfer1::DataType::kFLOAT; // create a 16-bit model if it's natively supportedconst nvcaffeparser1::IBlobNameToTensor* blobNameToTensor = parser->parse(deployFile.c_str(), modelFile.c_str(), *network, modelDataType);CHECK(blobNameToTensor != nullptr);// the caffe file has no notion of outputs, so we need to manually say which tensors the engine should generate	for (auto& s : outputs)network->markOutput(*blobNameToTensor->find(s.c_str()));// Build the enginebuilder->setMaxBatchSize(maxBatchSize);builder->setMaxWorkspaceSize(16 << 20);// set up the network for paired-fp16 format if availableif(useFp16)builder->setHalf2Mode(true);nvinfer1::ICudaEngine* engine = builder->buildCudaEngine(*network);CHECK(engine != nullptr);// we don't need the network any more, and we can destroy the parsernetwork->destroy();parser->destroy();// serialize the engine, then close everything downgieModelStream = engine->serialize();engine->destroy();builder->destroy();nvcaffeparser1::shutdownProtobufLibrary();return 0;
}int timeInference(nvinfer1::ICudaEngine* engine, const DATA_INFO& info, Profiler* profiler)
{// input and output buffer pointers that we pass to the engine - the engine requires exactly ICudaEngine::getNbBindings(),// of these, but in this case we know that there is exactly one input and one output.CHECK(engine->getNbBindings() == 2);void* buffers[2];// In order to bind the buffers, we need to know the names of the input and output tensors.// note that indices are guaranteed to be less than ICudaEngine::getNbBindings()int inputIndex = engine->getBindingIndex(std::get<2>(info).c_str()), outputIndex = engine->getBindingIndex(std::get<3>(info).c_str());// allocate GPU buffersnvinfer1::DimsCHW inputDims = static_cast<nvinfer1::DimsCHW&&>(engine->getBindingDimensions(inputIndex)), outputDims = static_cast<nvinfer1::DimsCHW&&>(engine->getBindingDimensions(outputIndex));size_t inputSize = std::get<0>(info) * inputDims.c() * inputDims.h() * inputDims.w() * sizeof(float);size_t outputSize = std::get<0>(info) * outputDims.c() * outputDims.h() * outputDims.w() * sizeof(float);cudaMalloc(&buffers[inputIndex], inputSize);cudaMalloc(&buffers[outputIndex], outputSize);nvinfer1::IExecutionContext* context = engine->createExecutionContext();context->setProfiler(profiler);// zero the input buffercudaMemset(buffers[inputIndex], 0, inputSize);for (int i = 0; i < std::get<1>(info); ++i)context->execute(std::get<0>(info), buffers);// release the context and bufferscontext->destroy();cudaFree(buffers[inputIndex]);cudaFree(buffers[outputIndex]);return 0;
}} // namespaceint test_googlenet()
{fprintf(stdout, "Building and running a GPU inference engine for GoogleNet, N=4...\n");// stuff we know about the network and the caffe input/output blobsDATA_INFO info(4, 1000, "data", "prob", "models/googlenet.prototxt", "models/googlenet.caffemodel");Logger logger;// parse the caffe model and the mean filenvinfer1::IHostMemory* gieModelStream{ nullptr };caffeToGIEModel(std::get<4>(info), std::get<5>(info), std::vector<std::string>{std::get<3>(info)}, std::get<0>(info), gieModelStream, logger);// create an enginenvinfer1::IRuntime* infer = nvinfer1::createInferRuntime(logger);nvinfer1::ICudaEngine* engine = infer->deserializeCudaEngine(gieModelStream->data(), gieModelStream->size(), nullptr);fprintf(stdout, "Bindings after deserializing:\n"); for (int bi = 0; bi < engine->getNbBindings(); bi++) { if (engine->bindingIsInput(bi) == true) { fprintf(stdout, "Binding %d (%s): Input.\n",  bi, engine->getBindingName(bi)); } else { fprintf(stdout, "Binding %d (%s): Output.\n", bi, engine->getBindingName(bi)); } } Profiler profiler;profiler.setTimeIterations(std::get<1>(info));// run inference with null data to time network performancetimeInference(engine,  info, &profiler);engine->destroy();infer->destroy();profiler.printLayerTimes();fprintf(stdout, "Done.\n");return 0;
}

执行结果如下：

测试代码编译步骤如下(ReadMe.txt)：

在Linux下通过CMake编译TensorRT_Test中的测试代码步骤：
1. 将终端定位到CUDA_Test/prj/linux_tensorrt_cmake，依次执行如下命令：$ mkdir build$ cd build$ cmake ..$ make (生成TensorRT_Test执行文件)$ ln -s ../../../test_data/models  ./ (将models目录软链接到build目录下)$ ln -s ../../../test_data/images  ./ (将images目录软链接到build目录下)$ ./TensorRT_Test
2. 对于有需要用OpenCV参与的读取图像的操作，需要先将对应文件中的图像路径修改为Linux支持的路径格式

GitHub: https://github.com/fengbingchun/CUDA_Test

https://www.dkcj.cn/info/32659.html

Visual Studio Code Go 插件文档翻译

此插件为 Go 语言在 VS Code 中开发提供了多种语言支持。阅读版本变更日志了解此插件过去几个版本的更改内容。 1. 语言功能 (Language Features) 1.1 智能感知 (IntelliSense) 编码时符号自动补全（使用 gocode ）编码时函数签名帮助提示（使用…

编程日记2024/12/20 13:40:00

资源 | 吴恩达《机器学习训练秘籍》中文版58章节完整开源

整理 | Jane出品 | AI科技大本营（ID：rgznai100）一年前，吴恩达老师的《Machine Learning Yearning》(机器学习训练秘籍）中文版正式发布，经过一年多的陆续更新，近日，这本书的中文版 58…

编程日记2024/12/20 13:30:00

js字符串加密的几种方法

在做web前端的时候免不了要用javascript来处理一些简单操作，其实如果要用好JQuery, Prototype,Dojo 等其中一两个javascript框架并不简单，它提高你的web交互和用户体验，从而能使你的web前端有非一样的感觉，如海阔凭鱼跃。当然&…

编程日记2024/12/20 13:20:00

Vue开发入门看这篇文章就够了

摘要： 很多值得了解的细节。原文：Vue开发看这篇文章就够了作者：RandomFundebug经授权转载，版权归原作者所有。介绍 Vue 中文网Vue githubVue.js 是一套构建用户界面(UI)的渐进式JavaScript框架库和框架的区别我们所说的前端框架…

编程日记2024/12/20 13:10:00

TensorRT Samples: CharRNN

关于TensorRT的介绍可以参考： http://blog.csdn.net/fengbingchun/article/details/78469551 以下是参考TensorRT 2.1.2中的sampleCharRNN.cpp文件改写的测试代码，文件(charrnn.cpp)内容如下：#include <assert.h> #include <str…

编程日记2024/12/20 13:00:00

Python脚本BUG引发学界震动，影响有多大？

作者 | beyondma编辑 | Jane来源 | CSDN博客近日一篇“A guide to small-molecule structure assignment through computation of (1H and 13C) NMR chemical shifts”文章火爆网络，据作者看到的资料上看这篇论文自身的结果没有什么问题，但是&#xff0c…

编程日记2024/12/20 12:50:00

C++中public、protect和private用法区别

Calsspig : public animal,意思是外部代码可以随意访问 Classpig : protect animal ,意思是外部代码无法通过该子类访问基类中的public Classpig : private animal ,意思是告诉编译器从基类继承的每一个成员都当成private,即只有这个子类可以访问转载于:https://blog.51cto.…

编程日记2024/12/20 12:40:00

TensorRT Samples: MNIST(Plugin, add a custom layer)

关于TensorRT的介绍可以参考：http://blog.csdn.net/fengbingchun/article/details/78469551 以下是参考TensorRT 2.1.2中的samplePlugin.cpp文件改写的通过IPlugin添加一个全连接层实现对手写数字0-9识别的测试代码，plugin.cpp文件内容如下&#xff1a…

编程日记2024/12/20 12:30:00

AutoML很火，过度吹捧的结果？

作者 | Denis Vorotyntsev译者 | Shawnice编辑 | Jane出品 | AI科技大本营（ID：rgznai100）【导语】现在，很多企业都很关注AutoML领域，很多开发者也开始接触和从事AutoML相关的研究与应用工作，作者也是&#…

编程日记2024/12/20 12:20:00

tomcat6 配置web管理端访问权限

配置tomcat 管理端登陆 /apache-tomcat-6.0.35/conf/tomcat-users.xml 配置文件，使用时需要把注释去掉<!-- <!-- <role rolename"tomcat"/> <role rolename"role1"/> <user username"tomcat" password"…

编程日记2024/12/20 12:10:00

@程序员：Python 3.8正式发布，重要新功能都在这里

整理 | Jane、夕颜出品 | AI科技大本营（ID：rgznai100）【导读】最新版本的Python发布了！今年夏天，Python 3.8发布beta版本，但在2019年10月14日，第一个正式版本已准备就绪。现在，我们都…

编程日记2024/12/20 12:00:00

TensorRT Samples: MNIST(serialize TensorRT model)

关于TensorRT的介绍可以参考： http://blog.csdn.net/fengbingchun/article/details/78469551 这里实现在构建阶段将TensorRT model序列化存到本地文件，然后在部署阶段直接load TensorRT model序列化的文件进行推理，mnist_infer.cpp文件内容…

编程日记2024/12/20 11:50:00

【mysql错误】用as别名做where条件，报未知的列 1054 - Unknown column 'name111' in 'field list'...

需求：SELECT a AS b WHRER b1; //这样使用会报错，说b不存在。因为mysql底层跑SQL语句时：where 后的筛选条件在先， as B的别名在后。所以机器看到where 后的别名是不认的，所以会报说B不存在。这个b只是字段a查询结…

编程日记2024/12/20 11:40:00

C++2年经验

网络 sql 基础算法最多到图和树常用的几种设计模式，5以内即可转载于:https://www.cnblogs.com/liujin2012/p/3766106.html

编程日记2024/12/20 11:30:00

在Caffe中调用TensorRT提供的MNIST model

在TensorRT 2.1.2中提供了MNIST的model，这里拿来用Caffe的代码调用实现，原始的mnist_mean.binaryproto文件调整为了纯二进制文件mnist_tensorrt_mean.binary，测试结果与使用TensorRT调用(http://blog.csdn.net/fengbingchun/article/details/…

编程日记2024/12/20 11:20:00

142页ICML会议强化学习笔记整理，值得细读

作者 | David Abel编辑 | DeepRL来源 | 深度强化学习实验室（ID: Deep-RL）ICML 是 International Conference on Machine Learning的缩写，即国际机器学习大会。ICML如今已发展为由国际机器学习学会（IMLS）主办的年度机器…

编程日记2024/12/20 11:10:00

CF1148F - Foo Fighters

CF1148F - Foo Fighters 题意：你有n个物品，每个都有val和mask。你要选择一个数s，如果一个物品的mask & s含有奇数个1，就把val变成-val。求一个s使得val总和变号。解：分步来做。发现那个奇数个1可以变成&#x…

编程日记2024/12/20 11:00:00

html传參中？和amp;

<a href"MealServlet?typefindbyid&mid<%m1.getMealId()%> 在这句传參中？之后的代表要传递的參数当中有两个參数第一个为type第二个为mid假设是一个參数就不用加&假设是多个參数须要加上&来传递

编程日记2024/12/20 10:50:00

实战：手把手教你实现用语音智能控制电脑 | 附完整代码

作者 | 叶圣出品 | AI科技大本营（ID:rgznai100）导语：本篇文章将基于百度API实现对电脑的语音智能控制，不需要任何硬件上的支持，仅仅依靠一台电脑即可以实现。作者经过测试，效果不错，同时可以依据…

编程日记2024/12/20 10:40:00

C++/C++11中左值、左值引用、右值、右值引用的使用

C的表达式要不然是右值(rvalue)，要不然就是左值(lvalue)。这两个名词是从C语言继承过来的，原本是为了帮助记忆：左值可以位于赋值语句的左侧，右值则不能。在C语言中，二者的区别就没那么简单了。一个左值表达式的求值结…

编程日记2024/12/20 10:30:00

Could not create the view: An unexpected exception was thrown. Myeclipse空间报错

转载于:https://blog.51cto.com/82654993/1424339

编程日记2024/12/20 10:20:00

Banknote Dataset(钞票数据集)介绍

Banknote Dataset(钞票数据集)：这是从纸币鉴别过程中的图像里提取的数据，用来预测钞票的真伪的数据集。该数据集中含有1372个样本，每个样本由5个数值型变量构成，4个输入变量和1个输出变量。小波变换工具用于从图像中提取特征。这是…

编程日记2024/12/20 10:10:00

快速适应性很重要，但不是元学习的全部目标

作者 | Khurram Javed, Hengshuai Yao, Martha White译者 | Monanfei出品 | AI科技大本营（ID:rgznai100）实践证明，基于梯度的元学习在学习模型初始化、表示形式和更新规则方面非常有效，该模型允许从少量样本中进行快速适应。这些方…

编程日记2024/12/20 10:00:00

面试题-自旋锁，以及jvm对synchronized的优化

背景想要弄清楚这些问题，需要弄清楚其他的很多问题。比如，对象，而对象本身又可以延伸出很多其他的问题。我们平时不过只是在使用对象而已，怎么使用？就是new 对象。这只是语法层面的使用，相当于会了一门编…

编程日记2024/12/20 09:50:00

DNS解析故障

在实际应用过程中可能会遇到DNS解析错误的问题，就是说当我们访问一个域名时无法完成将其解析到IP地址的工作，而直接输入网站IP却可以正常访问，这就是因为DNS解析出现故障造成的。这个现象发生的机率比较大，所以本文将从零起步教给…

编程日记2024/12/20 09:40:00

cinder存储服务

一、cinder 介绍： 理解 Block Storage 操作系统获得存储空间的方式一般有两种： 1、通过某种协议（SAS,SCSI,SAN,iSCSI 等）挂接裸硬盘，然后分区、格式化、创建文件系统；或者直接使用裸硬盘存储数据&#xff0…

编程日记2024/12/20 09:30:00

Ubuntu 14.04 64位机上配置Android Studio操作步骤

Android Studio是一个为Android平台开发程序的集成开发环境。2013年5月16日在Google I/O上发布，可供开发者免费使用。Android Studio基于JetBrains IntelliJ IDEA，为Android开发特殊定制，并在Windows、OS X和Linux平台上均可运行。1. 从 htt…

编程日记2024/12/20 09:20:00

大规模1.4亿中文知识图谱数据，我把它开源了

作者 | Just出品 | AI科技大本营（ID:rgznai100）人工智能从感知阶段逐步进入认知智能的过程中，知识图谱技术将为机器提供认知思维能力和关联分析能力，可以应用于机器人问答系统、内容推荐等系统中。不过要降低知识图谱技术应用的门…

编程日记2024/12/20 09:10:00

使用CSS 3创建不规则图形

2019独角兽企业重金招聘Python工程师标准>>> 前言 CSS 创建复杂图形的技术即将会被广泛支持，并且应用到实际项目中。本篇文章的目的是为大家开启它的冰山一角。我希望这篇文章能让你对不规则图形有一个初步的了解。现在，我们已经可以使用CSS…

编程日记2024/12/20 09:00:00

谷歌丰田联合成果ALBERT了解一下：新轻量版BERT，参数小18倍，性能依旧SOTA

作者 | Less Wright编译 | ronghuaiyang来源 | AI公园（ID:AI_Paradise）【导读】这是来自Google和Toyota的新NLP模型，超越Bert，参数小了18倍。你以前的NLP模型参数效率低下，而且有些过时。祝你有美好的一天。谷歌Resear…

编程日记2024/12/20 08:50:00

相关文章：