tools/cpp/MNNV2Basic.cpp

// // MNNV2Basic.cpp // MNN // // Created by MNN on 2019/01/22. // Copyright © 2018, Alibaba Group Holding Limited // #define MNN_OPEN_TIME_TRACE #include <stdlib.h> #include <algorithm> #include <cstring> #include <fstream> #include <iostream> #include <map> #include <memory> #include <sstream> #include <string> #if defined(_MSC_VER) #include <Windows.h> #undef min #undef max #else #include <sys/time.h> #endif #include <MNN/MNNDefine.h> #include <MNN/AutoTime.hpp> #include <MNN/Interpreter.hpp> #include <MNN/Tensor.hpp> #include <core/Backend.hpp> #include <core/TensorUtils.hpp> #include <MNN_generated.h> //#define FEED_INPUT_NAME_VALUE using namespace MNN; #define DUMP_NUM_DATA(type) \ auto data = tensor->host<type>(); \ for (int z = 0; z < outside; ++z) { \ for (int x = 0; x < width; ++x) { \ outputOs << data[x + z * width] << "\t"; \ } \ outputOs << "\n"; \ } #define DUMP_CHAR_DATA(type) \ auto data = tensor->host<type>(); \ for (int z = 0; z < outside; ++z) { \ for (int x = 0; x < width; ++x) { \ outputOs << static_cast<int>(data[x + z * width]) << "\t"; \ } \ outputOs << "\n"; \ } static void dumpTensor2File(const Tensor* tensor, const char* file, std::ofstream& orderFile) { orderFile << file << std::endl; std::ofstream outputOs(file); auto type = tensor->getType(); int dimension = tensor->buffer().dimensions; int width = 1; if (dimension > 1) { width = tensor->length(dimension - 1); } const int outside = tensor->elementSize() / width; const auto dataType = type.code; const auto dataBytes = type.bytes(); if (dataType == halide_type_float) { DUMP_NUM_DATA(float); } if (dataType == halide_type_int && dataBytes == 4) { DUMP_NUM_DATA(int32_t); } if (dataType == halide_type_uint && dataBytes == 1) { DUMP_CHAR_DATA(uint8_t); } if (dataType == halide_type_int && dataBytes == 1) { #ifdef MNN_USE_SSE auto data = tensor->host<uint8_t>(); for (int z = 0; z < outside; ++z) { for (int x = 0; x < width; ++x) { outputOs << (static_cast<int>(data[x + z * width]) - 128) << "\t"; } outputOs << "\n"; } #else DUMP_CHAR_DATA(int8_t); #endif } } static void _loadInputFromFile(Tensor* inputTensor, std::string pwd, std::string name) { MNN::Tensor givenTensor(inputTensor, inputTensor->getDimensionType()); { int size_w = inputTensor->width(); int size_h = inputTensor->height(); int bpp = inputTensor->channel(); int batch = inputTensor->batch(); MNN_PRINT("Input size:%d\n", inputTensor->elementSize()); inputTensor->printShape(); std::ostringstream fileName; fileName << pwd << name; std::ifstream input(fileName.str().c_str()); FUNC_PRINT_ALL(fileName.str().c_str(), s); if (givenTensor.getType().code == halide_type_int) { auto size = givenTensor.elementSize(); const auto bytesLen = givenTensor.getType().bytes(); if (bytesLen == 4) { auto inputData = givenTensor.host<int32_t>(); double temp; for (int i = 0; i < size; ++i) { input >> temp; inputData[i] = temp; } } else if (bytesLen == 1) { auto inputData = givenTensor.host<int8_t>(); double pixel = 0; for (int i = 0; i < size; ++i) { input >> pixel; inputData[i] = static_cast<int8_t>(pixel); } } } else if (givenTensor.getType().code == halide_type_uint) { auto size = givenTensor.elementSize(); { FUNC_PRINT(givenTensor.getType().bytes()); auto inputData = givenTensor.host<uint8_t>(); for (int i = 0; i < size; ++i) { double p; input >> p; inputData[i] = (uint8_t)p; } } } else if (givenTensor.getType().code == halide_type_float) { auto inputData = givenTensor.host<float>(); auto size = givenTensor.elementSize(); for (int i = 0; i < size; ++i) { input >> inputData[i]; // inputData[i] = 1.0f; } } inputTensor->copyFromHostTensor(&givenTensor); } } static inline int64_t getTimeInUs() { uint64_t time; #if defined(_MSC_VER) LARGE_INTEGER now, freq; QueryPerformanceCounter(&now); QueryPerformanceFrequency(&freq); uint64_t sec = now.QuadPart / freq.QuadPart; uint64_t usec = (now.QuadPart % freq.QuadPart) * 1000000 / freq.QuadPart; time = sec * 1000000 + usec; #else struct timeval tv; gettimeofday(&tv, nullptr); time = static_cast<uint64_t>(tv.tv_sec) * 1000000 + tv.tv_usec; #endif return time; } static int test_main(int argc, const char* argv[]) { if (argc < 2) { MNN_PRINT("========================================================================\n"); MNN_PRINT("Arguments: model.MNN runLoops runMask forwardType numberThread precision inputSize \n"); MNN_PRINT("========================================================================\n"); return -1; } std::string cmd = argv[0]; std::string pwd = "./"; auto rslash = cmd.rfind("/"); if (rslash != std::string::npos) { pwd = cmd.substr(0, rslash + 1); } // read args const char* fileName = argv[1]; int runTime = 1; if (argc > 2) { runTime = ::atoi(argv[2]); } int runMask = 0; if (argc > 3) { runMask = atoi(argv[3]); } int saveOutput = 0; if ((runMask & 1) || (runMask & 2)) { MNN_PRINT("Save AllTensors to output/*.txt\n"); saveOutput = 1; } int saveInput = 0; if (runMask & 2) { saveInput = 1; } bool autoBackend = false; if (runMask & 16) { autoBackend = true; } auto type = MNN_FORWARD_CPU; if (argc > 4) { type = (MNNForwardType)atoi(argv[4]); MNN_PRINT("Use extra forward type: %d\n", type); } int modeNum = 4; if (argc > 5) { modeNum = ::atoi(argv[5]); } int precision = BackendConfig::Precision_Low; int memory = BackendConfig::Memory_Normal; if (argc > 6) { int mask = atoi(argv[6]); precision = mask % 4; memory = (mask / 4) % 4; } // input dims std::vector<int> inputDims; if (argc > 7) { std::string inputShape(argv[7]); const char* delim = "x"; std::ptrdiff_t p1 = 0, p2; while (1) { p2 = inputShape.find(delim, p1); if (p2 != std::string::npos) { inputDims.push_back(atoi(inputShape.substr(p1, p2 - p1).c_str())); p1 = p2 + 1; } else { inputDims.push_back(atoi(inputShape.substr(p1).c_str())); break; } } } for (auto dim : inputDims) { MNN_PRINT("%d ", dim); } MNN_PRINT("\n"); // create net MNN_PRINT("Open Model %s\n", fileName); std::shared_ptr<MNN::Interpreter> net = std::shared_ptr<MNN::Interpreter>(MNN::Interpreter::createFromFile(fileName), MNN::Interpreter::destroy); if (nullptr == net) { return 0; } net->setCacheFile(".tempcache"); net->setSessionMode(Interpreter::Session_Debug); if (autoBackend) { net->setSessionMode(Interpreter::Session_Backend_Auto); net->setSessionHint(Interpreter::MAX_TUNING_NUMBER, 15); } if (!inputDims.empty()) { net->setSessionMode(Interpreter::Session_Resize_Defer); } if (runMask & 32) { net->setSessionHint(Interpreter::WINOGRAD_MEMORY_LEVEL, 0); } // create session MNN::ScheduleConfig config; config.type = type; /*modeNum means gpuMode for GPU usage, Or means numThread for CPU usage.*/ config.numThread = modeNum; // If type not fount, let it failed config.backupType = type; BackendConfig backendConfig; // config.path.outputs.push_back("ResizeBilinear_2"); // backendConfig.power = BackendConfig::Power_High; backendConfig.precision = static_cast<MNN::BackendConfig::PrecisionMode>(precision); backendConfig.memory = static_cast<MNN::BackendConfig::MemoryMode>(memory); config.backendConfig = &backendConfig; MNN::Session* session = NULL; MNN::Tensor* inputTensor = nullptr; { AUTOTIME; session = net->createSession(config); if (nullptr == session) { return 0; } inputTensor = net->getSessionInput(session, NULL); if (!inputDims.empty()) { MNN_PRINT("===========> Resize Again...\n"); net->resizeTensor(inputTensor, inputDims); net->resizeSession(session); //Set when size is changed, After resizeSession } } int resizeStatus = 0; net->getSessionInfo(session, MNN::Interpreter::RESIZE_STATUS, &resizeStatus); if (resizeStatus != 0) { MNN_ERROR("Resize error, can't execute MNN\n"); return 0; } float memoryUsage = 0.0f; net->getSessionInfo(session, MNN::Interpreter::MEMORY, &memoryUsage); float flops = 0.0f; net->getSessionInfo(session, MNN::Interpreter::FLOPS, &flops); int backendType[2]; net->getSessionInfo(session, MNN::Interpreter::BACKENDS, backendType); MNN_PRINT("Session Info: memory use %f MB, flops is %f M, backendType is %d\n", memoryUsage, flops, backendType[0]); // Set Other Inputs to Zero auto allInput = net->getSessionInputAll(session); for (auto& iter : allInput) { auto inputTensor = iter.second; auto size = inputTensor->size(); if (size <= 0) { continue; } MNN::Tensor tempTensor(inputTensor, inputTensor->getDimensionType()); ::memset(tempTensor.host<void>(), 0, tempTensor.size()); inputTensor->copyFromHostTensor(&tempTensor); } MNN_PRINT("===========> Session Resize Done.\n"); MNN_PRINT("===========> Session Start running...\n"); if (type == MNN_FORWARD_CPU || (!autoBackend)) { net->releaseModel(); } _loadInputFromFile(inputTensor, pwd, "input_0.txt"); // input auto dimType = inputTensor->getDimensionType(); if (inputTensor->getType().code == halide_type_uint || inputTensor->getType().code == halide_type_int) { dimType = Tensor::TENSORFLOW; } std::ofstream orderFileOs; orderFileOs.open(".order"); if (saveOutput) { MNN::TensorCallBack beforeCallBack = [&](const std::vector<MNN::Tensor*>& ntensors, const std::string& opName) { if (!saveInput) { return true; } for (int i = 0; i < ntensors.size(); ++i) { auto ntensor = ntensors[i]; if (nullptr == ntensor->host<void>() && 0 == ntensor->deviceId()) { // Raster Input continue; } auto outDimType = ntensor->getDimensionType(); auto expectTensor = new MNN::Tensor(ntensor, outDimType); ntensor->copyToHostTensor(expectTensor); auto tensor = ntensor; std::ostringstream outputFileName; auto opCopyName = opName; for (int j = 0; j < opCopyName.size(); ++j) { if (opCopyName[j] == '/') { opCopyName[j] = '_'; } } MNN_PRINT("Dump %s Input, %d, %d X %d X %d X %d\n", opName.c_str(), i, tensor->width(), tensor->height(), tensor->channel(), tensor->batch()); outputFileName << "output/Input_" << opCopyName << "_" << i; dumpTensor2File(expectTensor, outputFileName.str().c_str(), orderFileOs); delete expectTensor; } return true; }; MNN::TensorCallBack callBack = [&](const std::vector<MNN::Tensor*>& ntensors, const std::string& opName) { for (int i = 0; i < ntensors.size(); ++i) { auto ntensor = ntensors[i]; auto outDimType = ntensor->getDimensionType(); auto expectTensor = new MNN::Tensor(ntensor, outDimType); ntensor->copyToHostTensor(expectTensor); auto tensor = expectTensor; std::ostringstream outputFileName; auto opCopyName = opName; for (int j = 0; j < opCopyName.size(); ++j) { if (opCopyName[j] == '/') { opCopyName[j] = '_'; } } if (tensor->dimensions() == 4) { MNN_PRINT("Dimensions: 4, W,H,C,B: %d X %d X %d X %d, OP name %s : %d\n", tensor->width(), tensor->height(), tensor->channel(), tensor->batch(), opName.c_str(), i); } else { std::ostringstream oss; for (int i = 0; i < tensor->dimensions(); i++) { oss << (i ? " X " : "") << tensor->length(i); } MNN_PRINT("Dimensions: %d, %s, OP name %s : %d\n", tensor->dimensions(), oss.str().c_str(), opName.c_str(), i); } outputFileName << "output/" << opCopyName << "_" << i; dumpTensor2File(expectTensor, outputFileName.str().c_str(), orderFileOs); delete expectTensor; } return true; }; net->runSessionWithCallBack(session, beforeCallBack, callBack); } else { net->runSession(session); } // save output auto outputTensor = net->getSessionOutput(session, NULL); MNN::Tensor expectTensor(outputTensor, outputTensor->getDimensionType()); { outputTensor->copyToHostTensor(&expectTensor); auto outputFile = pwd + "output.txt"; if (outputTensor->size() > 0) { dumpTensor2File(&expectTensor, outputFile.c_str(), orderFileOs); } else { MNN_ERROR("output size is 0, can't save\n"); } } auto allOutputs = net->getSessionOutputAll(session); for (auto& iter : allOutputs) { MNN_PRINT("output: %s\n", iter.first.c_str()); { MNN::Tensor expectTensor2(iter.second, iter.second->getDimensionType()); iter.second->copyToHostTensor(&expectTensor2); auto outputFile = pwd + "/output/" + iter.first + ".txt"; if (iter.second->size() > 0) { dumpTensor2File(&expectTensor2, outputFile.c_str(), orderFileOs); } } } // benchmark. for CPU, op time means calc duration; for others, op time means schedule duration. { int t = runTime; MNN_PRINT("precision:%d, memory: %d, Run %d time:\n", precision, memory, t); std::map<std::string, std::pair<float, float>> opTimes; std::map<std::string, std::string> opTypes; uint64_t opBegin = 0; MNN::TensorCallBackWithInfo beforeCallBack = [&](const std::vector<MNN::Tensor*>& ntensors, const OperatorInfo* info) { if(opTypes.find(info->name()) == opTypes.end()){ opTypes.insert(std::make_pair(info->name(), info->type())); } opBegin = getTimeInUs(); if (opTimes.find(info->name()) == opTimes.end()) { opTimes.insert(std::make_pair(info->name(), std::make_pair(0.0f, info->flops()))); } return true; }; MNN::TensorCallBackWithInfo afterCallBack = [&](const std::vector<MNN::Tensor*>& ntensors, const OperatorInfo* info) { auto opEnd = getTimeInUs(); float cost = (float)(opEnd - opBegin) / 1000.0f; opTimes[info->name()].first += cost; return true; }; if (t > 0) { for (int i = 0; i < 3; ++i) { // warmup { auto ptr = inputTensor->map(MNN::Tensor::MAP_TENSOR_WRITE, inputTensor->getDimensionType()); inputTensor->unmap(MNN::Tensor::MAP_TENSOR_WRITE, inputTensor->getDimensionType(), ptr); } net->runSession(session); { auto ptr = outputTensor->map(MNN::Tensor::MAP_TENSOR_READ, outputTensor->getDimensionType()); outputTensor->unmap(MNN::Tensor::MAP_TENSOR_READ, outputTensor->getDimensionType(), ptr); } } float minTime = 0.0f; float maxTime = 0.0f; float sum = 0.0f; for (int i = 0; i < t; ++i) { auto begin = getTimeInUs(); { auto ptr = inputTensor->map(MNN::Tensor::MAP_TENSOR_WRITE, inputTensor->getDimensionType()); inputTensor->unmap(MNN::Tensor::MAP_TENSOR_WRITE, inputTensor->getDimensionType(), ptr); } net->runSessionWithCallBackInfo(session, beforeCallBack, afterCallBack, false); { auto ptr = outputTensor->map(MNN::Tensor::MAP_TENSOR_READ, outputTensor->getDimensionType()); outputTensor->unmap(MNN::Tensor::MAP_TENSOR_READ, outputTensor->getDimensionType(), ptr); } auto end = getTimeInUs(); auto curtime = (end - begin) / 1000.0f; if (0 == i) { minTime = curtime; maxTime = curtime; } else { minTime = ALIMIN(curtime, minTime); maxTime = ALIMAX(curtime, maxTime); } sum += curtime; } std::vector<std::pair<float, std::pair<std::string, float>>> allOpsTimes; float sumFlops = 0.0f; for (auto& iter : opTimes) { allOpsTimes.push_back( std::make_pair(iter.second.first, std::make_pair(iter.first, iter.second.second))); sumFlops += iter.second.second; } std::sort(allOpsTimes.begin(), allOpsTimes.end()); float opSum = 0; for (auto& iter : allOpsTimes) { opSum += iter.first; MNN_PRINT("%*s \t[%s] run %d average cost %f ms, %.3f %%, FlopsRate: %.3f %%\n", 50, iter.second.first.c_str(), opTypes[iter.second.first].c_str(), runTime, iter.first / (float)runTime, iter.first / sum * 100.0f, iter.second.second / sumFlops * 100.0f); } opSum = opSum / runTime; MNN_PRINT("Avg= %f ms, OpSum = %f ms min= %f ms, max= %f ms\n", sum / (float)t, opSum, minTime, maxTime); } } net->updateCacheFile(session); return 0; } int main(int argc, const char* argv[]) { // For Detect Memory Leak, set circle as true bool circle = false; do { test_main(argc, argv); } while (circle); return 0; }

tools/cpp/MNNV2Basic.cpp (472 lines of code) (raw):