MNN/tools/cpp/timeProfile.cpp

//
//  timeProfile.cpp
//  MNN
//
//  Created by MNN on 2019/01/22.
//  Copyright © 2018, Alibaba Group Holding Limited
//

#define MNN_OPEN_TIME_TRACE
#include <stdlib.h>
#include <cstring>
#include <memory>
#include <string>
#include <MNN/AutoTime.hpp>
#include <MNN/Interpreter.hpp>
#include <MNN/MNNDefine.h>
#include "core/Macro.h"
#include "Profiler.hpp"
#include <MNN/Tensor.hpp>
#include "revertMNNModel.hpp"

#define MNN_PRINT_TIME_BY_NAME

using namespace MNN;

// Splits `str` on `delim` and converts every non-empty piece to an int with atoi.
//
// Empty pieces (an empty input string, leading/trailing delimiters, or two
// delimiters in a row) are skipped instead of being reported as a spurious 0.
// A non-empty piece that does not start with a number still becomes 0, because
// that is what atoi returns for it.
//
// str:   text such as "1x3x224x224" or "0,1,2,3".
// delim: the single character separating the numbers.
// Returns the parsed values in their original order; empty when `str`
// contains no non-empty piece.
static inline std::vector<int> parseIntList(const std::string& str, char delim) {
    std::vector<int> result;
    // Keep positions in the string's own unsigned size type so the comparison
    // against npos does not rely on a signed/unsigned round trip.
    std::string::size_type begin = 0;
    while (true) {
        const std::string::size_type end = str.find(delim, begin);
        const bool isLast                = (end == std::string::npos);
        const std::string token          = isLast ? str.substr(begin) : str.substr(begin, end - begin);
        if (!token.empty()) {
            result.push_back(atoi(token.c_str()));
        }
        if (isLast) {
            break;
        }
        begin = end + 1;
    }
    return result;
}
int main(int argc, const char* argv[]) {
    if (argc < 2) {
        MNN_PRINT("=========================================================================================\n");
        MNN_PRINT("Arguments: model.MNN runLoops forwardType inputSize numberThread precision sparsity cpuIds\n");
        MNN_PRINT("Example: %s model.MNN 100 0 1x3x224x224 4 0 0 0,1,2,3\n", argv[0]);
        MNN_PRINT("=========================================================================================\n");
        return -1;
    }

    std::string cmd = argv[0];
    std::string pwd = "./";
    auto rslash     = cmd.rfind("/");
    if (rslash != std::string::npos) {
        pwd = cmd.substr(0, rslash + 1);
    }

    // read args
    const char* fileName = argv[1];
    int runTime          = 100;
    if (argc > 2) {
        runTime = ::atoi(argv[2]);
    }
    auto type = MNN_FORWARD_CPU;
    if (argc > 3) {
        type = (MNNForwardType)atoi(argv[3]);
        printf("Use extra forward type: %d\n", type);
    }

    // input dims
    std::vector<int> inputDims;
    if (argc > 4) {
        inputDims = parseIntList(argv[4], 'x');
    }
    MNN_PRINT("inputDims: ");
    for (auto dim : inputDims) {
        MNN_PRINT("%d ", dim);
    }
    MNN_PRINT("\n");
    int threadNumber = 4;
    if (argc > 5) {
        threadNumber = ::atoi(argv[5]);
        MNN_PRINT("Set ThreadNumber = %d\n", threadNumber);
    }

    auto precision = BackendConfig::PrecisionMode::Precision_Normal;
    if (argc > 6) {
        precision = (BackendConfig::PrecisionMode)atoi(argv[6]);
        printf("Use precision type: %d\n", precision);
    }

    float sparsity = 0.0f;
    if(argc > 7) {
        sparsity = atof(argv[7]);
    }
    
    // CPU IDs
    std::vector<int> cpuIds;
    if (argc > 8) {
        cpuIds = parseIntList(argv[8], ',');
    }
    MNN_PRINT("cpuIds: ");
    for (auto id : cpuIds) {
        MNN_PRINT("%d ", id);
    }
    MNN_PRINT("\n");


    // revert MNN model if necessary
    auto revertor = std::unique_ptr<Revert>(new Revert(fileName));
    revertor->initialize(sparsity);
    auto modelBuffer = revertor->getBuffer();
    auto bufferSize  = revertor->getBufferSize();

    // create net
    MNN_PRINT("Open Model %s\n", fileName);
    auto net = std::shared_ptr<Interpreter>(Interpreter::createFromBuffer(modelBuffer, bufferSize));
    if (nullptr == net) {
        return 0;
    }
    revertor.reset();
    net->setSessionMode(Interpreter::Session_Debug);
    net->setSessionHint(Interpreter::HintMode::CPU_CORE_IDS, cpuIds.data(), cpuIds.size());

    // create session
    MNN::ScheduleConfig config;
    config.type           = type;
    config.numThread      = threadNumber;
    BackendConfig backendConfig;
    backendConfig.precision = precision;
    config.backendConfig  = &backendConfig;
    MNN::Session* session = NULL;
    session               = net->createSession(config);
    auto inputTensor      = net->getSessionInput(session, NULL);
    if (!inputDims.empty()) {
        net->resizeTensor(inputTensor, inputDims);
        net->resizeSession(session);
    }
    auto allInput = net->getSessionInputAll(session);
    for (auto& iter : allInput) {
        auto inputTensor = iter.second;
        auto size = inputTensor->size();
        if (size <= 0) {
            continue;
        }
        MNN::Tensor tempTensor(inputTensor, inputTensor->getDimensionType());
        ::memset(tempTensor.host<void>(), 0, tempTensor.size());
        inputTensor->copyFromHostTensor(&tempTensor);
    }
    net->releaseModel();
    std::shared_ptr<MNN::Tensor> inputTensorUser(MNN::Tensor::createHostTensorFromDevice(inputTensor, false));
    auto outputTensor = net->getSessionOutput(session, NULL);
    if (outputTensor->size() <= 0) {
        MNN_ERROR("Output not available\n");
        return 0;
    }
    std::shared_ptr<MNN::Tensor> outputTensorUser(MNN::Tensor::createHostTensorFromDevice(outputTensor, false));

    auto profiler      = MNN::Profiler::getInstance();
    auto beginCallBack = [&](const std::vector<Tensor*>& inputs, const OperatorInfo* info) {
        profiler->start(info);
        return true;
    };
    auto afterCallBack = [&](const std::vector<Tensor*>& tensors, const OperatorInfo* info) {
        for (auto o : tensors) {
            o->wait(MNN::Tensor::MAP_TENSOR_READ, true);
        }
        profiler->end(info);
        return true;
    };

    AUTOTIME;
    // just run
    for (int i = 0; i < runTime; ++i) {
        inputTensor->copyFromHostTensor(inputTensorUser.get());
        net->runSessionWithCallBackInfo(session, beginCallBack, afterCallBack);
        outputTensor->copyToHostTensor(outputTensorUser.get());
    }

#ifdef MNN_PRINT_TIME_BY_NAME
    profiler->printTimeByName(runTime);
#endif
    profiler->printSlowOp("Convolution", 20, 0.03f);
    profiler->printTimeByType(runTime);
    return 0;
}
beta 0.1.0 2019-04-17 10:49:11 +08:00			`//`
			`// timeProfile.cpp`
			`// MNN`
			`//`
			`// Created by MNN on 2019/01/22.`
			`// Copyright © 2018, Alibaba Group Holding Limited`
			`//`

			`#define MNN_OPEN_TIME_TRACE`
			`#include <stdlib.h>`
			`#include <cstring>`
			`#include <memory>`
			`#include <string>`
Update 2019-12-27 22:16:57 +08:00			`#include <MNN/AutoTime.hpp>`
			`#include <MNN/Interpreter.hpp>`
			`#include <MNN/MNNDefine.h>`
			`#include "core/Macro.h"`
beta 0.1.0 2019-04-17 10:49:11 +08:00			`#include "Profiler.hpp"`
Update 2019-12-27 22:16:57 +08:00			`#include <MNN/Tensor.hpp>`
beta 0.1.0 2019-04-17 10:49:11 +08:00			`#include "revertMNNModel.hpp"`

- dynamic computation graph (beta) - add supports (/express) - add tests - add benchmarks with it (/benchmark/exprModels) - Python - MNN engine and tools were submitted to pip - available on Windows/macOS/Linux - Engine/Converter - add supports for each op benchmarking - refactor optimizer by separating steps - CPU - add supports for Conv3D, Pool3D, ELU, ReverseSequence - fix ArgMax, Permute, Scale, BinaryOp, Slice, SliceTf - OpenCL - add half transform in CPU - add broadcast supports for binary - optimize Conv2D, Reshape, Eltwise, Gemm, etc. - OpenGL - add sub, real div supports for binary - add supports for unary - optimize Conv2D, Reshape - Vulkan - add max supports for eltwise - Metal - fix metallib missing problem - Train/Quantization - use express to refactor training codes 2019-09-26 21:02:07 +08:00			`#define MNN_PRINT_TIME_BY_NAME`

beta 0.1.0 2019-04-17 10:49:11 +08:00			`using namespace MNN;`

bind cpuIds 2025-07-11 12:47:18 +08:00			`static inline std::vector<int> parseIntList(const std::string& str, char delim) {`
			`std::vector<int> result;`
			`std::ptrdiff_t p1 = 0, p2;`
			`while (1) {`
			`p2 = str.find(delim, p1);`
			`if (p2 != std::string::npos) {`
			`result.push_back(atoi(str.substr(p1, p2 - p1).c_str()));`
			`p1 = p2 + 1;`
			`} else {`
			`result.push_back(atoi(str.substr(p1).c_str()));`
			`break;`
			`}`
			`}`
			`return result;`
			`}`
beta 0.1.0 2019-04-17 10:49:11 +08:00			`int main(int argc, const char* argv[]) {`
bind cpuIds 2025-07-11 12:47:18 +08:00			`if (argc < 2) {`
			`MNN_PRINT("=========================================================================================\n");`
			`MNN_PRINT("Arguments: model.MNN runLoops forwardType inputSize numberThread precision sparsity cpuIds\n");`
			`MNN_PRINT("Example: %s model.MNN 100 0 1x3x224x224 4 0 0 0,1,2,3\n", argv[0]);`
			`MNN_PRINT("=========================================================================================\n");`
			`return -1;`
			`}`

beta 0.1.0 2019-04-17 10:49:11 +08:00			`std::string cmd = argv[0];`
			`std::string pwd = "./";`
			`auto rslash = cmd.rfind("/");`
			`if (rslash != std::string::npos) {`
			`pwd = cmd.substr(0, rslash + 1);`
			`}`
Synchronize internal github for version 1.2.0 (#1518) 2021-06-11 17:17:13 +08:00
beta 0.1.0 2019-04-17 10:49:11 +08:00			`// read args`
			`const char* fileName = argv[1];`
			`int runTime = 100;`
			`if (argc > 2) {`
			`runTime = ::atoi(argv[2]);`
			`}`
			`auto type = MNN_FORWARD_CPU;`
			`if (argc > 3) {`
			`type = (MNNForwardType)atoi(argv[3]);`
			`printf("Use extra forward type: %d\n", type);`
			`}`
Synchronize internal github for version 1.2.0 (#1518) 2021-06-11 17:17:13 +08:00
beta 0.1.0 2019-04-17 10:49:11 +08:00			`// input dims`
			`std::vector<int> inputDims;`
			`if (argc > 4) {`
bind cpuIds 2025-07-11 12:47:18 +08:00			`inputDims = parseIntList(argv[4], 'x');`
beta 0.1.0 2019-04-17 10:49:11 +08:00			`}`
bind cpuIds 2025-07-11 12:47:18 +08:00			`MNN_PRINT("inputDims: ");`
beta 0.1.0 2019-04-17 10:49:11 +08:00			`for (auto dim : inputDims) {`
			`MNN_PRINT("%d ", dim);`
			`}`
			`MNN_PRINT("\n");`
[MNN:Sync] Sync internal Gitlab 2021-04-08 15:34:23 +08:00			`int threadNumber = 4;`
			`if (argc > 5) {`
sync from internal repo 2021-04-28 18:02:10 +08:00			`threadNumber = ::atoi(argv[5]);`
[MNN:Sync] Sync internal Gitlab 2021-04-08 15:34:23 +08:00			`MNN_PRINT("Set ThreadNumber = %d\n", threadNumber);`
			`}`

[Sync] Sync Internal Gitlab 2.2.0 2022-10-30 08:44:24 +08:00			`auto precision = BackendConfig::PrecisionMode::Precision_Normal;`
			`if (argc > 6) {`
			`precision = (BackendConfig::PrecisionMode)atoi(argv[6]);`
			`printf("Use precision type: %d\n", precision);`
			`}`

Synchronize internal github for version 1.2.0 (#1518) 2021-06-11 17:17:13 +08:00			`float sparsity = 0.0f;`
bind cpuIds 2025-07-11 12:47:18 +08:00			`if(argc > 7) {`
Synchronize internal github for version 1.2.0 (#1518) 2021-06-11 17:17:13 +08:00			`sparsity = atof(argv[7]);`
			`}`
bind cpuIds 2025-07-11 12:47:18 +08:00
			`// CPU IDs`
			`std::vector<int> cpuIds;`
			`if (argc > 8) {`
			`cpuIds = parseIntList(argv[8], ',');`
			`}`
			`MNN_PRINT("cpuIds: ");`
			`for (auto id : cpuIds) {`
			`MNN_PRINT("%d ", id);`
			`}`
			`MNN_PRINT("\n");`
Synchronize internal github for version 1.2.0 (#1518) 2021-06-11 17:17:13 +08:00

beta 0.1.0 2019-04-17 10:49:11 +08:00			`// revert MNN model if necessary`
			`auto revertor = std::unique_ptr<Revert>(new Revert(fileName));`
Synchronize internal github for version 1.2.0 (#1518) 2021-06-11 17:17:13 +08:00			`revertor->initialize(sparsity);`
beta 0.1.0 2019-04-17 10:49:11 +08:00			`auto modelBuffer = revertor->getBuffer();`
			`auto bufferSize = revertor->getBufferSize();`
Synchronize internal github for version 1.2.0 (#1518) 2021-06-11 17:17:13 +08:00
beta 0.1.0 2019-04-17 10:49:11 +08:00			`// create net`
			`MNN_PRINT("Open Model %s\n", fileName);`
			`auto net = std::shared_ptr<Interpreter>(Interpreter::createFromBuffer(modelBuffer, bufferSize));`
			`if (nullptr == net) {`
			`return 0;`
			`}`
			`revertor.reset();`
Github release 1.1.0 2020-11-05 16:41:56 +08:00			`net->setSessionMode(Interpreter::Session_Debug);`
refactor cpuids setting from BackendConfig to HintMode 2025-07-18 17:42:59 +08:00			`net->setSessionHint(Interpreter::HintMode::CPU_CORE_IDS, cpuIds.data(), cpuIds.size());`
Synchronize internal github for version 1.2.0 (#1518) 2021-06-11 17:17:13 +08:00
beta 0.1.0 2019-04-17 10:49:11 +08:00			`// create session`
			`MNN::ScheduleConfig config;`
			`config.type = type;`
[MNN:Sync] Sync internal Gitlab 2021-04-08 15:34:23 +08:00			`config.numThread = threadNumber;`
[Sync] Sync Internal Gitlab 2.2.0 2022-10-30 08:44:24 +08:00			`BackendConfig backendConfig;`
			`backendConfig.precision = precision;`
			`config.backendConfig = &backendConfig;`
beta 0.1.0 2019-04-17 10:49:11 +08:00			`MNN::Session* session = NULL;`
			`session = net->createSession(config);`
			`auto inputTensor = net->getSessionInput(session, NULL);`
			`if (!inputDims.empty()) {`
			`net->resizeTensor(inputTensor, inputDims);`
			`net->resizeSession(session);`
			`}`
Synchronize internal github for version 1.2.0 (#1518) 2021-06-11 17:17:13 +08:00			`auto allInput = net->getSessionInputAll(session);`
			`for (auto& iter : allInput) {`
			`auto inputTensor = iter.second;`
			`auto size = inputTensor->size();`
			`if (size <= 0) {`
			`continue;`
			`}`
			`MNN::Tensor tempTensor(inputTensor, inputTensor->getDimensionType());`
			`::memset(tempTensor.host<void>(), 0, tempTensor.size());`
			`inputTensor->copyFromHostTensor(&tempTensor);`
			`}`
beta 0.1.1.6 - add support for windows - fix bugs in converting dropout - fix bugs in post treat 2019-06-10 21:08:55 +08:00			`net->releaseModel();`
beta 0.1.1.4 - refactor OpenGL, test relative codes - optimize LRN - fix doc link error 2019-05-24 11:26:54 +08:00			`std::shared_ptr<MNN::Tensor> inputTensorUser(MNN::Tensor::createHostTensorFromDevice(inputTensor, false));`
beta 0.1.0 2019-04-17 10:49:11 +08:00			`auto outputTensor = net->getSessionOutput(session, NULL);`
			`if (outputTensor->size() <= 0) {`
			`MNN_ERROR("Output not available\n");`
			`return 0;`
			`}`
beta 0.1.1.4 - refactor OpenGL, test relative codes - optimize LRN - fix doc link error 2019-05-24 11:26:54 +08:00			`std::shared_ptr<MNN::Tensor> outputTensorUser(MNN::Tensor::createHostTensorFromDevice(outputTensor, false));`
Synchronize internal github for version 1.2.0 (#1518) 2021-06-11 17:17:13 +08:00
beta 0.1.0 2019-04-17 10:49:11 +08:00			`auto profiler = MNN::Profiler::getInstance();`
			`auto beginCallBack = [&](const std::vector<Tensor>& inputs, const OperatorInfo info) {`
			`profiler->start(info);`
			`return true;`
			`};`
[MNN:Sync] Sync internal gitlab 2022-01-04 10:50:40 +08:00			`auto afterCallBack = [&](const std::vector<Tensor>& tensors, const OperatorInfo info) {`
			`for (auto o : tensors) {`
			`o->wait(MNN::Tensor::MAP_TENSOR_READ, true);`
			`}`
beta 0.1.0 2019-04-17 10:49:11 +08:00			`profiler->end(info);`
			`return true;`
			`};`
Synchronize internal github for version 1.2.0 (#1518) 2021-06-11 17:17:13 +08:00
beta 0.1.0 2019-04-17 10:49:11 +08:00			`AUTOTIME;`
			`// just run`
			`for (int i = 0; i < runTime; ++i) {`
beta 0.1.1.4 - refactor OpenGL, test relative codes - optimize LRN - fix doc link error 2019-05-24 11:26:54 +08:00			`inputTensor->copyFromHostTensor(inputTensorUser.get());`
beta 0.1.0 2019-04-17 10:49:11 +08:00			`net->runSessionWithCallBackInfo(session, beginCallBack, afterCallBack);`
beta 0.1.1.4 - refactor OpenGL, test relative codes - optimize LRN - fix doc link error 2019-05-24 11:26:54 +08:00			`outputTensor->copyToHostTensor(outputTensorUser.get());`
beta 0.1.0 2019-04-17 10:49:11 +08:00			`}`
Synchronize internal github for version 1.2.0 (#1518) 2021-06-11 17:17:13 +08:00
- dynamic computation graph (beta) - add supports (/express) - add tests - add benchmarks with it (/benchmark/exprModels) - Python - MNN engine and tools were submitted to pip - available on Windows/macOS/Linux - Engine/Converter - add supports for each op benchmarking - refactor optimizer by separating steps - CPU - add supports for Conv3D, Pool3D, ELU, ReverseSequence - fix ArgMax, Permute, Scale, BinaryOp, Slice, SliceTf - OpenCL - add half transform in CPU - add broadcast supports for binary - optimize Conv2D, Reshape, Eltwise, Gemm, etc. - OpenGL - add sub, real div supports for binary - add supports for unary - optimize Conv2D, Reshape - Vulkan - add max supports for eltwise - Metal - fix metallib missing problem - Train/Quantization - use express to refactor training codes 2019-09-26 21:02:07 +08:00			`#ifdef MNN_PRINT_TIME_BY_NAME`
			`profiler->printTimeByName(runTime);`
			`#endif`
[MNN:Sync] Sync internal Gitlab 2021-09-18 15:52:30 +08:00			`profiler->printSlowOp("Convolution", 20, 0.03f);`
beta 0.1.0 2019-04-17 10:49:11 +08:00			`profiler->printTimeByType(runTime);`
			`return 0;`
- dynamic computation graph (beta) - add supports (/express) - add tests - add benchmarks with it (/benchmark/exprModels) - Python - MNN engine and tools were submitted to pip - available on Windows/macOS/Linux - Engine/Converter - add supports for each op benchmarking - refactor optimizer by separating steps - CPU - add supports for Conv3D, Pool3D, ELU, ReverseSequence - fix ArgMax, Permute, Scale, BinaryOp, Slice, SliceTf - OpenCL - add half transform in CPU - add broadcast supports for binary - optimize Conv2D, Reshape, Eltwise, Gemm, etc. - OpenGL - add sub, real div supports for binary - add supports for unary - optimize Conv2D, Reshape - Vulkan - add max supports for eltwise - Metal - fix metallib missing problem - Train/Quantization - use express to refactor training codes 2019-09-26 21:02:07 +08:00			`}`