MNN/source/backend/cuda/execution/MatMulExecution.hpp

//
//  MatMulExecution.hpp
//  MNN
//
//  Created by MNN on 2020/07/30.
//  Copyright © 2018, Alibaba Group Holding Limited
//

#ifndef MatMulExecution_hpp
#define MatMulExecution_hpp
#include <vector>
#include "backend/cuda/core/CUDABackend.hpp"
#include "core/Execution.hpp"
#include "TensorCoreGemm.cuh"

namespace MNN {
namespace CUDA {

// Computes C = op(A) * op(B) on the CUDA backend, where op() optionally
// transposes an operand according to the flags passed to the constructor.
// Following MNN's Execution contract, onResize does the shape-dependent
// setup and onExecute launches the actual GEMM.
class MatMulExecution : public Execution {
public:
    MatMulExecution(bool transposeA, bool transposeB, Backend *backend);
    virtual ~MatMulExecution();
    virtual ErrorCode onResize(const std::vector<Tensor *> &inputs, const std::vector<Tensor *> &outputs) override;
    virtual ErrorCode onExecute(const std::vector<Tensor *> &inputs, const std::vector<Tensor *> &outputs) override;

private:
    bool mTransposeA;
    bool mTransposeB;
    std::pair<void*, int> mTempA;      // temporary device buffer for input A
    std::pair<void*, int> mTempB;      // temporary device buffer for input B
    std::pair<void*, int> mParameters; // GEMM parameters resident on the GPU
    MatMulParam mParam;                // GEMM parameters kept on the CPU
    bool mUseBlas = false;             // use a BLAS (cuBLAS) GEMM path instead of the tensor-core kernel
};
} // namespace CUDA
} // namespace MNN

#endif
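
The header only declares the interface; the matching MatMulExecution.cu (not shown) supplies the implementation. As a rough illustration of the onResize/onExecute split this interface implies, below is a minimal standalone CUDA sketch: a resize step fixes the problem size and launch geometry once per shape, and an execute step only launches the kernel. It is not MNN code. The names MatMulSketch and matmulKernel, the e/l/h dimension convention, and the naive kernel itself are hypothetical stand-ins; the real class goes through TensorCoreGemm.cuh and, when mUseBlas is set, presumably a cuBLAS path.

// matmul_sketch.cu -- illustrative sketch only, not part of MNN.
#include <cstdio>
#include <vector>
#include <cuda_runtime.h>

// Naive GEMM: C[row][col] = sum_k op(A)[row][k] * op(B)[k][col],
// with op() transposing the operand when the corresponding flag is set.
// Dimensions follow an (e x l) * (l x h) = (e x h) convention.
__global__ void matmulKernel(const float* A, const float* B, float* C,
                             int e, int l, int h, bool transposeA, bool transposeB) {
    int row = blockIdx.y * blockDim.y + threadIdx.y; // index into e
    int col = blockIdx.x * blockDim.x + threadIdx.x; // index into h
    if (row >= e || col >= h) {
        return;
    }
    float acc = 0.0f;
    for (int k = 0; k < l; ++k) {
        float a = transposeA ? A[k * e + row] : A[row * l + k]; // A is stored l x e when transposed
        float b = transposeB ? B[col * l + k] : B[k * h + col]; // B is stored h x l when transposed
        acc += a * b;
    }
    C[row * h + col] = acc;
}

// Mirrors the onResize/onExecute split: resize() fixes sizes and launch
// geometry once per shape, execute() only launches the kernel.
struct MatMulSketch {
    int e = 0, l = 0, h = 0;
    bool transposeA = false, transposeB = false;
    dim3 block;
    dim3 grid;

    void resize(int e_, int l_, int h_, bool ta, bool tb) {
        e = e_; l = l_; h = h_; transposeA = ta; transposeB = tb;
        block = dim3(16, 16);
        grid  = dim3((h + block.x - 1) / block.x, (e + block.y - 1) / block.y);
    }
    void execute(const float* devA, const float* devB, float* devC) const {
        matmulKernel<<<grid, block>>>(devA, devB, devC, e, l, h, transposeA, transposeB);
    }
};

int main() {
    const int e = 4, l = 3, h = 5;
    std::vector<float> hostA(e * l, 1.0f), hostB(l * h, 2.0f), hostC(e * h, 0.0f);
    float *dA = nullptr, *dB = nullptr, *dC = nullptr;
    cudaMalloc(&dA, hostA.size() * sizeof(float));
    cudaMalloc(&dB, hostB.size() * sizeof(float));
    cudaMalloc(&dC, hostC.size() * sizeof(float));
    cudaMemcpy(dA, hostA.data(), hostA.size() * sizeof(float), cudaMemcpyHostToDevice);
    cudaMemcpy(dB, hostB.data(), hostB.size() * sizeof(float), cudaMemcpyHostToDevice);

    MatMulSketch mm;
    mm.resize(e, l, h, /*transposeA=*/false, /*transposeB=*/false);
    mm.execute(dA, dB, dC); // could be called repeatedly with new data of the same shape

    cudaMemcpy(hostC.data(), dC, hostC.size() * sizeof(float), cudaMemcpyDeviceToHost);
    std::printf("C[0][0] = %.1f (expected %.1f)\n", hostC[0], 1.0f * 2.0f * l);
    cudaFree(dA); cudaFree(dB); cudaFree(dC);
    return 0;
}

Compiled with nvcc, the sketch prints C[0][0] = 6.0 for the all-ones times all-twos case. The point is only the separation of shape-dependent setup from per-call kernel launches, which is what the onResize and onExecute overrides in the header provide within MNN's Execution framework.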