MNN/source/backend/cuda/execution/RasterExecution.hpp

49 lines
1.5 KiB
C++

//
// RasterExecution.hpp
// MNN
//
// Created by MNN on b'2020/04/02'.
// Copyright © 2018, Alibaba Group Holding Limited
//
#ifndef RasterExecution_hpp
#define RasterExecution_hpp
#include "backend/cuda/core/CUDABackend.hpp"
#include <map>
#include <set>
#include "core/TensorUtils.hpp"
#include "core/OpCommonUtils.hpp"
namespace MNN {
namespace CUDA {
class RasterExecution : public Execution {
public:
RasterExecution(Backend* bn) : Execution(bn) {
// Do nothing
}
virtual ~ RasterExecution() {
// Do nothing
}
virtual ErrorCode onResize(const std::vector<Tensor *> &inputs, const std::vector<Tensor *> &outputs) override;
virtual ErrorCode onExecute(const std::vector<Tensor *> &inputs, const std::vector<Tensor *> &outputs) override;
void executeFaster(const std::vector<Tensor *> &inputs, const std::vector<Tensor *> &outputs) const;
private:
std::map<Tensor*, Tensor*> mTempInput;
std::vector<std::pair<const Tensor*, Tensor::InsideDescribe::Region*>> mTempInputCopy;
std::vector<std::pair<const Tensor*, Tensor::InsideDescribe::Region>> mFastBlit;
std::shared_ptr<Tensor> mTempOutput;
Tensor* mOutputPtr;
bool mNeedZero = false;
bool mFast = false;
OpCommonUtils::TensorConvertParameter mSingleConvert;
int32_t mZeroPoint = 0;
// First: type, 0: not , 1: unit, 4:unitc4
// Second: count
std::pair<int, int> mFuseRaster;
void *mOffset;
std::shared_ptr<Tensor> mOffsetTensor;
std::shared_ptr<Tensor> mTempInputTensor;
};
}
}
#endif