mirror of https://github.com/alibaba/MNN.git
133 lines
5.4 KiB
C++
133 lines
5.4 KiB
C++
//
|
|
// GeometryPermute.cpp
|
|
// MNN
|
|
//
|
|
// Created by MNN on 2020/04/03.
|
|
// Copyright © 2018, Alibaba Group Holding Limited
|
|
//
|
|
|
|
#include "geometry/GeometryComputer.hpp"
|
|
#include "core/TensorUtils.hpp"
|
|
namespace MNN {
|
|
class GeometryPermute : public GeometryComputer {
|
|
public:
|
|
virtual bool onCompute(const Op* op, const std::vector<Tensor*>& inputs, const std::vector<Tensor*>& outputs,
|
|
Context& context, CommandBuffer& res) const override {
|
|
auto input = inputs[0];
|
|
auto output = outputs[0];
|
|
auto inputDes = TensorUtils::getDescribe(input);
|
|
auto outputDes = TensorUtils::getDescribe(output);
|
|
auto inputSlice = inputDes->regions;
|
|
MNN_ASSERT(input->dimensions() >= 1);
|
|
MNN_ASSERT(output->dimensions() == input->dimensions());
|
|
auto originTensor = input;
|
|
int basicOffset = 0;
|
|
std::vector<int> inputStrides(input->buffer().dimensions);
|
|
std::vector<int> shape(input->buffer().dimensions);
|
|
if (op->type() == OpType_Permute) {
|
|
auto shapeValue = op->main_as_Permute()->dims();
|
|
for (int i = 0; i < shape.size(); ++i) {
|
|
shape[i] = shapeValue->data()[i];
|
|
}
|
|
} else if (op->type() == OpType_Transpose) {
|
|
auto shapeValue = inputs[1]->host<int32_t>();
|
|
for (int i = 0; i < shape.size(); ++i) {
|
|
shape[i] = shapeValue[i];
|
|
}
|
|
} else {
|
|
MNN_ASSERT(false);
|
|
}
|
|
int eleSize = 1;
|
|
{
|
|
int stride = 1;
|
|
for (int i = input->buffer().dimensions - 1; i >= 0; --i) {
|
|
inputStrides[i] = stride;
|
|
stride *= input->length(i);
|
|
}
|
|
eleSize = stride;
|
|
}
|
|
// Select not zero dims
|
|
std::vector<int> seperateDimIndexes;
|
|
std::vector<int> outputStrides(input->buffer().dimensions);
|
|
for (int i = 0; i < shape.size(); ++i) {
|
|
outputStrides[i] = inputStrides[shape[i]];
|
|
if (1 != output->length(i)) {
|
|
seperateDimIndexes.emplace_back(i);
|
|
}
|
|
}
|
|
int basicStride = 1;
|
|
// Compute inside, outside, axis
|
|
int inside = 1;
|
|
int insideStride = 0;
|
|
int outside = 1;
|
|
int outsideStride = 0;
|
|
int axis = 1;
|
|
int axisStride = 0;
|
|
int breakAxis = -1;
|
|
int remainSize = 1;
|
|
{
|
|
if (seperateDimIndexes.size() >= 1) {
|
|
auto index = seperateDimIndexes[seperateDimIndexes.size() - 1];
|
|
inside = output->length(index);
|
|
insideStride = outputStrides[index];
|
|
}
|
|
if (seperateDimIndexes.size() >= 2) {
|
|
auto index = seperateDimIndexes[seperateDimIndexes.size() - 2];
|
|
axis = output->length(index);
|
|
axisStride = outputStrides[index];
|
|
}
|
|
if (seperateDimIndexes.size() >= 3) {
|
|
auto index = seperateDimIndexes[seperateDimIndexes.size() - 3];
|
|
outside = output->length(index);
|
|
outsideStride = outputStrides[index];
|
|
breakAxis = (int)seperateDimIndexes.size() - 3;
|
|
for (int i = 0; i < seperateDimIndexes.size() - 3; ++i) {
|
|
remainSize *= output->length(seperateDimIndexes[i]);
|
|
}
|
|
}
|
|
}
|
|
outputDes->regions.resize(remainSize);
|
|
outputDes->memoryType = Tensor::InsideDescribe::MEMORY_VIRTUAL;
|
|
std::vector<int32_t> mod(breakAxis + 1);
|
|
for (int i = 0; i < breakAxis; ++i) {
|
|
int value = 1;
|
|
for (int j = i + 1; j < breakAxis; ++j) {
|
|
auto index = seperateDimIndexes[j];
|
|
value *= output->length(index);
|
|
}
|
|
mod[i] = value;
|
|
}
|
|
for (int indice = 0; indice < remainSize; ++indice) {
|
|
int value = indice;
|
|
int inputOffset = 0;
|
|
for (int i = 0; i < breakAxis; ++i) {
|
|
auto coordinate = value / mod[i];
|
|
auto index = seperateDimIndexes[i];
|
|
inputOffset += coordinate * outputStrides[index];
|
|
value = value % mod[i];
|
|
}
|
|
Tensor::InsideDescribe::Region& slice = outputDes->regions[indice];
|
|
slice.src.offset = inputOffset + basicOffset;
|
|
slice.src.stride[0] = outsideStride * basicStride;
|
|
slice.size[0] = outside;
|
|
slice.src.stride[1] = axisStride * basicStride;
|
|
slice.size[1] = axis;
|
|
slice.src.stride[2] = insideStride * basicStride;
|
|
slice.size[2] = inside;
|
|
slice.origin = originTensor;
|
|
slice.dst.offset = indice * outside * axis * inside;
|
|
slice.dst.stride[0] = axis * inside;
|
|
slice.dst.stride[1] = inside;
|
|
slice.dst.stride[2] = 1;
|
|
}
|
|
return true;
|
|
}
|
|
};
|
|
static void _create() {
|
|
std::shared_ptr<GeometryComputer> comp(new GeometryPermute);
|
|
GeometryComputer::registerGeometryComputer(comp, {OpType_Transpose, OpType_Permute});
|
|
}
|
|
|
|
// Hooks _create into the geometry registry under the name GeometryPermute.
// NOTE(review): REGISTER_GEOMETRY is defined outside this file; presumably it
// arranges for _create to be invoked during library initialisation - confirm.
REGISTER_GEOMETRY(GeometryPermute, _create);
|
|
}; // namespace MNN
|