mirror of https://github.com/alibaba/MNN.git
				
				
				
			
		
			
				
	
	
		
			133 lines
		
	
	
		
			5.4 KiB
		
	
	
	
		
			C++
		
	
	
	
			
		
		
	
	
			133 lines
		
	
	
		
			5.4 KiB
		
	
	
	
		
			C++
		
	
	
	
//
 | 
						|
//  GeometryPermute.cpp
 | 
						|
//  MNN
 | 
						|
//
 | 
						|
//  Created by MNN on 2020/04/03.
 | 
						|
//  Copyright © 2018, Alibaba Group Holding Limited
 | 
						|
//
 | 
						|
 | 
						|
#include "geometry/GeometryComputer.hpp"
 | 
						|
#include "core/TensorUtils.hpp"
 | 
						|
namespace MNN {
 | 
						|
class GeometryPermute : public GeometryComputer {
 | 
						|
public:
 | 
						|
    virtual bool onCompute(const Op* op, const std::vector<Tensor*>& inputs, const std::vector<Tensor*>& outputs,
 | 
						|
                           Context& context, CommandBuffer& res) const override {
 | 
						|
        auto input      = inputs[0];
 | 
						|
        auto output     = outputs[0];
 | 
						|
        auto inputDes   = TensorUtils::getDescribe(input);
 | 
						|
        auto outputDes  = TensorUtils::getDescribe(output);
 | 
						|
        auto inputSlice = inputDes->regions;
 | 
						|
        MNN_ASSERT(input->dimensions() >= 1);
 | 
						|
        MNN_ASSERT(output->dimensions() == input->dimensions());
 | 
						|
        auto originTensor = input;
 | 
						|
        int basicOffset   = 0;
 | 
						|
        std::vector<int> inputStrides(input->buffer().dimensions);
 | 
						|
        std::vector<int> shape(input->buffer().dimensions);
 | 
						|
        if (op->type() == OpType_Permute) {
 | 
						|
            auto shapeValue = op->main_as_Permute()->dims();
 | 
						|
            for (int i = 0; i < shape.size(); ++i) {
 | 
						|
                shape[i] = shapeValue->data()[i];
 | 
						|
            }
 | 
						|
        } else if (op->type() == OpType_Transpose) {
 | 
						|
            auto shapeValue = inputs[1]->host<int32_t>();
 | 
						|
            for (int i = 0; i < shape.size(); ++i) {
 | 
						|
                shape[i] = shapeValue[i];
 | 
						|
            }
 | 
						|
        } else {
 | 
						|
            MNN_ASSERT(false);
 | 
						|
        }
 | 
						|
        int eleSize = 1;
 | 
						|
        {
 | 
						|
            int stride = 1;
 | 
						|
            for (int i = input->buffer().dimensions - 1; i >= 0; --i) {
 | 
						|
                inputStrides[i] = stride;
 | 
						|
                stride *= input->length(i);
 | 
						|
            }
 | 
						|
            eleSize = stride;
 | 
						|
        }
 | 
						|
        // Select not zero dims
 | 
						|
        std::vector<int> seperateDimIndexes;
 | 
						|
        std::vector<int> outputStrides(input->buffer().dimensions);
 | 
						|
        for (int i = 0; i < shape.size(); ++i) {
 | 
						|
            outputStrides[i] = inputStrides[shape[i]];
 | 
						|
            if (1 != output->length(i)) {
 | 
						|
                seperateDimIndexes.emplace_back(i);
 | 
						|
            }
 | 
						|
        }
 | 
						|
        int basicStride = 1;
 | 
						|
        // Compute inside, outside, axis
 | 
						|
        int inside        = 1;
 | 
						|
        int insideStride  = 0;
 | 
						|
        int outside       = 1;
 | 
						|
        int outsideStride = 0;
 | 
						|
        int axis          = 1;
 | 
						|
        int axisStride    = 0;
 | 
						|
        int breakAxis     = -1;
 | 
						|
        int remainSize    = 1;
 | 
						|
        {
 | 
						|
            if (seperateDimIndexes.size() >= 1) {
 | 
						|
                auto index   = seperateDimIndexes[seperateDimIndexes.size() - 1];
 | 
						|
                inside       = output->length(index);
 | 
						|
                insideStride = outputStrides[index];
 | 
						|
            }
 | 
						|
            if (seperateDimIndexes.size() >= 2) {
 | 
						|
                auto index = seperateDimIndexes[seperateDimIndexes.size() - 2];
 | 
						|
                axis       = output->length(index);
 | 
						|
                axisStride = outputStrides[index];
 | 
						|
            }
 | 
						|
            if (seperateDimIndexes.size() >= 3) {
 | 
						|
                auto index    = seperateDimIndexes[seperateDimIndexes.size() - 3];
 | 
						|
                outside       = output->length(index);
 | 
						|
                outsideStride = outputStrides[index];
 | 
						|
                breakAxis     = (int)seperateDimIndexes.size() - 3;
 | 
						|
                for (int i = 0; i < seperateDimIndexes.size() - 3; ++i) {
 | 
						|
                    remainSize *= output->length(seperateDimIndexes[i]);
 | 
						|
                }
 | 
						|
            }
 | 
						|
        }
 | 
						|
        outputDes->regions.resize(remainSize);
 | 
						|
        outputDes->memoryType = Tensor::InsideDescribe::MEMORY_VIRTUAL;
 | 
						|
        std::vector<int32_t> mod(breakAxis + 1);
 | 
						|
        for (int i = 0; i < breakAxis; ++i) {
 | 
						|
            int value = 1;
 | 
						|
            for (int j = i + 1; j < breakAxis; ++j) {
 | 
						|
                auto index = seperateDimIndexes[j];
 | 
						|
                value *= output->length(index);
 | 
						|
            }
 | 
						|
            mod[i] = value;
 | 
						|
        }
 | 
						|
        for (int indice = 0; indice < remainSize; ++indice) {
 | 
						|
            int value       = indice;
 | 
						|
            int inputOffset = 0;
 | 
						|
            for (int i = 0; i < breakAxis; ++i) {
 | 
						|
                auto coordinate = value / mod[i];
 | 
						|
                auto index      = seperateDimIndexes[i];
 | 
						|
                inputOffset += coordinate * outputStrides[index];
 | 
						|
                value = value % mod[i];
 | 
						|
            }
 | 
						|
            Tensor::InsideDescribe::Region& slice = outputDes->regions[indice];
 | 
						|
            slice.src.offset                      = inputOffset + basicOffset;
 | 
						|
            slice.src.stride[0]                   = outsideStride * basicStride;
 | 
						|
            slice.size[0]                         = outside;
 | 
						|
            slice.src.stride[1]                   = axisStride * basicStride;
 | 
						|
            slice.size[1]                         = axis;
 | 
						|
            slice.src.stride[2]                   = insideStride * basicStride;
 | 
						|
            slice.size[2]                         = inside;
 | 
						|
            slice.origin                          = originTensor;
 | 
						|
            slice.dst.offset                      = indice * outside * axis * inside;
 | 
						|
            slice.dst.stride[0]                   = axis * inside;
 | 
						|
            slice.dst.stride[1]                   = inside;
 | 
						|
            slice.dst.stride[2]                   = 1;
 | 
						|
        }
 | 
						|
        return true;
 | 
						|
    }
 | 
						|
};
 | 
						|
static void _create() {
 | 
						|
    std::shared_ptr<GeometryComputer> comp(new GeometryPermute);
 | 
						|
    GeometryComputer::registerGeometryComputer(comp, {OpType_Transpose, OpType_Permute});
 | 
						|
}
 | 
						|
 | 
						|
REGISTER_GEOMETRY(GeometryPermute, _create);
 | 
						|
}; // namespace MNN
 |