transpose op: perm as input tensor

dboyliao · dboyliao · commit bfa4cb66d573 · 2020-11-20T19:34:52.000+08:00
diff --git a/TESTS/operators/constants_transpose.hpp b/TESTS/operators/constants_transpose.hpp
@@ -1,8 +1,18 @@
 #ifndef _TRANSPOSE_TEST_H
 #define _TRANSPOSE_TEST_H
 
-static const unsigned short transpose_axes_arr[3] = { 2,1,0 };
-static const float random_input_arr[15] = { 3.484638214111328, 2.033799886703491, 3.2437448501586914, 4.783249855041504, 3.497023582458496, 3.511240005493164, 1.558927297592163, 3.7084484100341797, 2.570117712020874, 0.2405869960784912, 1.8713605403900146, 4.19132661819458, 0.6596618890762329, 0.9029078483581543, 0.2223271131515503 };
-static const float ref_output_arr[15] = { 3.484638214111328, 3.511240005493164, 1.8713605403900146, 2.033799886703491, 1.558927297592163, 4.19132661819458, 3.2437448501586914, 3.7084484100341797, 0.6596618890762329, 4.783249855041504, 2.570117712020874, 0.9029078483581543, 3.497023582458496, 0.2405869960784912, 0.2223271131515503 };
+static const int32_t transpose_perm_arr[4] = {2, 1, 0, 3};
+static const float random_input_arr[15] = {
+    3.484638214111328,  2.033799886703491,  3.2437448501586914,
+    4.783249855041504,  3.497023582458496,  3.511240005493164,
+    1.558927297592163,  3.7084484100341797, 2.570117712020874,
+    0.2405869960784912, 1.8713605403900146, 4.19132661819458,
+    0.6596618890762329, 0.9029078483581543, 0.2223271131515503};
+static const float ref_output_arr[15] = {
+    3.484638214111328,  3.511240005493164,  1.8713605403900146,
+    2.033799886703491,  1.558927297592163,  4.19132661819458,
+    3.2437448501586914, 3.7084484100341797, 0.6596618890762329,
+    4.783249855041504,  2.570117712020874,  0.9029078483581543,
+    3.497023582458496,  0.2405869960784912, 0.2223271131515503};
 
-#endif // _TRANSPOSE
+#endif  // _TRANSPOSE_TEST_H
diff --git a/TESTS/operators/test_transpose.cpp b/TESTS/operators/test_transpose.cpp
@@ -2,8 +2,8 @@
 #include <iostream>
 
 #include "RamTensor.hpp"
-#include "Transpose.hpp"
 #include "RomTensor.hpp"
+#include "Transpose.hpp"
 #include "arenaAllocator.hpp"
 #include "constants_transpose.hpp"
 #include "context.hpp"
@@ -19,19 +19,19 @@ TEST(Transpose, transpose_test) {
   localCircularArenaAllocator<15 * 2 * sizeof(float), uint32_t> ram_allocator;
   Context::get_default_context()->set_metadata_allocator(&meta_allocator);
   Context::get_default_context()->set_ram_data_allocator(&ram_allocator);
-  
+
   Tensor input_tensor = new RomTensor({3, 1, 5, 1}, flt, random_input_arr);
+  Tensor perm_tensor = new RomTensor({4}, i32, transpose_perm_arr);
 
   TensorShape input_target_shape(3, 1, 5, 1);
   TensorShape input_shape = input_tensor->get_shape();
   EXPECT_TRUE(input_target_shape == input_shape);
 
-  Tensor transpose_axes = new RomTensor({4}, u8, transpose_axes_arr);
   Tensor output_tensor = new RamTensor(flt);
-  TransposeOperator<float> op({2,1,0,3});
-
+  TransposeOperator<float> op;
 
-  op.set_inputs({{TransposeOperator<float>::input, input_tensor}})
+  op.set_inputs({{TransposeOperator<float>::input, input_tensor},
+                 {TransposeOperator<float>::perm, perm_tensor}})
       .set_outputs({{TransposeOperator<float>::output, output_tensor}})
       .eval();
 
diff --git a/src/uTensor/ops/Transpose.hpp b/src/uTensor/ops/Transpose.hpp
@@ -1,30 +1,38 @@
 #ifndef UTENSOR_TRANSPOSE_H
 #define UTENSOR_TRANSPOSE_H
 
+#include <cstring>
+
 #include "context.hpp"
-#include "types.hpp"
+#include "operatorBase.hpp"
 #include "tensor.hpp"
+#include "types.hpp"
 #include "uTensor_util.hpp"
-#include "operatorBase.hpp"
-
-#include <cstring>
 
 namespace uTensor {
 namespace ReferenceOperators {
 
 // Transpose (Swap Axes) as a port from Numpy
 // using stride interation in the order of transpose axes
 template <typename Tin>
-class TransposeOperator : public OperatorInterface<1, 1> {
-/* reshape input as the shape of output*/
-public:
-  TransposeOperator(const TensorShape&& axes) : _axes(axes) {}
-  TransposeOperator(const TensorShape& axes) : _axes(axes) {}
-  
-  enum names_in : uint8_t { input };
+class TransposeOperator : public OperatorInterface<2, 1> {
+  /* reshape input as the shape of output*/
+ public:
+  enum names_in : uint8_t { input, perm };
   enum names_out : uint8_t { output };
 
-  virtual void compute(){
+  virtual void compute() {
+    Tensor& perm_tensor = inputs[perm].tensor();
+    if (perm_tensor.get_shape().num_dims() > 1) {
+      uTensor_printf(
+          "the input tensor perm should be a vector (dimension should be 1)\n");
+      Context::get_default_context()->throwError(new InvalidTensorInputError);
+    }
+    if (perm_tensor->get_type() != i32) {
+      uTensor_printf("expecting perm tensor of element type int32_t\n");
+      Context::get_default_context()->throwError(
+          new InvalidTensorDataTypeError);
+    }
     Tensor& input_tensor = inputs[input].tensor();
     TensorShape& input_shape = input_tensor.get_shape();
     input_shape.update_dims();
@@ -36,78 +44,80 @@ class TransposeOperator : public OperatorInterface<1, 1> {
     Tensor& output_tensor = outputs[output].tensor();
 
     // Create a placeholder to calculate the output shape
-    // Normally this would reference output shape, but since this could (usually would) be referencing the input, let's keep a dedicated value
-    TensorShape output_shape = TensorShape(1,1,1,1);
+    // Normally this would reference output shape, but since this could (usually
+    // would) be referencing the input, let's keep a dedicated value
+    TensorShape output_shape = TensorShape(1, 1, 1, 1);
     TensorStrides output_strides = TensorStrides(output_shape);
     TensorShape offsets = TensorShape(input_shape.num_dims());
 
-    for (size_t i = 0; i < 4; ++i) { 
+    for (size_t i = 0; i < 4; ++i) {
       output_shape[i] = 0;
       output_strides[i] = 0;
 
       // Offsets are used to avoid multiple for loops
       offsets[i] = 0;
     }
 
-    for (size_t i = 0; i < (size_t) input_shape.num_dims(); ++i) { 
-      output_shape[_axes[i]] = input_shape[i];
+    for (size_t i = 0; i < (size_t)input_shape.num_dims(); ++i) {
+      int32_t axis = static_cast<int32_t>(perm_tensor(i));
+      output_shape[axis] = input_shape[i];
 
       // output_strides(i) is derived from axes and input_strides
-      output_strides[_axes[i]] = input_strides[i];
+      output_strides[axis] = input_strides[i];
     }
-    
-    // Output shape can be asserted once the transform 
+
+    // Output shape can be asserted once the transform
     // effect has been determined
     output_shape.update_dims();
     output_tensor->resize(output_shape);
 
     // Perform some basic checks
-    if (input_tensor->num_elems() != output_tensor->num_elems()){
-        uTensor_printf("inconsistent input and output shape for reshape\n");
-        Context::get_default_context()->throwError(new InvalidReshapeError);
-        return;
-    }    
-    if (input_tensor->get_type() != output_tensor->get_type()){
-        uTensor_printf("inconsistent input and output data type for reshape\n");
-        Context::get_default_context()->throwError(new InvalidTensorDataTypeError);
-        return;
+    if (input_tensor->num_elems() != output_tensor->num_elems()) {
+      uTensor_printf("inconsistent input and output shape for reshape\n");
+      Context::get_default_context()->throwError(new InvalidReshapeError);
+      return;
+    }
+    if (input_tensor->get_type() != output_tensor->get_type()) {
+      uTensor_printf("inconsistent input and output data type for reshape\n");
+      Context::get_default_context()->throwError(
+          new InvalidTensorDataTypeError);
+      return;
     }
-    if (!_check_input_shape()){
-        Context::get_default_context()->throwError(new InvalidTensorDataTypeError);
-        return;
+    if (!_check_input_shape()) {
+      Context::get_default_context()->throwError(
+          new InvalidTensorDataTypeError);
+      return;
     }
 
     // copy data
-    for (uint32_t i = 0; i < input_tensor->num_elems(); ++i) { 
-        // Index of the source value, must be calculated
-        // using the output strides and output shape
-        uint32_t idx = 0;
-        for (uint32_t j = 0; j < output_shape.num_dims(); j++) {
-            idx += offsets[j] * output_strides[j];
-        }
-
-        // this is not copy: `output_tensor(i) = input_tensor(i);`
-        output_tensor(i) = static_cast<Tin>(input_tensor(idx));
+    for (uint32_t i = 0; i < input_tensor->num_elems(); ++i) {
+      // Index of the source value, must be calculated
+      // using the output strides and output shape
+      uint32_t idx = 0;
+      for (uint32_t j = 0; j < output_shape.num_dims(); j++) {
+        idx += offsets[j] * output_strides[j];
+      }
 
-        // Update offsets, to iterate sequentially along strides
-        // in the order of axes
-        for (int32_t j = output_shape.num_dims() - 1; j >= 0; j--) {
-            offsets[j] = (offsets[j] + 1) % (output_shape[j]);
-            if( offsets[j] > 0 ) {
-                break;
-            }
-        }        
-    }  
+      // this is not copy: `output_tensor(i) = input_tensor(i);`
+      output_tensor(i) = static_cast<Tin>(input_tensor(idx));
 
+      // Update offsets, to iterate sequentially along strides
+      // in the order of axes
+      for (int32_t j = output_shape.num_dims() - 1; j >= 0; j--) {
+        offsets[j] = (offsets[j] + 1) % (output_shape[j]);
+        if (offsets[j] > 0) {
+          break;
+        }
+      }
+    }
   }
-private:
-  TensorShape _axes;
 
-  bool _check_input_shape(){
+ private:
+  bool _check_input_shape() {
     const Tensor& input_tensor = inputs[input].tensor();
     const TensorShape& shape = input_tensor->get_shape();
     uint8_t num_dims = shape.num_dims();
-    for (int i = 0; i < num_dims; ++i){
+    for (int i = 0; i < num_dims; ++i) {
       if (shape[i] < 0) {
         uTensor_printf("the output shape must be all positive\n");
         return false;
@@ -117,7 +127,7 @@ class TransposeOperator : public OperatorInterface<1, 1> {
   }
 };
 
-}
-}
+}  // namespace ReferenceOperators
+}  // namespace uTensor
 
-#endif // UTENSOR_TRANSPOSE_H
+#endif  // UTENSOR_TRANSPOSE_H