onnxruntime/onnxruntime/test/providers/cpu/tensor/transpose_test.cc

// Copyright (c) Microsoft Corporation. All rights reserved.
// Licensed under the MIT License.

#include "gtest/gtest.h"
#include "test/providers/provider_test_utils.h"
#include "test/providers/compare_provider_test_utils.h"
#include "core/providers/cpu/tensor/transpose.h"

namespace onnxruntime {
namespace test {

TEST(TransposeOpTest, IsTransposeReshapeTest) {
  std::vector<int64_t> input_dims{1, 2, 3, 4, 1};
  std::vector<size_t> perm{0, 1, 2, 3, 4};
  ASSERT_TRUE(IsTransposeReshape(perm, input_dims));
  perm = std::vector<size_t>{1, 2, 3, 0, 4};
  ASSERT_TRUE(IsTransposeReshape(perm, input_dims));
  perm = std::vector<size_t>{4, 1, 0, 2, 3};
  ASSERT_TRUE(IsTransposeReshape(perm, input_dims));
  perm = std::vector<size_t>{4, 1, 0, 3, 2};
  ASSERT_FALSE(IsTransposeReshape(perm, input_dims));
}

// Some of the tests can't run on TensorrtExecutionProvider because of errors.
// Those tests will fallback to other EPs.

template <class T>
void TransposeTest(std::vector<int64_t>& input_shape,
                   std::vector<T>& input_vals,
                   std::vector<int64_t>* p_perm,
                   std::vector<int64_t> expected_shape,
                   std::initializer_list<T>& expected_vals,
                   bool is_tensorrt_supported = true,
                   bool is_openvino_supported = true) {
  OpTester test("Transpose");
  if (nullptr != p_perm)
    test.AddAttribute("perm", *p_perm);
  test.AddInput<T>("X", input_shape, input_vals);
  test.AddOutput<T>("Y", expected_shape, expected_vals);

  // Disable TensorRT on unsupported tests
  std::unordered_set<std::string> excluded_providers;
  if (!is_tensorrt_supported) {
    excluded_providers.insert(kTensorrtExecutionProvider);
  }
  if (!is_openvino_supported) {
    excluded_providers.insert(kOpenVINOExecutionProvider);
  }

  test.Run(OpTester::ExpectResult::kExpectSuccess, "", excluded_providers);
}

// Test 2 dimensional transpose, with no permutation attribute specified
TEST(TransposeOpTest, TwoDimNoAttr) {
  std::vector<int64_t> input_shape({2, 3});
  std::vector<float> input_vals = {
      1.0f, 2.0f, 3.0f,
      4.0f, 5.0f, 6.0f};

  std::vector<int64_t> expected_shape({3, 2});
  auto expected_vals = {
      1.0f, 4.0f,
      2.0f, 5.0f,
      3.0f, 6.0f};

  TransposeTest(input_shape, input_vals, nullptr, expected_shape, expected_vals, false);  //TensorRT: SegFault error
}

TEST(TransposeOpTest, TwoDimNoAttrStr) {
  std::vector<int64_t> input_shape({2, 3});
  std::vector<std::string> input_vals = {
      "1", "2", "3",
      "4", "5", "6"};

  std::vector<int64_t> expected_shape({3, 2});
  std::initializer_list<std::string> expected_vals = {
      "1", "4",
      "2", "5",
      "3", "6"};

  TransposeTest(input_shape, input_vals, nullptr, expected_shape, expected_vals);
}

// Test 2 dimensional transpose, with permutation attribute specified
TEST(TransposeOpTest, TwoDim) {
  std::vector<int64_t> input_shape({2, 3});
  std::vector<float> input_vals = {1.0f, 2.0f, 3.0f,
                                   4.0f, 5.0f, 6.0f};

  std::vector<int64_t> perm = {1, 0};
  std::vector<int64_t> expected_shape({3, 2});
  auto expected_vals = {1.0f, 4.0f,
                        2.0f, 5.0f,
                        3.0f, 6.0f};

  TransposeTest(input_shape, input_vals, &perm, expected_shape, expected_vals);
}

TEST(TransposeOpTest, TwoDim_double) {
  std::vector<int64_t> input_shape({2, 3});
  std::vector<double> input_vals = {1.0, 2.0, 3.0,
                                    4.0, 5.0, 6.0};

  std::vector<int64_t> perm = {1, 0};
  std::vector<int64_t> expected_shape({3, 2});
  std::initializer_list<double> expected_vals = {1.0, 4.0,
                                                 2.0, 5.0,
                                                 3.0, 6.0};

  TransposeTest(input_shape, input_vals, &perm, expected_shape, expected_vals);
}

TEST(TransposeOpTest, TwoDim_int32) {
  std::vector<int64_t> input_shape({2, 3});
  std::vector<int32_t> input_vals = {1, 2, 3,
                                     4, 5, 6};

  std::vector<int64_t> perm = {1, 0};
  std::vector<int64_t> expected_shape({3, 2});
  std::initializer_list<int32_t> expected_vals = {1, 4,
                                                  2, 5,
                                                  3, 6};

  TransposeTest(input_shape, input_vals, &perm, expected_shape, expected_vals);
}

TEST(TransposeOpTest, TwoDim_int16) {
  std::vector<int64_t> input_shape({2, 3});
  std::vector<int16_t> input_vals = {
      1, 2, 3,
      4, 5, 6};

  std::vector<int64_t> perm = {1, 0};
  std::vector<int64_t> expected_shape({3, 2});
  std::initializer_list<int16_t> expected_vals = {
      1, 4,
      2, 5,
      3, 6};

#if defined(OPENVINO_CONFIG_MYRIAD) || defined(OPENVINO_CONFIG_VAD_M)
  TransposeTest(input_shape, input_vals, &perm, expected_shape, expected_vals, true, false);
#else
  TransposeTest(input_shape, input_vals, &perm, expected_shape, expected_vals);
#endif
}

TEST(TransposeOpTest, TwoDim_mlfloat16) {
  std::vector<int64_t> input_shape({2, 3});
  std::vector<MLFloat16> input_vals;
  for (uint16_t i = 0; i < 6; ++i)
    input_vals.push_back(MLFloat16(i));

  std::vector<int64_t> perm = {1, 0};
  std::vector<int64_t> expected_shape({3, 2});
  std::initializer_list<MLFloat16> expected_vals =
      {MLFloat16{static_cast<uint16_t>(1)}, MLFloat16{static_cast<uint16_t>(4)},
       MLFloat16{static_cast<uint16_t>(2)}, MLFloat16{static_cast<uint16_t>(5)},
       MLFloat16{static_cast<uint16_t>(3)}, MLFloat16{static_cast<uint16_t>(6)}};

  TransposeTest(input_shape, input_vals, &perm, expected_shape, expected_vals, false);
}

TEST(TransposeOpTest, TwoDim_int8) {
  std::vector<int64_t> input_shape({2, 3});
  std::vector<int8_t> input_vals = {1, 2, 3,
                                    4, 5, 6};

  std::vector<int64_t> perm = {1, 0};
  std::vector<int64_t> expected_shape({3, 2});
  std::initializer_list<int8_t> expected_vals = {1, 4,
                                                 2, 5,
                                                 3, 6};

  TransposeTest(input_shape, input_vals, &perm, expected_shape, expected_vals, false);
}

TEST(TransposeOpTest, TwoDimStr) {
  std::vector<int64_t> input_shape({2, 3});
  std::vector<std::string> input_vals = {
      "1", "2", "3",
      "4", "5", "6"};

  std::vector<int64_t> perm = {1, 0};
  std::vector<int64_t> expected_shape({3, 2});
  std::initializer_list<std::string> expected_vals = {
      "1", "4",
      "2", "5",
      "3", "6"};

  TransposeTest(input_shape, input_vals, &perm, expected_shape, expected_vals);
}

// Test 3 dimensional transpose, with permutation attribute specified
TEST(TransposeOpTest, ThreeDim) {
  std::vector<int64_t> input_shape({4, 2, 3});
  std::vector<float> input_vals = {
      1.0f, 2.0f, 3.0f,
      4.0f, 5.0f, 6.0f,

      1.1f, 2.1f, 3.1f,
      4.1f, 5.1f, 6.1f,

      1.2f, 2.2f, 3.2f,
      4.2f, 5.2f, 6.2f,

      1.3f, 2.3f, 3.3f,
      4.3f, 5.3f, 6.3f};

  std::vector<int64_t> perm = {0, 2, 1};
  std::vector<int64_t> expected_shape({4, 3, 2});
  auto expected_vals = {
      1.0f, 4.0f,
      2.0f, 5.0f,
      3.0f, 6.0f,

      1.1f, 4.1f,
      2.1f, 5.1f,
      3.1f, 6.1f,

      1.2f, 4.2f,
      2.2f, 5.2f,
      3.2f, 6.2f,

      1.3f, 4.3f,
      2.3f, 5.3f,
      3.3f, 6.3f};

  TransposeTest(input_shape, input_vals, &perm, expected_shape, expected_vals, false);  //TensorRT: illegal error
}

// test when the suffix size is > 1 (last dimension is not moved)
TEST(TransposeOpTest, ThreeDimSuffix) {
  std::vector<int64_t> input_shape({4, 2, 3});
  std::vector<float> input_vals = {
      1.0f, 2.0f, 3.0f,
      4.0f, 5.0f, 6.0f,

      1.1f, 2.1f, 3.1f,
      4.1f, 5.1f, 6.1f,

      1.2f, 2.2f, 3.2f,
      4.2f, 5.2f, 6.2f,

      1.3f, 2.3f, 3.3f,
      4.3f, 5.3f, 6.3f};

  std::vector<int64_t> perm = {1, 0, 2};
  std::vector<int64_t> expected_shape({2, 4, 3});
  auto expected_vals = {
      1.0f, 2.0f, 3.0f,
      1.1f, 2.1f, 3.1f,
      1.2f, 2.2f, 3.2f,
      1.3f, 2.3f, 3.3f,

      4.0f, 5.0f, 6.0f,
      4.1f, 5.1f, 6.1f,
      4.2f, 5.2f, 6.2f,
      4.3f, 5.3f, 6.3f};

  TransposeTest(input_shape, input_vals, &perm, expected_shape, expected_vals, false);  //TensorRT: illegal error
}

TEST(TransposeOpTest, TransposeReshape) {
  std::vector<int64_t> input_shape({1, 4, 2, 1, 3});
  std::vector<float> input_vals = {
      1.0f, 2.0f, 3.0f,
      4.0f, 5.0f, 6.0f,

      1.1f, 2.1f, 3.1f,
      4.1f, 5.1f, 6.1f,

      1.2f, 2.2f, 3.2f,
      4.2f, 5.2f, 6.2f,

      1.3f, 2.3f, 3.3f,
      4.3f, 5.3f, 6.3f};

  std::vector<int64_t> perm = {1, 3, 2, 4, 0};
  std::vector<int64_t> expected_shape({4, 1, 2, 3, 1});
  auto expected_vals = {
      1.0f, 2.0f, 3.0f,
      4.0f, 5.0f, 6.0f,

      1.1f, 2.1f, 3.1f,
      4.1f, 5.1f, 6.1f,

      1.2f, 2.2f, 3.2f,
      4.2f, 5.2f, 6.2f,

      1.3f, 2.3f, 3.3f,
      4.3f, 5.3f, 6.3f};

  TransposeTest(input_shape, input_vals, &perm, expected_shape, expected_vals, false);  //TensorRT: illegal error
}

TEST(TransposeOpTest, ThreeDimStr) {
  std::vector<int64_t> input_shape({4, 2, 3});
  std::vector<std::string> input_vals = {
      "1", "2", "3",
      "4", "5", "6",

      "1", "2", "3",
      "4", "5", "6",

      "1", "2", "3",
      "4", "5", "6",

      "1", "2", "3",
      "4", "5", "6"};

  std::vector<int64_t> perm = {0, 2, 1};
  std::vector<int64_t> expected_shape({4, 3, 2});
  std::initializer_list<std::string> expected_vals = {
      "1", "4",
      "2", "5",
      "3", "6",

      "1", "4",
      "2", "5",
      "3", "6",

      "1", "4",
      "2", "5",
      "3", "6",

      "1", "4",
      "2", "5",
      "3", "6"};

  TransposeTest(input_shape, input_vals, &perm, expected_shape, expected_vals);
}

template <typename T>
static void NumericNCHW2NHWC() {
  std::vector<int64_t> input_shape({1, 3, 2, 2});
  std::vector<T> input_vals = {
      1, 2, 3, 4,
      5, 6, 7, 8,
      9, 10, 11, 12};

  std::vector<int64_t> perm = {0, 2, 3, 1};
  std::vector<int64_t> expected_shape({1, 2, 2, 3});
  std::initializer_list<T> expected_vals = {
      1, 5, 9,
      2, 6, 10,
      3, 7, 11,
      4, 8, 12};

  TransposeTest(input_shape, input_vals, &perm, expected_shape, expected_vals, false);
}
TEST(TransposeOpTest, NCHW2NHWC) {
  NumericNCHW2NHWC<int8_t>();
  NumericNCHW2NHWC<int16_t>();
  NumericNCHW2NHWC<uint32_t>();
  NumericNCHW2NHWC<uint64_t>();
}

TEST(TransposeOpTest, NCHW2NHWCStr) {
  std::vector<int64_t> input_shape({1, 3, 2, 2});
  std::vector<std::string> input_vals = {
      "1", "2", "3", "4",
      "5", "6", "7", "8",
      "9", "10", "11", "12"};

  std::vector<int64_t> perm = {0, 2, 3, 1};
  std::vector<int64_t> expected_shape({1, 2, 2, 3});
  std::initializer_list<std::string> expected_vals = {
      "1", "5", "9",
      "2", "6", "10",
      "3", "7", "11",
      "4", "8", "12"};

  TransposeTest(input_shape, input_vals, &perm, expected_shape, expected_vals, false);
}

template <typename T>
static void NumericNHWC2NCHW() {
  std::vector<int64_t> input_shape({2, 2, 2, 2});
  std::vector<T> input_vals = {
      1, 2,
      3, 4,

      5, 6,
      7, 8,

      9, 10,
      11, 12,

      13, 14,
      15, 16};

  std::vector<int64_t> perm = {0, 3, 1, 2};
  std::vector<int64_t> expected_shape({2, 2, 2, 2});
  std::initializer_list<T> expected_vals = {
      1, 3,
      5, 7,

      2, 4,
      6, 8,

      9, 11,
      13, 15,

      10, 12,
      14, 16};

  TransposeTest(input_shape, input_vals, &perm, expected_shape, expected_vals, false);
}

TEST(TransposeOpTest, NHWC2NCHW) {
  NumericNHWC2NCHW<uint8_t>();
  NumericNHWC2NCHW<int16_t>();
  NumericNHWC2NCHW<uint32_t>();
  NumericNHWC2NCHW<int64_t>();
}

TEST(TransposeOpTest, NHWC2NCHW_String) {
  std::vector<int64_t> input_shape({1, 2, 2, 3});
  std::vector<std::string> input_vals = {
      "1", "2", "3",
      "4", "5", "6",
      "7", "8", "9",
      "10", "11", "12"};

  std::vector<int64_t> perm = {0, 3, 1, 2};
  std::vector<int64_t> expected_shape({1, 3, 2, 2});
  std::initializer_list<std::string> expected_vals = {
      "1", "4", "7", "10",
      "2", "5", "8", "11",
      "3", "6", "9", "12"};

  TransposeTest(input_shape, input_vals, &perm, expected_shape, expected_vals, false);
}

// test to cover memcpy from single axis moving inwards path
TEST(TransposeOpTest, SingleAxisMovingInwardsBlockCopy) {
  std::vector<int64_t> input_shape({2, 2, 2, 2});
  std::vector<uint64_t> input_vals = {
      1, 2,
      3, 4,

      5, 6,
      7, 8,

      9, 10,
      11, 12,

      13, 14,
      15, 16};

  std::vector<int64_t> perm = {1, 2, 0, 3};
  std::vector<int64_t> expected_shape({2, 2, 2, 2});
  std::initializer_list<uint64_t> expected_vals = {
      1, 2,
      9, 10,

      3, 4,
      11, 12,

      5, 6,
      13, 14,

      7, 8,
      15, 16};

  TransposeTest(input_shape, input_vals, &perm, expected_shape, expected_vals, false);
}

TEST(TransposeOpTest, NDim) {
  std::vector<int64_t> input_shape({2, 2, 2, 2});
  std::vector<float> input_vals = {1.0f, 2.0f, 3.0f, 4.0f,
                                   5.0f, 6.0f, 7.0f, 8.0f,
                                   9.0f, 10.0f, 11.0f, 12.0f,
                                   13.0f, 14.0f, 15.0f, 16.0f};

  std::vector<int64_t> perm = {1, 0, 2, 3};
  auto expected_vals = {1.0f, 2.0f, 3.0f, 4.0f,
                        9.0f, 10.0f, 11.0f, 12.0f,
                        5.0f, 6.0f, 7.0f, 8.0f,
                        13.0f, 14.0f, 15.0f, 16.0f};
  TransposeTest(input_shape, input_vals, &perm, input_shape, expected_vals);

  perm = {1, 0, 3, 2};
  auto expected_vals2 = {1.0f, 3.0f, 2.0f, 4.0f,
                         9.0f, 11.0f, 10.0f, 12.0f,
                         5.0f, 7.0f, 6.0f, 8.0f,
                         13.0f, 15.0f, 14.0f, 16.0f};
  TransposeTest(input_shape, input_vals, &perm, input_shape, expected_vals2);
}

TEST(TransposeOpTest, DoTransposeImpl) {
  std::vector<int64_t> input_shape({5, 2, 1, 3});
  std::vector<float> input_vals(30);
  for (auto it = input_vals.begin(); it != input_vals.end(); ++it) {
    *it = static_cast<float>(std::distance(input_vals.begin(), it));
  }
  std::vector<int64_t> perm = {2, 1, 0, 3};
  std::vector<int64_t> expected_shape({1, 2, 5, 3});
  auto expected_vals = {0.0f, 1.0f, 2.0f, 6.0f, 7.0f, 8.0f,
                        12.0f, 13.0f, 14.0f, 18.0f, 19.0f, 20.0f,
                        24.0f, 25.0f, 26.0f, 3.0f, 4.0f, 5.0f,
                        9.0f, 10.0f, 11.0f, 15.0f, 16.0f, 17.0f,
                        21.0f, 22.0f, 23.0f, 27.0f, 28.0f, 29.0f};
  TransposeTest(input_shape, input_vals, &perm, expected_shape, expected_vals);
}

TEST(TransposeOpTest, DoTransposeImplString) {
  std::vector<int64_t> input_shape({5, 2, 1, 3});
  std::vector<std::string> input_vals(30);
  for (auto it = input_vals.begin(); it != input_vals.end(); ++it) {
    *it = std::string("n") + std::to_string(static_cast<int>(std::distance(input_vals.begin(), it)));
  }
  std::vector<int64_t> perm = {2, 1, 0, 3};
  std::vector<int64_t> expected_shape({1, 2, 5, 3});
  std::initializer_list<std::string> expected_vals = {"n0", "n1", "n2", "n6", "n7", "n8",
                                                      "n12", "n13", "n14", "n18", "n19", "n20",
                                                      "n24", "n25", "n26", "n3", "n4", "n5",
                                                      "n9", "n10", "n11", "n15", "n16", "n17",
                                                      "n21", "n22", "n23", "n27", "n28", "n29"};
  TransposeTest(input_shape, input_vals, &perm, expected_shape, expected_vals);
}

TEST(TransposeOpTest, DoTransposeEltWise) {
  // Configuration where DoTransposeEltWise is called.
  std::vector<int64_t> input_shape({2, 2, 2, 2});
  std::vector<float> input_vals = {1.0f, 2.0f, 3.0f, 4.0f,
                                   5.0f, 6.0f, 7.0f, 8.0f,
                                   9.0f, 10.0f, 11.0f, 12.0f,
                                   13.0f, 14.0f, 15.0f, 16.0f};

  std::vector<int64_t> perm = {1, 0, 3, 2};
  auto expected_vals2 = {1.0f, 3.0f, 2.0f, 4.0f,
                         9.0f, 11.0f, 10.0f, 12.0f,
                         5.0f, 7.0f, 6.0f, 8.0f,
                         13.0f, 15.0f, 14.0f, 16.0f};
  TransposeTest(input_shape, input_vals, &perm, input_shape, expected_vals2);

  // Specific test which tests that function DoTransposeEltWise does not
  // copy values outside the target buffer.
  TensorShape tensor_shape(input_shape);
  std::vector<size_t> stride(input_shape.size());
  for (size_t i = 0; i < input_shape.size(); i++) {
    size_t inpdim = perm[i];
    if (inpdim + 1 < input_shape.size())
      stride[i] = tensor_shape.SizeFromDimension(inpdim + 1);
    else
      stride[i] = 1;
  }

  std::vector<float> input_vals_end = {1.0f, 2.0f, 3.0f, 4.0f,
                                       5.0f, 6.0f, 7.0f, 8.0f,
                                       9.0f, 10.0f, 11.0f, 12.0f,
                                       13.0f, 14.0f, 15.0f, 16.0f,
                                       -1.0f, -1.0f};
  std::vector<float> target(input_vals_end.size(), 17.0f);

  std::vector<float> expected_vals3 = {1.0f, 3.0f, 2.0f, 4.0f,
                                       9.0f, 11.0f, 10.0f, 12.0f,
                                       5.0f, 7.0f, 6.0f, 8.0f,
                                       13.0f, 15.0f, 14.0f, 16.0f,
                                       17.0f, 17.0f};

  DoTransposeEltWise(input_shape.size(), input_shape, 16,
                     stride, (uint8_t*)input_vals_end.data(), (uint8_t*)target.data(),
                     sizeof(float));
  for (size_t i = 0; i < input_vals_end.size(); ++i) {
    ASSERT_TRUE(target[i] == expected_vals3[i]);
  }
}

#if USE_CUDA
constexpr const char* kGpuExecutionProvider = kCudaExecutionProvider;
#elif USE_ROCM
constexpr const char* kGpuExecutionProvider = kRocmExecutionProvider;
#endif

#if defined(USE_CUDA) || defined(USE_ROCM)
static void TestTranspose(
    const std::vector<int64_t>& perm,
    const std::vector<int64_t>& x_dims,
    const std::vector<int64_t>& y_dims,
    double error_tolerance = 1e-4) {
  CompareOpTester test{"Transpose"};

  RandomValueGenerator random{};
  const auto X_data = random.Uniform<float>(x_dims, -10.0, 10.0);
  const auto Y_data = FillZeros<float>(y_dims);

  test.AddAttribute("perm", perm);
  test.AddInput("X", x_dims, X_data);
  test.AddOutput("Y", y_dims, Y_data);

  test.CompareWithCPU(kGpuExecutionProvider, error_tolerance);
}

TEST(TransposeOpTest, Transpose0213) {
  const std::vector<int64_t> X_dims{64, 128, 16, 64};
  const std::vector<int64_t> perm{0, 2, 1, 3};
  const std::vector<int64_t> Y_dims{64, 16, 128, 64};
  TestTranspose(perm, X_dims, Y_dims);
}

TEST(TransposeOpTest, Transpose0231) {
  const std::vector<int64_t> X_dims{64, 128, 16, 64};
  const std::vector<int64_t> perm{0, 2, 3, 1};
  const std::vector<int64_t> Y_dims{64, 16, 64, 128};
  TestTranspose(perm, X_dims, Y_dims);
}

TEST(TransposeOpTest, Transpose0312) {
  const std::vector<int64_t> X_dims{64, 16, 64, 128};
  const std::vector<int64_t> perm{0, 3, 1, 2};
  const std::vector<int64_t> Y_dims{64, 128, 16, 64};
  TestTranspose(perm, X_dims, Y_dims);
}
#endif

}  // namespace test
}  // namespace onnxruntime