xref: /aosp_15_r20/external/ComputeLibrary/tests/validation/reference/Col2Im.cpp (revision c217d954acce2dbc11938adb493fc0abd69584f3)
1  /*
2   * Copyright (c) 2018-2020 Arm Limited.
3   *
4   * SPDX-License-Identifier: MIT
5   *
6   * Permission is hereby granted, free of charge, to any person obtaining a copy
7   * of this software and associated documentation files (the "Software"), to
8   * deal in the Software without restriction, including without limitation the
9   * rights to use, copy, modify, merge, publish, distribute, sublicense, and/or
10   * sell copies of the Software, and to permit persons to whom the Software is
11   * furnished to do so, subject to the following conditions:
12   *
13   * The above copyright notice and this permission notice shall be included in all
14   * copies or substantial portions of the Software.
15   *
16   * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17   * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18   * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
19   * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
20   * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
21   * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
22   * SOFTWARE.
23   */
24  #include "Col2Im.h"
25  
26  #include "tests/validation/Helpers.h"
27  #include "tests/validation/reference/Utils.h"
28  
29  namespace arm_compute
30  {
31  namespace test
32  {
33  namespace validation
34  {
35  namespace reference
36  {
37  template <typename T>
col2im(const SimpleTensor<T> & src,const TensorShape & dst_shape,unsigned int num_groups)38  SimpleTensor<T> col2im(const SimpleTensor<T> &src, const TensorShape &dst_shape, unsigned int num_groups)
39  {
40      SimpleTensor<T> dst{ dst_shape, src.data_type(), 1 };
41  
42      // Compute reference
43      const size_t batches    = dst_shape.total_size() / (dst_shape.x() * dst_shape.y() * dst_shape.z());
44      const size_t src_width  = src.shape().x();
45      const size_t src_height = src.shape().y();
46  
47      if(num_groups == 1)
48      {
49          // Batches are on the 3rd dimension of the input tensor
50  #if defined(_OPENMP)
51          #pragma omp parallel for collapse(3)
52  #endif /* _OPENMP */
53          for(size_t b = 0; b < batches; ++b)
54          {
55              for(size_t x = 0; x < src_width; ++x)
56              {
57                  for(size_t y = 0; y < src_height; ++y)
58                  {
59                      const int dst_idx = y + x * src_height + b * src_height * src_width;
60                      dst[dst_idx]      = src[coord2index(src.shape(), Coordinates(x, y, b))];
61                  }
62              }
63          }
64      }
65      else
66      {
67  #if defined(_OPENMP)
68          #pragma omp parallel for collapse(4)
69  #endif /* _OPENMP */
70          for(size_t b = 0; b < batches; ++b)
71          {
72              for(size_t g = 0; g < num_groups; ++g)
73              {
74                  for(size_t x = 0; x < src_width; ++x)
75                  {
76                      for(size_t y = 0; y < src_height; ++y)
77                      {
78                          const int dst_idx = y + x * src_height + g * src_height * src_width + b * src_height * src_width * num_groups;
79                          dst[dst_idx]      = src[coord2index(src.shape(), Coordinates(x, y, g, b))];
80                      }
81                  }
82              }
83          }
84      }
85      return dst;
86  }
87  
88  template SimpleTensor<float> col2im(const SimpleTensor<float> &src, const TensorShape &dst_shape, unsigned int num_groups);
89  template SimpleTensor<half> col2im(const SimpleTensor<half> &src, const TensorShape &dst_shape, unsigned int num_groups);
90  template SimpleTensor<uint8_t> col2im(const SimpleTensor<uint8_t> &src, const TensorShape &dst_shape, unsigned int num_groups);
91  } // namespace reference
92  } // namespace validation
93  } // namespace test
94  } // namespace arm_compute
95