/home/docs/checkouts/readthedocs.org/user_builds/advanced-micro-devices-roccv/checkouts/latest/include/kernels/device/composite_device.hpp Source File

/home/docs/checkouts/readthedocs.org/user_builds/advanced-micro-devices-roccv/checkouts/latest/include/kernels/device/composite_device.hpp Source File

3 min read time

Applies to Linux

rocCV: /home/docs/checkouts/readthedocs.org/user_builds/advanced-micro-devices-roccv/checkouts/latest/include/kernels/device/composite_device.hpp Source File
composite_device.hpp
Go to the documentation of this file.
1 /*
2  * Copyright (c) 2025 Advanced Micro Devices, Inc. All rights reserved.
3  * Permission is hereby granted, free of charge, to any person obtaining a copy
4  * of this software and associated documentation files (the "Software"), to deal
5  * in the Software without restriction, including without limitation the rights
6  * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
7  * copies of the Software, and to permit persons to whom the Software is
8  * furnished to do so, subject to the following conditions:
9  *
10  * The above copyright notice and this permission notice shall be included in
11  * all copies or substantial portions of the Software.
12  *
13  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
14  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
15  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
16  * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
17  * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
18  * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
19  * THE SOFTWARE.
20  */
21 
22 #pragma once
23 
24 #include <hip/hip_runtime.h>
25 
26 #include "core/detail/casting.hpp"
27 
28 namespace Kernels {
29 namespace Device {
30 template <typename SrcWrapper, typename MaskWrapper, typename DstWrapper>
31 __global__ void composite(SrcWrapper foreground, SrcWrapper background, MaskWrapper mask, DstWrapper output) {
32  using namespace roccv::detail; // For RangeCast, NumElements, etc.
33  using src_type = typename SrcWrapper::ValueType;
34  using dst_type = typename DstWrapper::ValueType;
35  using work_type = MakeType<float, NumElements<src_type>>;
36 
37  const int x = blockIdx.x * blockDim.x + threadIdx.x;
38  const int y = blockIdx.y * blockDim.y + threadIdx.y;
39  const int batch = blockIdx.z;
40 
41  if (x >= foreground.width() || y >= foreground.height()) return;
42 
43  // Range cast all input values to float to avoid overflowing values and keep them in the same range.
44  auto maskFactor = RangeCast<float1>(mask.at(batch, y, x, 0));
45  auto fgVal = RangeCast<work_type>(foreground.at(batch, y, x, 0));
46  auto bgVal = RangeCast<work_type>(background.at(batch, y, x, 0));
47 
48  work_type result = bgVal + maskFactor.x * (fgVal - bgVal);
49 
50  // If number of channels in output is 4, ensure that the last channel (alpha in this case) is always fully on.
51  if constexpr (NumElements<dst_type> == 4) {
52  output.at(batch, y, x, 0) = RangeCast<dst_type>((MakeType<float, 4>){result.x, result.y, result.z, 1.0f});
53  } else {
54  output.at(batch, y, x, 0) = RangeCast<dst_type>(result);
55  }
56 }
57 } // namespace Device
58 } // namespace Kernels
__global__ void composite(SrcWrapper foreground, SrcWrapper background, MaskWrapper mask, DstWrapper output)
Definition: composite_device.hpp:31
Definition: non_max_suppression_helpers.hpp:26
Definition: strided_data_wrap.hpp:33
MakeType_t< T, C >::type MakeType
Definition: type_traits.hpp:97