/home/docs/checkouts/readthedocs.org/user_builds/advanced-micro-devices-roccv/checkouts/latest/include/kernels/device/copy_make_border_device.hpp Source File

/home/docs/checkouts/readthedocs.org/user_builds/advanced-micro-devices-roccv/checkouts/latest/include/kernels/device/copy_make_border_device.hpp Source File#

2 min read time

Applies to Linux

rocCV: /home/docs/checkouts/readthedocs.org/user_builds/advanced-micro-devices-roccv/checkouts/latest/include/kernels/device/copy_make_border_device.hpp Source File
copy_make_border_device.hpp
Go to the documentation of this file.
1 /*
2  * Copyright (c) 2025 Advanced Micro Devices, Inc. All rights reserved.
3  * Permission is hereby granted, free of charge, to any person obtaining a copy
4  * of this software and associated documentation files (the "Software"), to deal
5  * in the Software without restriction, including without limitation the rights
6  * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
7  * copies of the Software, and to permit persons to whom the Software is
8  * furnished to do so, subject to the following conditions:
9  *
10  * The above copyright notice and this permission notice shall be included in
11  * all copies or substantial portions of the Software.
12  *
13  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
14  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
15  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
16  * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
17  * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
18  * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
19  * THE SOFTWARE.
20  */
21 
22 #pragma once
23 
24 #include <hip/hip_runtime.h>
25 
26 namespace Kernels {
27 namespace Device {
39 template <typename SrcDesc, typename DstDesc>
40 __global__ void copy_make_border(SrcDesc src, DstDesc dst, int32_t top, int32_t left) {
41  int x = blockIdx.x * blockDim.x + threadIdx.x;
42  int y = blockIdx.y * blockDim.y + threadIdx.y;
43  int b = blockIdx.z;
44 
45  if (x >= dst.width() || y >= dst.height() || b >= dst.batches()) return;
46 
47  dst.at(b, y, x, 0) = src.at(b, y - top, x - left, 0);
48 }
49 } // namespace Device
50 } // namespace Kernels
__global__ void copy_make_border(SrcDesc src, DstDesc dst, int32_t top, int32_t left)
GPU kernel for CopyMakeBorder operator.
Definition: copy_make_border_device.hpp:40
Definition: non_max_suppression_helpers.hpp:26