/home/docs/checkouts/readthedocs.org/user_builds/advanced-micro-devices-roccv/checkouts/latest/include/core/detail/casting.hpp Source File

/home/docs/checkouts/readthedocs.org/user_builds/advanced-micro-devices-roccv/checkouts/latest/include/core/detail/casting.hpp Source File

7 min read time
Applies to Linux
rocCV: /home/docs/checkouts/readthedocs.org/user_builds/advanced-micro-devices-roccv/checkouts/latest/include/core/detail/casting.hpp Source File
Go to the documentation of this file.
 /*
  * Copyright (c) 2025 Advanced Micro Devices, Inc. All rights reserved.
  * Permission is hereby granted, free of charge, to any person obtaining a copy
  * of this software and associated documentation files (the "Software"), to deal
  * in the Software without restriction, including without limitation the rights
  * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
  * copies of the Software, and to permit persons to whom the Software is
  * furnished to do so, subject to the following conditions:
  *
  * The above copyright notice and this permission notice shall be included in
  * all copies or substantial portions of the Software.
  *
  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
  * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
  * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
  * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
  * THE SOFTWARE.
  */
  
 #pragma once
  
 #include <algorithm>
  
 #include "core/detail/type_traits.hpp"
  
 namespace roccv::detail {
  
 template <typename T, typename U, class = std::enable_if_t<!IsCompound<T> && !IsCompound<U>>>
 __device__ __host__ T ScalarSaturateCast(U v) {
     constexpr bool smallToBig = sizeof(U) <= sizeof(T);
     constexpr bool bigToSmall = !smallToBig;
  
     if constexpr (std::is_integral_v<T> && std::is_floating_point_v<U>) {
         // Any float -> any integral
         return static_cast<T>(std::clamp<U>(std::round(v), static_cast<U>(std::numeric_limits<T>::min()),
                                             static_cast<U>(std::numeric_limits<T>::max())));
     } else if constexpr (std::is_integral_v<T> && std::is_integral_v<U> && std::is_signed_v<U> && std::is_signed_v<T> &&
                          smallToBig) {
         // Any integral signed -> Any integral unsigned, small -> big or equal
         return v <= 0 ? 0 : static_cast<T>(v);
     } else if constexpr (std::is_integral_v<U> && std::is_integral_v<T> &&
                          ((std::is_signed_v<U> && std::is_signed_v<T>) ||
                           (std::is_unsigned_v<U> && std::is_unsigned_v<T>)) &&
                          bigToSmall) {
         // Any integral signed -> Any integral signed, big -> small
         // Any integral unsigned -> Any integral unsigned, big -> small
         return v <= std::numeric_limits<T>::min()
                    ? std::numeric_limits<T>::min()
                    : (v >= std::numeric_limits<T>::max() ? std::numeric_limits<T>::max() : static_cast<T>(v));
     } else if constexpr (std::is_integral_v<U> && std::is_unsigned_v<U> && std::is_integral_v<T> &&
                          std::is_signed_v<T>) {
         // Any integral unsigned -> Any integral signed, small -> big or equal
         return v >= std::numeric_limits<T>::max() ? std::numeric_limits<T>::max() : static_cast<T>(v);
     } else if constexpr (std::is_integral_v<U> && std::is_signed_v<U> && std::is_integral_v<T> &&
                          std::is_unsigned_v<T> && bigToSmall) {
         // Any integral signed -> Any integral unsigned, big -> small
         return v <= static_cast<U>(std::numeric_limits<T>::min())
                    ? std::numeric_limits<T>::min()
                    : (v >= static_cast<U>(std::numeric_limits<T>::max()) ? std::numeric_limits<T>::max
                                                                          : static_cast<T>(v));
     } else {
         // All other cases fall into this
         return v;
     }
 }
  
 template <typename T, typename U,
           class = std::enable_if_t<(HasTypeTraits<T> && HasTypeTraits<U>) && (NumElements<T> <= NumElements<U>)>>
 __device__ __host__ T SaturateCast(U v) {
     if constexpr (std::is_same_v<T, U>) {
         return v;
     }
  
     T ret{};
  
     GetElement(ret, 0) = ScalarSaturateCast<BaseType<T>>(GetElement(v, 0));
     if constexpr (NumElements<T> >= 2) GetElement(ret, 1) = ScalarSaturateCast<BaseType<T>>(GetElement(v, 1));
     if constexpr (NumElements<T> >= 3) GetElement(ret, 2) = ScalarSaturateCast<BaseType<T>>(GetElement(v, 2));
     if constexpr (NumElements<T> >= 4) GetElement(ret, 3) = ScalarSaturateCast<BaseType<T>>(GetElement(v, 3));
  
     return ret;
 }
  
 template <typename T, typename U,
           class = std::enable_if_t<(HasTypeTraits<T> && HasTypeTraits<U>) && (!IsCompound<T> && !IsCompound<U>)>>
 __device__ __host__ T ScalarRangeCast(U v) {
     if constexpr (std::is_same_v<T, U>) {
         // Types are the same, no work needed
         return v;
     }
  
     else if constexpr (std::is_integral_v<T> && std::is_floating_point_v<U> && std::is_signed_v<T>) {
         // Float to signed integers
         return v >= T{1}    ? std::numeric_limits<T>::max()
                : v <= T{-1} ? std::numeric_limits<T>::min()
                             : static_cast<T>(std::round(static_cast<U>(std::numeric_limits<T>::max()) * v));
     }
  
     else if constexpr (std::is_integral_v<T> && std::is_floating_point_v<U> && std::is_unsigned_v<T>) {
         // float to unsigned integers
         return v >= T{1}   ? std::numeric_limits<T>::max()
                : v <= T{0} ? 0
                            : static_cast<T>(lrintf(static_cast<U>(std::numeric_limits<T>::max()) * v));
     }
  
     else if constexpr (std::is_floating_point_v<T> && std::is_integral_v<U> && std::is_signed_v<U>) {
         // Signed integer to float
         constexpr T invmax = T{1} / static_cast<T>(std::numeric_limits<U>::max());
         T out = static_cast<T>(v) * invmax;
         return out < T{-1} ? T{-1} : out;
     }
  
     else if constexpr (std::is_floating_point_v<T> && std::is_integral_v<U> && std::is_unsigned_v<U>) {
         // Unsigned integer to float
         constexpr T invmax = T{1} / static_cast<T>(std::numeric_limits<U>::max());
         return static_cast<T>(v) * invmax;
     }
  
     else {
         // All other cases reduce to a saturate cast
         return ScalarSaturateCast<T>(v);
     }
 }
  
 template <typename T, typename U,
           class = std::enable_if_t<(HasTypeTraits<T> && HasTypeTraits<U>) && NumElements<T> <= NumElements<U>>>
 __device__ __host__ T RangeCast(U v) {
     if constexpr (std::is_same_v<T, U>) {
         return v;
     }
  
     T ret{};
  
     GetElement(ret, 0) = ScalarRangeCast<BaseType<T>>(GetElement(v, 0));
     if constexpr (NumElements<T> >= 2) GetElement(ret, 1) = ScalarRangeCast<BaseType<T>>(GetElement(v, 1));
     if constexpr (NumElements<T> >= 3) GetElement(ret, 2) = ScalarRangeCast<BaseType<T>>(GetElement(v, 2));
     if constexpr (NumElements<T> >= 4) GetElement(ret, 3) = ScalarRangeCast<BaseType<T>>(GetElement(v, 3));
  
     return ret;
 }
  
 template <typename T, typename U,
           class = std::enable_if_t<(HasTypeTraits<T> && HasTypeTraits<U>) && NumElements<T> <= NumElements<U>>>
 __device__ __host__ T StaticCast(U v) {
     if constexpr (std::is_same_v<T, U>) {
         // Both same type, just return the value.
         return v;
     } else if constexpr (!IsCompound<T> && !IsCompound<U>) {
         // Both scalar values. Reduces to a standard static cast.
         return static_cast<T>(v);
     } else {
         // Vector types. Perform casting on each element.
         T ret{};
         GetElement(ret, 0) = StaticCast<BaseType<T>>(GetElement(v, 0));
         if constexpr (NumElements<T> >= 2) GetElement(ret, 1) = StaticCast<BaseType<T>>(GetElement(v, 1));
         if constexpr (NumElements<T> >= 3) GetElement(ret, 2) = StaticCast<BaseType<T>>(GetElement(v, 2));
         if constexpr (NumElements<T> >= 4) GetElement(ret, 3) = StaticCast<BaseType<T>>(GetElement(v, 3));
  
         return ret;
     }
 }
 }  // namespace roccv::detail