================ @@ -0,0 +1,142 @@ +//===----------------------------------------------------------------------===// +// +// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. +// See https://llvm.org/LICENSE.txt for license information. +// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception +// +//===----------------------------------------------------------------------===// + +#ifndef _LIBCPP___ALGORITHM_PSTL_BACKENDS_OPENMP_BACKEND_TRANSFORM_H +#define _LIBCPP___ALGORITHM_PSTL_BACKENDS_OPENMP_BACKEND_TRANSFORM_H + +#include <__algorithm/pstl_backends/cpu_backends/backend.h> +#include <__algorithm/pstl_backends/openmp/backend.h> +#include <__algorithm/transform.h> +#include <__config> +#include <__iterator/concepts.h> +#include <__type_traits/is_execution_policy.h> +#include <optional> + +#if !defined(_LIBCPP_HAS_NO_PRAGMA_SYSTEM_HEADER) +# pragma GCC system_header +#endif + +#if !defined(_LIBCPP_HAS_NO_INCOMPLETE_PSTL) && _LIBCPP_STD_VER >= 17 + +_LIBCPP_BEGIN_NAMESPACE_STD + +namespace __par_backend { +inline namespace __omp_gpu_backend { + +//===----------------------------------------------------------------------===// +// Templates for two iterators +//===----------------------------------------------------------------------===// + +template <class _Tp, class _DifferenceType, class _Up, class _Function> +_LIBCPP_HIDE_FROM_ABI optional<__empty> +__omp_parallel_for_simd(_Tp* __first1, _DifferenceType __n, _Up* __first2, _Function __f) noexcept { + __omp_gpu_backend::__omp_map_alloc(__first2, __n); + __omp_gpu_backend::__omp_map_to(__first1, __n); +# pragma omp target teams distribute parallel for simd + for (_DifferenceType __i = 0; __i < __n; ++__i) + *(__first2 + __i) = __f(*(__first1 + __i)); + __omp_gpu_backend::__omp_map_from(__first2, __n); + __omp_gpu_backend::__omp_map_free(__first1, __n); + return __empty{}; +} + +// Extracting the underlying pointer + +template <class _Iterator1, class _DifferenceType, class _Iterator2, class _Function> +_LIBCPP_HIDE_FROM_ABI optional<__empty> +__parallel_for_simd(_Iterator1 __first1, _DifferenceType __n, _Iterator2 __first2, _Function __f) noexcept { + return __omp_gpu_backend::__omp_parallel_for_simd( + __omp_gpu_backend::__omp_extract_base_ptr(__first1), + __n, + __omp_gpu_backend::__omp_extract_base_ptr(__first2), + __f); +} + +//===----------------------------------------------------------------------===// +// Templates for three iterator +//===----------------------------------------------------------------------===// + +template <class _Tp, class _DifferenceType, class _Up, class _Vp, class _Function> +_LIBCPP_HIDE_FROM_ABI optional<__empty> +__omp_parallel_for_simd(_Tp* __first1, _DifferenceType __n, _Up* __first2, _Vp* __first3, _Function __f) noexcept { + __omp_gpu_backend::__omp_map_to(__first1, __n); + __omp_gpu_backend::__omp_map_to(__first2, __n); + __omp_gpu_backend::__omp_map_alloc(__first3, __n); +# pragma omp target teams distribute parallel for simd + for (_DifferenceType __i = 0; __i < __n; ++__i) + *(__first3 + __i) = __f(*(__first1 + __i), *(__first2 + __i)); + __omp_gpu_backend::__omp_map_free(__first1, __n); + __omp_gpu_backend::__omp_map_free(__first2, __n); + __omp_gpu_backend::__omp_map_from(__first3, __n); + return __empty{}; +} + +// Extracting the underlying pointer + +template <class _Iterator1, class _DifferenceType, class _Iterator2, class _Iterator3, class _Function> +_LIBCPP_HIDE_FROM_ABI optional<__empty> __parallel_for_simd( + _Iterator1 __first1, _DifferenceType __n, _Iterator2 __first2, _Iterator3 __first3, _Function __f) noexcept { + return __omp_gpu_backend::__omp_parallel_for_simd( + __omp_gpu_backend::__omp_extract_base_ptr(__first1), + __n, + __omp_gpu_backend::__omp_extract_base_ptr(__first2), + __omp_gpu_backend::__omp_extract_base_ptr(__first3), + __f); +} + +} // namespace __omp_gpu_backend +} // namespace __par_backend + +template <class _ExecutionPolicy, class _ForwardIterator, class _ForwardOutIterator, class _UnaryOperation> +_LIBCPP_HIDE_FROM_ABI optional<_ForwardOutIterator> __pstl_transform( + __omp_backend_tag, + _ForwardIterator __first, + _ForwardIterator __last, + _ForwardOutIterator __result, + _UnaryOperation __op) { + if constexpr (__is_unsequenced_execution_policy_v<_ExecutionPolicy> && + __is_parallel_execution_policy_v<_ExecutionPolicy> && + __libcpp_is_contiguous_iterator<_ForwardIterator>::value && + __libcpp_is_contiguous_iterator<_ForwardOutIterator>::value) { + std::__par_backend::__parallel_for_simd(__first, __last - __first, __result, __op); ---------------- ldionne wrote:
```suggestion std::__omp_parallel_for_simd(std::__unrwap_iter(__first), __last - __first, __result, __op); ``` And then `__parallel_for_simd` goes away too. https://github.com/llvm/llvm-project/pull/66968 _______________________________________________ cfe-commits mailing list cfe-commits@lists.llvm.org https://lists.llvm.org/cgi-bin/mailman/listinfo/cfe-commits