94 lines
2.9 KiB
Plaintext
94 lines
2.9 KiB
Plaintext
|
/*
|
||
|
* Copyright 2008-2012 NVIDIA Corporation
|
||
|
*
|
||
|
* Licensed under the Apache License, Version 2.0 (the "License");
|
||
|
* you may not use this file except in compliance with the License.
|
||
|
* You may obtain a copy of the License at
|
||
|
*
|
||
|
* http://www.apache.org/licenses/LICENSE-2.0
|
||
|
*
|
||
|
* Unless required by applicable law or agreed to in writing, software
|
||
|
* distributed under the License is distributed on an "AS IS" BASIS,
|
||
|
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||
|
* See the License for the specific language governing permissions and
|
||
|
* limitations under the License.
|
||
|
*/
|
||
|
|
||
|
|
||
|
#include <thrust/detail/config.h>
|
||
|
#include <thrust/system/omp/detail/reduce_intervals.h>
|
||
|
#include <thrust/iterator/iterator_traits.h>
|
||
|
#include <thrust/detail/function.h>
|
||
|
#include <thrust/detail/cstdint.h>
|
||
|
|
||
|
namespace thrust
|
||
|
{
|
||
|
namespace system
|
||
|
{
|
||
|
namespace omp
|
||
|
{
|
||
|
namespace detail
|
||
|
{
|
||
|
|
||
|
template <typename DerivedPolicy,
|
||
|
typename InputIterator,
|
||
|
typename OutputIterator,
|
||
|
typename BinaryFunction,
|
||
|
typename Decomposition>
|
||
|
void reduce_intervals(execution_policy<DerivedPolicy> &,
|
||
|
InputIterator input,
|
||
|
OutputIterator output,
|
||
|
BinaryFunction binary_op,
|
||
|
Decomposition decomp)
|
||
|
{
|
||
|
// we're attempting to launch an omp kernel, assert we're compiling with omp support
|
||
|
// ========================================================================
|
||
|
// X Note to the user: If you've found this line due to a compiler error, X
|
||
|
// X you need to enable OpenMP support in your compiler. X
|
||
|
// ========================================================================
|
||
|
THRUST_STATIC_ASSERT( (thrust::detail::depend_on_instantiation<InputIterator,
|
||
|
(THRUST_DEVICE_COMPILER_IS_OMP_CAPABLE == THRUST_TRUE)>::value) );
|
||
|
|
||
|
#if (THRUST_DEVICE_COMPILER_IS_OMP_CAPABLE == THRUST_TRUE)
|
||
|
typedef typename thrust::iterator_value<OutputIterator>::type OutputType;
|
||
|
|
||
|
// wrap binary_op
|
||
|
thrust::detail::host_function<BinaryFunction,OutputType> wrapped_binary_op(binary_op);
|
||
|
|
||
|
typedef thrust::detail::intptr_t index_type;
|
||
|
|
||
|
index_type n = static_cast<index_type>(decomp.size());
|
||
|
|
||
|
#if (THRUST_DEVICE_COMPILER_IS_OMP_CAPABLE == THRUST_TRUE)
|
||
|
# pragma omp parallel for
|
||
|
#endif // THRUST_DEVICE_COMPILER_IS_OMP_CAPABLE
|
||
|
for(index_type i = 0; i < n; i++)
|
||
|
{
|
||
|
InputIterator begin = input + decomp[i].begin();
|
||
|
InputIterator end = input + decomp[i].end();
|
||
|
|
||
|
if (begin != end)
|
||
|
{
|
||
|
OutputType sum = thrust::raw_reference_cast(*begin);
|
||
|
|
||
|
++begin;
|
||
|
|
||
|
while (begin != end)
|
||
|
{
|
||
|
sum = wrapped_binary_op(sum, *begin);
|
||
|
++begin;
|
||
|
}
|
||
|
|
||
|
OutputIterator tmp = output + i;
|
||
|
*tmp = sum;
|
||
|
}
|
||
|
}
|
||
|
#endif // THRUST_DEVICE_COMPILER_IS_OMP_CAPABLE
|
||
|
}
|
||
|
|
||
|
} // end namespace detail
|
||
|
} // end namespace omp
|
||
|
} // end namespace system
|
||
|
} // end namespace thrust
|
||
|
|