/*
 *  Copyright 2008-2012 NVIDIA Corporation
 *
 *  Licensed under the Apache License, Version 2.0 (the "License");
 *  you may not use this file except in compliance with the License.
 *  You may obtain a copy of the License at
 *
 *      http://www.apache.org/licenses/LICENSE-2.0
 *
 *  Unless required by applicable law or agreed to in writing, software
 *  distributed under the License is distributed on an "AS IS" BASIS,
 *  WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 *  See the License for the specific language governing permissions and
 *  limitations under the License.
 */
|
||
|
|
||
|
#pragma once
|
||
|
|
||
|
#include <thrust/detail/config.h>
|
||
|
#include <thrust/iterator/iterator_traits.h>
|
||
|
#include <thrust/functional.h>
|
||
|
#include <thrust/system/cuda/detail/block/inclusive_scan.h>
|
||
|
|
||
|
namespace thrust
|
||
|
{
|
||
|
namespace system
|
||
|
{
|
||
|
namespace cuda
|
||
|
{
|
||
|
namespace detail
|
||
|
{
|
||
|
namespace block
|
||
|
{
|
||
|
|
||
|
|
||
|
// In-place exclusive scan over the range starting at first, built from an
// inclusive scan followed by a one-slot shift to the right.
//
// Parameters:
//   ctx   - execution context; supplies thread_index(), block_dimension()
//           and barrier().
//   first - random-access iterator to the data being scanned. The slots
//           first[0] .. first[ctx.block_dimension() - 1] are read and
//           overwritten, so the range must hold at least that many elements.
//   init  - value stored into first[0] by the thread whose index is 0.
//   op    - binary operator forwarded to block::inplace_inclusive_scan.
//
// Returns the value that first[ctx.block_dimension() - 1] held right after
// the inclusive scan, i.e. before the shift (presumably the scan total for
// the whole range; that depends on block::inplace_inclusive_scan, which is
// defined in another header).
//
// Every calling thread executes three ctx.barrier() calls unconditionally.
//
// NOTE(review): init is written to slot 0 as-is and is never combined with
// the remaining outputs through op, so the result only matches a
// conventional "exclusive scan with initial value" when init behaves as an
// identity for op -- confirm that callers rely on this.
template<typename Context, typename RandomAccessIterator, typename T, typename BinaryFunction>
inline __device__
typename thrust::iterator_value<RandomAccessIterator>::type
inplace_exclusive_scan(Context &ctx, RandomAccessIterator first, T init, BinaryFunction op)
{
  typedef typename thrust::iterator_value<RandomAccessIterator>::type value_type;

  // phase 1: inclusive scan, in place
  block::inplace_inclusive_scan(ctx, first, op);

  // remember the last slot's inclusive result before the shift overwrites it
  value_type last_inclusive = first[ctx.block_dimension() - 1];

  ctx.barrier();

  // phase 2: fetch the left neighbour's inclusive result; the thread with
  // index 0 has no left neighbour and takes init instead
  value_type shifted_value =
    (ctx.thread_index() == 0)
      ? init
      : first[ctx.thread_index() - 1];

  // all neighbour reads are issued before this point and all overwrites
  // after it (assuming ctx.barrier() synchronizes every participating thread)
  ctx.barrier();

  // phase 3: store the shifted value into this thread's own slot
  first[ctx.thread_index()] = shifted_value;

  ctx.barrier();

  return last_inclusive;
}
|
||
|
|
||
|
|
||
|
// Convenience overload of inplace_exclusive_scan that uses addition as the
// binary operator: it forwards ctx, first and init to the four-argument
// overload together with a default-constructed thrust::plus over the
// iterator's value type, and returns whatever that overload returns.
template<typename Context, typename Iterator, typename T>
inline __device__
typename thrust::iterator_value<Iterator>::type
inplace_exclusive_scan(Context &ctx, Iterator first, T init)
{
  typedef typename thrust::iterator_value<Iterator>::type value_type;

  // addition functor specialised for the element type of the range
  thrust::plus<value_type> add_op = thrust::plus<value_type>();

  return block::inplace_exclusive_scan(ctx, first, init, add_op);
}
|
||
|
|
||
|
|
||
|
} // end namespace block
|
||
|
} // end namespace detail
|
||
|
} // end namespace cuda
|
||
|
} // end namespace system
|
||
|
} // end namespace thrust
|
||
|
|