199 lines
5.9 KiB
C
199 lines
5.9 KiB
C
|
/*
|
||
|
* Copyright 2008-2012 NVIDIA Corporation
|
||
|
*
|
||
|
* Licensed under the Apache License, Version 2.0 (the "License");
|
||
|
* you may not use this file except in compliance with the License.
|
||
|
* You may obtain a copy of the License at
|
||
|
*
|
||
|
* http://www.apache.org/licenses/LICENSE-2.0
|
||
|
*
|
||
|
* Unless required by applicable law or agreed to in writing, software
|
||
|
* distributed under the License is distributed on an "AS IS" BASIS,
|
||
|
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||
|
* See the License for the specific language governing permissions and
|
||
|
* limitations under the License.
|
||
|
*/
|
||
|
|
||
|
#pragma once
|
||
|
|
||
|
#include <thrust/detail/config.h>
|
||
|
#include <thrust/system/cuda/detail/execution_policy.h>
|
||
|
#include <thrust/detail/raw_pointer_cast.h>
|
||
|
#include <thrust/detail/copy.h>
|
||
|
|
||
|
namespace thrust
|
||
|
{
|
||
|
namespace system
|
||
|
{
|
||
|
namespace cuda
|
||
|
{
|
||
|
namespace detail
|
||
|
{
|
||
|
|
||
|
|
||
|
// XXX WAR an issue with msvc 2005 (cl v14.00) which creates multiply-defined
|
||
|
// symbols resulting from assign_value
|
||
|
#if (THRUST_HOST_COMPILER == THRUST_HOST_COMPILER_MSVC) && (_MSC_VER <= 1400)
|
||
|
|
||
|
namespace
|
||
|
{
|
||
|
|
||
|
template<typename DerivedPolicy, typename Pointer1, typename Pointer2>
|
||
|
inline __host__ __device__
|
||
|
void assign_value_msvc2005_war(thrust::cuda::execution_policy<DerivedPolicy> &exec, Pointer1 dst, Pointer2 src)
|
||
|
{
|
||
|
// XXX war nvbugs/881631
|
||
|
struct war_nvbugs_881631
|
||
|
{
|
||
|
__host__ inline static void host_path(thrust::cuda::execution_policy<DerivedPolicy> &exec, Pointer1 dst, Pointer2 src)
|
||
|
{
|
||
|
thrust::copy(exec, src, src + 1, dst);
|
||
|
}
|
||
|
|
||
|
__device__ inline static void device_path(thrust::cuda::execution_policy<DerivedPolicy> &, Pointer1 dst, Pointer2 src)
|
||
|
{
|
||
|
*thrust::raw_pointer_cast(dst) = *thrust::raw_pointer_cast(src);
|
||
|
}
|
||
|
};
|
||
|
|
||
|
#ifndef __CUDA_ARCH__
|
||
|
war_nvbugs_881631::host_path(exec,dst,src);
|
||
|
#else
|
||
|
war_nvbugs_881631::device_path(exec,dst,src);
|
||
|
#endif // __CUDA_ARCH__
|
||
|
} // end assign_value_msvc2005_war()
|
||
|
|
||
|
} // end anon namespace
|
||
|
|
||
|
template<typename DerivedPolicy, typename Pointer1, typename Pointer2>
|
||
|
inline __host__ __device__
|
||
|
void assign_value(thrust::cuda::execution_policy<DerivedPolicy> &exec, Pointer1 dst, Pointer2 src)
|
||
|
{
|
||
|
return assign_value_msvc2005_war(exec,dst,src);
|
||
|
} // end assign_value()
|
||
|
|
||
|
#else
|
||
|
|
||
|
template<typename DerivedPolicy, typename Pointer1, typename Pointer2>
|
||
|
inline __host__ __device__
|
||
|
void assign_value(thrust::cuda::execution_policy<DerivedPolicy> &exec, Pointer1 dst, Pointer2 src)
|
||
|
{
|
||
|
// XXX war nvbugs/881631
|
||
|
struct war_nvbugs_881631
|
||
|
{
|
||
|
__host__ inline static void host_path(thrust::cuda::execution_policy<DerivedPolicy> &exec, Pointer1 dst, Pointer2 src)
|
||
|
{
|
||
|
thrust::copy(exec, src, src + 1, dst);
|
||
|
}
|
||
|
|
||
|
__device__ inline static void device_path(thrust::cuda::execution_policy<DerivedPolicy> &, Pointer1 dst, Pointer2 src)
|
||
|
{
|
||
|
*thrust::raw_pointer_cast(dst) = *thrust::raw_pointer_cast(src);
|
||
|
}
|
||
|
};
|
||
|
|
||
|
#ifndef __CUDA_ARCH__
|
||
|
war_nvbugs_881631::host_path(exec,dst,src);
|
||
|
#else
|
||
|
war_nvbugs_881631::device_path(exec,dst,src);
|
||
|
#endif // __CUDA_ARCH__
|
||
|
} // end assign_value()
|
||
|
|
||
|
#endif // msvc 2005 WAR
|
||
|
|
||
|
|
||
|
// XXX WAR an issue with msvc 2005 (cl v14.00) which creates multiply-defined
|
||
|
// symbols resulting from assign_value
|
||
|
#if (THRUST_HOST_COMPILER == THRUST_HOST_COMPILER_MSVC) && (_MSC_VER <= 1400)
|
||
|
|
||
|
namespace
|
||
|
{
|
||
|
|
||
|
|
||
|
template<typename System1, typename System2, typename Pointer1, typename Pointer2>
|
||
|
inline __host__ __device__
|
||
|
void assign_value_msvc2005_war(cross_system<System1,System2> &systems, Pointer1 dst, Pointer2 src)
|
||
|
{
|
||
|
// XXX war nvbugs/881631
|
||
|
struct war_nvbugs_881631
|
||
|
{
|
||
|
__host__ inline static void host_path(cross_system<System1,System2> &systems, Pointer1 dst, Pointer2 src)
|
||
|
{
|
||
|
// rotate the systems so that they are ordered the same as (src, dst)
|
||
|
// for the call to thrust::copy
|
||
|
cross_system<System2,System1> rotated_systems = systems.rotate();
|
||
|
thrust::copy(rotated_systems, src, src + 1, dst);
|
||
|
}
|
||
|
|
||
|
__device__ inline static void device_path(cross_system<System1,System2> &systems, Pointer1 dst, Pointer2 src)
|
||
|
{
|
||
|
// XXX forward the true cuda::execution_policy inside systems here
|
||
|
// instead of materializing a tag
|
||
|
thrust::cuda::tag cuda_tag;
|
||
|
thrust::system::cuda::detail::assign_value(cuda_tag, dst, src);
|
||
|
}
|
||
|
};
|
||
|
|
||
|
#if __CUDA_ARCH__
|
||
|
war_nvbugs_881631::device_path(systems,dst,src);
|
||
|
#else
|
||
|
war_nvbugs_881631::host_path(systems,dst,src);
|
||
|
#endif
|
||
|
} // end assign_value_msvc2005_war
|
||
|
|
||
|
|
||
|
} // end anon namespace
|
||
|
|
||
|
|
||
|
template<typename System1, typename System2, typename Pointer1, typename Pointer2>
|
||
|
inline __host__ __device__
|
||
|
void assign_value(cross_system<System1,System2> &systems, Pointer1 dst, Pointer2 src)
|
||
|
{
|
||
|
return assign_value_msvc2005_war(systems,dst,src);
|
||
|
} // end assign_value()
|
||
|
|
||
|
|
||
|
#else
|
||
|
|
||
|
|
||
|
template<typename System1, typename System2, typename Pointer1, typename Pointer2>
|
||
|
inline __host__ __device__
|
||
|
void assign_value(cross_system<System1,System2> &systems, Pointer1 dst, Pointer2 src)
|
||
|
{
|
||
|
// XXX war nvbugs/881631
|
||
|
struct war_nvbugs_881631
|
||
|
{
|
||
|
__host__ inline static void host_path(cross_system<System1,System2> &systems, Pointer1 dst, Pointer2 src)
|
||
|
{
|
||
|
// rotate the systems so that they are ordered the same as (src, dst)
|
||
|
// for the call to thrust::copy
|
||
|
cross_system<System2,System1> rotated_systems = systems.rotate();
|
||
|
thrust::copy(rotated_systems, src, src + 1, dst);
|
||
|
}
|
||
|
|
||
|
__device__ inline static void device_path(cross_system<System1,System2> &systems, Pointer1 dst, Pointer2 src)
|
||
|
{
|
||
|
// XXX forward the true cuda::execution_policy inside systems here
|
||
|
// instead of materializing a tag
|
||
|
thrust::cuda::tag cuda_tag;
|
||
|
thrust::system::cuda::detail::assign_value(cuda_tag, dst, src);
|
||
|
}
|
||
|
};
|
||
|
|
||
|
#if __CUDA_ARCH__
|
||
|
war_nvbugs_881631::device_path(systems,dst,src);
|
||
|
#else
|
||
|
war_nvbugs_881631::host_path(systems,dst,src);
|
||
|
#endif
|
||
|
} // end assign_value()
|
||
|
|
||
|
|
||
|
#endif // msvc 2005 WAR
|
||
|
|
||
|
|
||
|
} // end detail
|
||
|
} // end cuda
|
||
|
} // end system
|
||
|
} // end thrust
|
||
|
|