123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362 |
- //---------------------------------------------------------------------------//
- // Copyright (c) 2013 Kyle Lutz <kyle.r.lutz@gmail.com>
- //
- // Distributed under the Boost Software License, Version 1.0
- // See accompanying file LICENSE_1_0.txt or copy at
- // http://www.boost.org/LICENSE_1_0.txt
- //
- // See http://boostorg.github.com/compute for more information.
- //---------------------------------------------------------------------------//
- #ifndef BOOST_COMPUTE_ALGORITHM_COPY_HPP
- #define BOOST_COMPUTE_ALGORITHM_COPY_HPP
- #include <algorithm>
- #include <iterator>
- #include <boost/utility/enable_if.hpp>
- #include <boost/mpl/and.hpp>
- #include <boost/mpl/not.hpp>
- #include <boost/compute/buffer.hpp>
- #include <boost/compute/system.hpp>
- #include <boost/compute/command_queue.hpp>
- #include <boost/compute/algorithm/detail/copy_on_device.hpp>
- #include <boost/compute/algorithm/detail/copy_to_device.hpp>
- #include <boost/compute/algorithm/detail/copy_to_host.hpp>
- #include <boost/compute/async/future.hpp>
- #include <boost/compute/detail/is_contiguous_iterator.hpp>
- #include <boost/compute/detail/iterator_range_size.hpp>
- #include <boost/compute/iterator/buffer_iterator.hpp>
- #include <boost/compute/type_traits/is_device_iterator.hpp>
- namespace boost {
- namespace compute {
- namespace detail {
- namespace mpl = boost::mpl;
- // meta-function returning true if copy() between InputIterator and
- // OutputIterator can be implemented with clEnqueueCopyBuffer().
- template<class InputIterator, class OutputIterator>
- struct can_copy_with_copy_buffer :
- mpl::and_<
- boost::is_same<
- InputIterator,
- buffer_iterator<typename InputIterator::value_type>
- >,
- boost::is_same<
- OutputIterator,
- buffer_iterator<typename OutputIterator::value_type>
- >,
- boost::is_same<
- typename InputIterator::value_type,
- typename OutputIterator::value_type
- >
- >::type {};
- // host -> device
- template<class InputIterator, class OutputIterator>
- inline OutputIterator
- dispatch_copy(InputIterator first,
- InputIterator last,
- OutputIterator result,
- command_queue &queue,
- typename boost::enable_if_c<
- !is_device_iterator<InputIterator>::value &&
- is_device_iterator<OutputIterator>::value
- >::type* = 0)
- {
- if(is_contiguous_iterator<InputIterator>::value){
- return copy_to_device(first, last, result, queue);
- }
- else {
- // for non-contiguous input we first copy the values to
- // a temporary std::vector and then copy from there
- typedef typename std::iterator_traits<InputIterator>::value_type T;
- std::vector<T> vector(first, last);
- return copy_to_device(vector.begin(), vector.end(), result, queue);
- }
- }
- // host -> device (async)
- template<class InputIterator, class OutputIterator>
- inline future<OutputIterator>
- dispatch_copy_async(InputIterator first,
- InputIterator last,
- OutputIterator result,
- command_queue &queue,
- typename boost::enable_if_c<
- !is_device_iterator<InputIterator>::value &&
- is_device_iterator<OutputIterator>::value
- >::type* = 0)
- {
- BOOST_STATIC_ASSERT_MSG(
- is_contiguous_iterator<InputIterator>::value,
- "copy_async() is only supported for contiguous host iterators"
- );
- return copy_to_device_async(first, last, result, queue);
- }
- // device -> host
- template<class InputIterator, class OutputIterator>
- inline OutputIterator
- dispatch_copy(InputIterator first,
- InputIterator last,
- OutputIterator result,
- command_queue &queue,
- typename boost::enable_if_c<
- is_device_iterator<InputIterator>::value &&
- !is_device_iterator<OutputIterator>::value
- >::type* = 0)
- {
- if(is_contiguous_iterator<OutputIterator>::value){
- return copy_to_host(first, last, result, queue);
- }
- else {
- // for non-contiguous input we first copy the values to
- // a temporary std::vector and then copy from there
- typedef typename std::iterator_traits<InputIterator>::value_type T;
- std::vector<T> vector(iterator_range_size(first, last));
- copy_to_host(first, last, vector.begin(), queue);
- return std::copy(vector.begin(), vector.end(), result);
- }
- }
- // device -> host (async)
- template<class InputIterator, class OutputIterator>
- inline future<OutputIterator>
- dispatch_copy_async(InputIterator first,
- InputIterator last,
- OutputIterator result,
- command_queue &queue,
- typename boost::enable_if_c<
- is_device_iterator<InputIterator>::value &&
- !is_device_iterator<OutputIterator>::value
- >::type* = 0)
- {
- BOOST_STATIC_ASSERT_MSG(
- is_contiguous_iterator<OutputIterator>::value,
- "copy_async() is only supported for contiguous host iterators"
- );
- return copy_to_host_async(first, last, result, queue);
- }
- // device -> device
- template<class InputIterator, class OutputIterator>
- inline OutputIterator
- dispatch_copy(InputIterator first,
- InputIterator last,
- OutputIterator result,
- command_queue &queue,
- typename boost::enable_if<
- mpl::and_<
- is_device_iterator<InputIterator>,
- is_device_iterator<OutputIterator>,
- mpl::not_<
- can_copy_with_copy_buffer<
- InputIterator, OutputIterator
- >
- >
- >
- >::type* = 0)
- {
- return copy_on_device(first, last, result, queue);
- }
- // device -> device (specialization for buffer iterators)
- template<class InputIterator, class OutputIterator>
- inline OutputIterator
- dispatch_copy(InputIterator first,
- InputIterator last,
- OutputIterator result,
- command_queue &queue,
- typename boost::enable_if<
- mpl::and_<
- is_device_iterator<InputIterator>,
- is_device_iterator<OutputIterator>,
- can_copy_with_copy_buffer<
- InputIterator, OutputIterator
- >
- >
- >::type* = 0)
- {
- typedef typename std::iterator_traits<InputIterator>::value_type value_type;
- typedef typename std::iterator_traits<InputIterator>::difference_type difference_type;
- difference_type n = std::distance(first, last);
- if(n < 1){
- // nothing to copy
- return result;
- }
- queue.enqueue_copy_buffer(first.get_buffer(),
- result.get_buffer(),
- first.get_index() * sizeof(value_type),
- result.get_index() * sizeof(value_type),
- static_cast<size_t>(n) * sizeof(value_type));
- return result + n;
- }
- // device -> device (async)
- template<class InputIterator, class OutputIterator>
- inline future<OutputIterator>
- dispatch_copy_async(InputIterator first,
- InputIterator last,
- OutputIterator result,
- command_queue &queue,
- typename boost::enable_if<
- mpl::and_<
- is_device_iterator<InputIterator>,
- is_device_iterator<OutputIterator>,
- mpl::not_<
- can_copy_with_copy_buffer<
- InputIterator, OutputIterator
- >
- >
- >
- >::type* = 0)
- {
- return copy_on_device_async(first, last, result, queue);
- }
- // device -> device (async, specialization for buffer iterators)
- template<class InputIterator, class OutputIterator>
- inline future<OutputIterator>
- dispatch_copy_async(InputIterator first,
- InputIterator last,
- OutputIterator result,
- command_queue &queue,
- typename boost::enable_if<
- mpl::and_<
- is_device_iterator<InputIterator>,
- is_device_iterator<OutputIterator>,
- can_copy_with_copy_buffer<
- InputIterator, OutputIterator
- >
- >
- >::type* = 0)
- {
- typedef typename std::iterator_traits<InputIterator>::value_type value_type;
- typedef typename std::iterator_traits<InputIterator>::difference_type difference_type;
- difference_type n = std::distance(first, last);
- if(n < 1){
- // nothing to copy
- return make_future(result, event());
- }
- event event_ =
- queue.enqueue_copy_buffer(
- first.get_buffer(),
- result.get_buffer(),
- first.get_index() * sizeof(value_type),
- result.get_index() * sizeof(value_type),
- static_cast<size_t>(n) * sizeof(value_type)
- );
- return make_future(result + n, event_);
- }
- // host -> host
- template<class InputIterator, class OutputIterator>
- inline OutputIterator
- dispatch_copy(InputIterator first,
- InputIterator last,
- OutputIterator result,
- command_queue &queue,
- typename boost::enable_if_c<
- !is_device_iterator<InputIterator>::value &&
- !is_device_iterator<OutputIterator>::value
- >::type* = 0)
- {
- (void) queue;
- return std::copy(first, last, result);
- }
- } // end detail namespace
- /// Copies the values in the range [\p first, \p last) to the range
- /// beginning at \p result.
- ///
- /// The generic copy() function can be used for a variety of data
- /// transfer tasks and provides a standard interface to the following
- /// OpenCL functions:
- ///
- /// \li \c clEnqueueReadBuffer()
- /// \li \c clEnqueueWriteBuffer()
- /// \li \c clEnqueueCopyBuffer()
- ///
- /// Unlike the aforementioned OpenCL functions, copy() will also work
- /// with non-contiguous data-structures (e.g. \c std::list<T>) as
- /// well as with "fancy" iterators (e.g. transform_iterator).
- ///
- /// \param first first element in the range to copy
- /// \param last last element in the range to copy
- /// \param result first element in the result range
- /// \param queue command queue to perform the operation
- ///
- /// \return \c OutputIterator to the end of the result range
- ///
- /// For example, to copy an array of \c int values on the host to a vector on
- /// the device:
- /// \code
- /// // array on the host
- /// int data[] = { 1, 2, 3, 4 };
- ///
- /// // vector on the device
- /// boost::compute::vector<int> vec(4, context);
- ///
- /// // copy values to the device vector
- /// boost::compute::copy(data, data + 4, vec.begin(), queue);
- /// \endcode
- ///
- /// The copy algorithm can also be used with standard containers such as
- /// \c std::vector<T>:
- /// \code
- /// std::vector<int> host_vector = ...
- /// boost::compute::vector<int> device_vector = ...
- ///
- /// // copy from the host to the device
- /// boost::compute::copy(
- /// host_vector.begin(), host_vector.end(), device_vector.begin(), queue
- /// );
- ///
- /// // copy from the device to the host
- /// boost::compute::copy(
- /// device_vector.begin(), device_vector.end(), host_vector.begin(), queue
- /// );
- /// \endcode
- ///
- /// \see copy_n(), copy_if(), copy_async()
- template<class InputIterator, class OutputIterator>
- inline OutputIterator copy(InputIterator first,
- InputIterator last,
- OutputIterator result,
- command_queue &queue = system::default_queue())
- {
- return detail::dispatch_copy(first, last, result, queue);
- }
- /// Copies the values in the range [\p first, \p last) to the range
- /// beginning at \p result. The copy is performed asynchronously.
- ///
- /// \see copy()
- template<class InputIterator, class OutputIterator>
- inline future<OutputIterator>
- copy_async(InputIterator first,
- InputIterator last,
- OutputIterator result,
- command_queue &queue = system::default_queue())
- {
- return detail::dispatch_copy_async(first, last, result, queue);
- }
- } // end compute namespace
- } // end boost namespace
- #endif // BOOST_COMPUTE_ALGORITHM_COPY_HPP
|