/******************************************************************************
 * Copyright (c) 2016, NVIDIA CORPORATION.  All rights reserved.
 * Modifications Copyright© 2019 Advanced Micro Devices, Inc. All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions are met:
 *     * Redistributions of source code must retain the above copyright
 *       notice, this list of conditions and the following disclaimer.
 *     * Redistributions in binary form must reproduce the above copyright
 *       notice, this list of conditions and the following disclaimer in the
 *       documentation and/or other materials provided with the distribution.
 *     * Neither the name of the NVIDIA CORPORATION nor the
 *       names of its contributors may be used to endorse or promote products
 *       derived from this software without specific prior written permission.
 *
 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
 * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 * ARE DISCLAIMED. IN NO EVENT SHALL NVIDIA CORPORATION BE LIABLE FOR ANY
 * DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
 * (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
 * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND
 * ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
 * SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 *
 ******************************************************************************/
#pragma once

#if THRUST_DEVICE_COMPILER == THRUST_DEVICE_COMPILER_HCC
#include <iterator>
#include <thrust/distance.h>
#include <thrust/system/hip/detail/scan.h>

// rocprim include
#include <rocprim/rocprim.hpp>
#include <thrust/detail/alignment.h>
#include <thrust/detail/cstdint.h>

BEGIN_NS_THRUST

namespace hip_rocprim
{

// Inclusive scan over the range [first, last) in which every input element is
// first passed through transform_op and the transformed values are then
// combined with scan_op.
//
// The transformation is not materialized in this function: `first` is wrapped
// in a transform_input_iterator_t together with transform_op, and that iterator
// is handed to hip_rocprim::inclusive_scan_n along with the element count.
//
// policy       - execution policy, forwarded unchanged to inclusive_scan_n
// first, last  - input range; its length is obtained with thrust::distance
// result       - output iterator forwarded to inclusive_scan_n
// transform_op - unary operation bound into the transforming input iterator
// scan_op      - binary operation forwarded to inclusive_scan_n
//
// Returns the value produced by hip_rocprim::inclusive_scan_n
// (presumably the end of the written output range - confirm against scan.h).
template <class Derived, class InputIt, class OutputIt, class TransformOp, class ScanOp>
OutputIt THRUST_HIP_FUNCTION
transform_inclusive_scan(execution_policy<Derived>& policy,
                         InputIt                    first,
                         InputIt                    last,
                         OutputIt                   result,
                         TransformOp                transform_op,
                         ScanOp                     scan_op)
{
    // the pseudocode for deducing the type of the temporary used below:
    //
    // if UnaryFunction is AdaptableUnaryFunction
    //   TemporaryType = AdaptableUnaryFunction::result_type
    // else if OutputIterator is a "pure" output iterator
    //   TemporaryType = InputIterator::value_type
    // else
    //   TemporaryType = OutputIterator::value_type
    //
    // XXX upon c++0x, TemporaryType needs to be:
    // result_of_adaptable_function<UnaryFunction>::type

    // The helpers are spelled with an explicit thrust:: prefix (exactly as in
    // transform_exclusive_scan) so that lookup cannot be captured by some other
    // namespace called `detail` that is visible from inside hip_rocprim.
    typedef typename thrust::detail::eval_if<
            thrust::detail::has_result_type<TransformOp>::value,
            thrust::detail::result_type<TransformOp>,
            thrust::detail::eval_if<thrust::detail::is_output_iterator<OutputIt>::value,
                                    thrust::iterator_value<InputIt>,
                                    thrust::iterator_value<OutputIt>>>::type result_type;

    // Number of elements to scan, expressed in the input iterator's difference type.
    typedef typename iterator_traits<InputIt>::difference_type size_type;
    size_type num_items = static_cast<size_type>(thrust::distance(first, last));

    // Iterator adaptor pairing the input iterator with transform_op; result_type
    // is the value type selected above.
    typedef transform_input_iterator_t<result_type, InputIt, TransformOp>
        transformed_iterator_t;

    return hip_rocprim::inclusive_scan_n(
        policy, transformed_iterator_t(first, transform_op), num_items, result, scan_op
    );
}

// Exclusive scan over [first, last) seeded with `init`: each input element is
// routed through transform_op by a transforming input iterator, and the actual
// scan is delegated to hip_rocprim::exclusive_scan_n using scan_op.
template <class Derived,
          class InputIt,
          class OutputIt,
          class TransformOp,
          class T,
          class ScanOp>
OutputIt THRUST_HIP_FUNCTION
transform_exclusive_scan(execution_policy<Derived>& policy,
                         InputIt                    first,
                         InputIt                    last,
                         OutputIt                   result,
                         TransformOp                transform_op,
                         T                          init,
                         ScanOp                     scan_op)
{
    // Selection of the intermediate value type, in order of preference:
    //
    //   1. TransformOp::result_type, when the functor exposes one;
    //   2. the input iterator's value type, when OutputIt is a "pure"
    //      output iterator;
    //   3. the output iterator's value type otherwise.
    //
    // XXX upon c++0x, this should become
    // result_of_adaptable_function<UnaryFunction>::type

    // Steps 2 and 3: only evaluated (via ::type) if step 1 does not apply.
    using iterator_based_value = thrust::detail::eval_if<
        thrust::detail::is_output_iterator<OutputIt>::value,
        thrust::iterator_value<InputIt>,
        thrust::iterator_value<OutputIt>>;

    // Step 1, falling back to the iterator-based choice.
    using intermediate_t = typename thrust::detail::eval_if<
        thrust::detail::has_result_type<TransformOp>::value,
        thrust::detail::result_type<TransformOp>,
        iterator_based_value>::type;

    using count_t = typename iterator_traits<InputIt>::difference_type;
    using transforming_input_t
        = transform_input_iterator_t<intermediate_t, InputIt, TransformOp>;

    // Length of the input range in the iterator's own difference type.
    count_t item_count = static_cast<count_t>(thrust::distance(first, last));

    return hip_rocprim::exclusive_scan_n(policy,
                                         transforming_input_t(first, transform_op),
                                         item_count,
                                         result,
                                         init,
                                         scan_op);
}

} // namespace hip_rocprim

END_NS_THRUST
#endif
