amp.h
1 /***
2 * ==++==
3 *
4 * Copyright (c) Microsoft Corporation. All rights reserved.
5 *
6 * ==--==
7 * =+=+=+=+=+=+=+=+=+=+=+=+=+=+=+=+=+=+=+=+=+=+=+=+=+=+=+=+=+=+=+=+=+=+=+=+=+=+=+=+=+=+=+=+=+=+=+=+=+=+=+=+=+=+=+=+=+=+=+
8 *
9 * amp.h
10 *
11 * C++ AMP Library
12 *
13 * =-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-
14 ****/
15 
16 #pragma once
17 
18 #include <crtdbg.h>
19 #include <vector>
20 #include <iterator>
21 #include <future>
22 
23 #include <amprt.h>
24 #include <xxamp.h>
25 #include <type_traits>
26 
27 #define _AMP_H
28 
29 #pragma pack(push,8)
30 
31 
32 namespace Concurrency
33 {
34 
53 template <int _Rank> class index
54 {
55 public:
57 
58  template <typename _Value_type, int _Rank>
59  friend class array;
60 
61  template <int _Rank, int _Element_size>
62  friend class details::_Array_view_shape;
63 
64  template <int _Rank, int _Element_size>
65  friend class details::_Array_view_base;
66 
67  static const int rank = _Rank;
68  typedef int value_type;
69 
73  index() __GPU
74  {
76  }
77 
84  index(const index<_Rank>& _Other) __GPU
85  {
87  }
88 
95  explicit index(int _I) __GPU
96  {
97  static_assert(_Rank == 1, "This constructor can only be used to construct an index<1> object.");
98  _M_base[0] = _I;
99  }
100 
110  index(int _I0, int _I1) __GPU
111  {
112  static_assert(_Rank == 2, "This constructor can only be used to construct an index<2> object.");
113  _M_base[0] = _I0;
114  _M_base[1] = _I1;
115  }
116 
129  index(int _I0, int _I1, int _I2) __GPU
130  {
131  static_assert(_Rank == 3, "This constructor can only be used to construct an index<3> object.");
132  _M_base[0] = _I0;
133  _M_base[1] = _I1;
134  _M_base[2] = _I2;
135  }
136 
145  explicit index(const int _Array[_Rank]) __GPU
146  {
148  }
149 
153  index<_Rank>& operator=(const index<_Rank>& _Other) __GPU
154  {
156  return *this;
157  }
158 
168  int operator[] (unsigned _Index) const __GPU
169  {
170  return _M_base[_Index];
171  }
172 
182  int& operator[] (unsigned _Index) __GPU
183  {
184  return _M_base[_Index];
185  }
186 
187  // Operations
188 
198  index<_Rank>& operator+=(const index<_Rank>& _Rhs) __GPU
199  {
201  return *this;
202  }
203 
213  index<_Rank>& operator-=(const index<_Rank>& _Rhs) __GPU
214  {
216  return *this;
217  }
218 
228  index<_Rank>& operator+=(int _Rhs) __GPU
229  {
231  return *this;
232  }
233 
243  index<_Rank>& operator-=(int _Rhs) __GPU
244  {
246  return *this;
247  }
248 
258  index<_Rank>& operator*=(int _Rhs) __GPU
259  {
261  return *this;
262  }
263 
273  index<_Rank>& operator/=(int _Rhs) __GPU
274  {
276  return *this;
277  }
278 
288  index<_Rank>& operator%=(int _Rhs) __GPU
289  {
291  return *this;
292  }
293 
300  index<_Rank>& operator++() __GPU
301  {
303  return *this;
304  }
305 
312  index<_Rank> operator++(int) __GPU
313  {
314  index<_Rank> old_Index(*this);
316  return old_Index;
317  }
318 
325  index<_Rank>& operator--() __GPU
326  {
328  return *this;
329  }
330 
337  index<_Rank> operator--(int) __GPU
338  {
339  index<_Rank> old_Index(*this);
341  return old_Index;
342  }
343 
344 private:
345  template<class _Tuple_type>
346  friend
347  _Tuple_type details::_Create_uninitialized_tuple() __GPU;
348 
356  //
357  // implementation details - end
358 
359  int _M_base[_Rank];
360 };
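Usage sketch (illustrative, not part of amp.h): an index<N> is an N-dimensional coordinate used to address elements of arrays and array_views; operator[] accesses one component and the compound operators work component-wise.

    #include <amp.h>
    #include <iostream>

    int main() {
        concurrency::index<2> i(2, 5);   // rank-2 coordinate: row 2, column 5
        concurrency::index<2> j(i);      // copy construction
        j[0] = 4;                        // write one component: j is now (4, 5)
        j += i;                          // component-wise: j is now (6, 10)
        std::cout << j[0] << "," << j[1] << std::endl;  // prints 6,10
    }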
361 
362 
383 template <int _Rank> class extent
384 {
385 public:
387 
388  template <typename _Value_type, int _Rank>
389  friend class array;
390 
391  template <int _Rank, int _Element_size>
392  friend class details::_Array_view_shape;
393 
394  template <int _Rank, int _Element_size>
395  friend class details::_Array_view_base;
396 
397  static const int rank = _Rank;
398  typedef int value_type;
399 
400 
404  extent() __GPU
405  {
407  }
408 
415  extent(const extent<_Rank>& _Other) __GPU
416  {
418  }
419 
426  explicit extent(int _I) __GPU
427  {
428  static_assert(_Rank == 1, "This constructor can only be used to construct an extent<1> object.");
429  _M_base[0] = _I;
430  }
431 
441  extent(int _I0, int _I1) __GPU
442  {
443  static_assert(_Rank == 2, "This constructor can only be used to construct an extent<2> object.");
444  _M_base[0] = _I0;
445  _M_base[1] = _I1;
446  }
447 
460  extent(int _I0, int _I1, int _I2) __GPU
461  {
462  static_assert(_Rank == 3, "This constructor can only be used to construct an extent<3> object.");
463  _M_base[0] = _I0;
464  _M_base[1] = _I1;
465  _M_base[2] = _I2;
466  }
467 
476  explicit extent(const int _Array[_Rank]) __GPU
477  {
479  }
480 
484  extent<_Rank>& operator=(const extent<_Rank>& _Other) __GPU
485  {
487  return *this;
488  }
489 
499  int operator[] (unsigned int _Index) const __GPU
500  {
501  return _M_base[_Index];
502  }
503 
513  int& operator[] (unsigned int _Index) __GPU
514  {
515  return _M_base[_Index];
516  }
517 
521  unsigned int size() const __GPU
522  {
523  return static_cast<unsigned int>(_product_helper<extent<_Rank>>::func(_M_base));
524  }
525 
529  bool contains(const index<rank>& _Index) const __GPU
530  {
531  return details::_contains<extent<rank>, index<rank>, rank>::func(*this, _Index);
532  }
533 
537  template <int _Dim0> tiled_extent<_Dim0> tile() const __GPU
538  {
539  static_assert(rank == 1, "One-dimensional tile() method only available on extent<1>");
540  static_assert(_Dim0>0, "All tile dimensions must be positive");
541 
542  return tiled_extent<_Dim0>(*this);
543  }
544 
548  template <int _Dim0, int _Dim1> tiled_extent<_Dim0, _Dim1> tile() const __GPU
549  {
550  static_assert(rank == 2, "Two-dimensional tile() method only available on extent<2>");
551  static_assert(_Dim0>0 && _Dim1>0, "All tile dimensions must be positive");
552 
553  return tiled_extent<_Dim0, _Dim1>(*this);
554  }
555 
559  template <int _Dim0, int _Dim1, int _Dim2> tiled_extent<_Dim0, _Dim1, _Dim2> tile() const __GPU
560  {
561  static_assert(rank == 3, "Three-dimensional tile() method only available on extent<3>");
562  static_assert(_Dim0>0 && _Dim1>0 && _Dim2>0, "All tile dimensions must be positive");
563 
564  return tiled_extent<_Dim0, _Dim1, _Dim2>(*this);
565  }
566 
567  // Operations
568 
578  extent<_Rank> operator+(const index<_Rank>& _Rhs) __GPU
579  {
580  extent<_Rank> new_extent = details::_Create_uninitialized_tuple<extent<_Rank>>();
581  details::_arithmetic_op_loop_helper<extent<_Rank>, details::opAdd>::func(new_extent, *this, _Rhs);
582  return new_extent;
583  }
584 
594  extent<_Rank> operator-(const index<_Rank>& _Rhs) __GPU
595  {
596  extent<_Rank> new_extent = details::_Create_uninitialized_tuple<extent<_Rank>>();
597  details::_arithmetic_op_loop_helper<extent<_Rank>, details::opSub>::func(new_extent, *this, _Rhs);
598  return new_extent;
599  }
600 
610  extent<_Rank>& operator+=(const extent<_Rank>& _Rhs) __GPU
611  {
613  return *this;
614  }
615 
625  extent<_Rank>& operator-=(const extent<_Rank>& _Rhs) __GPU
626  {
628  return *this;
629  }
630 
640  extent<_Rank>& operator+=(const index<_Rank>& _Rhs) __GPU
641  {
643  return *this;
644  }
645 
655  extent<_Rank>& operator-=(const index<_Rank>& _Rhs) __GPU
656  {
658  return *this;
659  }
660 
670  extent<_Rank>& operator+=(int _Rhs) __GPU
671  {
673  return *this;
674  }
675 
685  extent<_Rank>& operator-=(int _Rhs) __GPU
686  {
688  return *this;
689  }
690 
700  extent<_Rank>& operator*=(int _Rhs) __GPU
701  {
703  return *this;
704  }
705 
715  extent<_Rank>& operator/=(int _Rhs) __GPU
716  {
718  return *this;
719  }
720 
730  extent<_Rank>& operator%=(int _Rhs) __GPU
731  {
733  return *this;
734  }
735 
742  extent<_Rank>& operator++() __GPU
743  {
745  return *this;
746  }
747 
754  extent<_Rank> operator++(int) __GPU
755  {
756  extent<_Rank> old_extent(*this);
758  return old_extent;
759  }
760 
767  extent<_Rank>& operator--() __GPU
768  {
770  return *this;
771  }
772 
779  extent<_Rank> operator--(int) __GPU
780  {
781  extent<_Rank> old_extent(*this);
783  return old_extent;
784  }
785 
786  // implementation details (compiler helpers) - begin
787 
788  // Index mapping for simple zero-based extent domain.
789  index<_Rank> _map_index(const index<_Rank>& _Index) const __GPU {
790  return _Index;
791  }
792 
793 private:
794  template<class _Tuple_type>
795  friend
796  _Tuple_type details::_Create_uninitialized_tuple() __GPU;
804 
805  // the store
806  int _M_base[_Rank];
807 };
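Usage sketch (illustrative, not part of amp.h): an extent<N> describes the shape of an N-dimensional domain; size() is the product of the dimensions, contains() is a bounds test, and tile<...>() produces the tiled_extent consumed by a tiled parallel_for_each (see the tiled_extent classes later in this file).

    #include <amp.h>
    #include <cassert>

    int main() {
        concurrency::extent<2> e(4, 6);
        assert(e.size() == 24);                               // 4 * 6 elements
        assert(e.contains(concurrency::index<2>(3, 5)));      // in range
        assert(!e.contains(concurrency::index<2>(4, 0)));     // dimension 0 out of range
        concurrency::tiled_extent<2, 3> te = e.tile<2, 3>();  // carve into 2x3 tiles
        (void)te;
    }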
808 
809 namespace details
810 {
811  template <typename T> struct _Is_extent_or_index : std::false_type { };
812 
813  template <int N>
814  struct _Is_extent_or_index<index<N>> : std::true_type { };
815 
816  template <int N>
817  struct _Is_extent_or_index<extent<N>> : std::true_type { };
818 }
819 
820 template <int _Rank, template <int> class _Tuple_type>
821 typename std::enable_if<details::_Is_extent_or_index<_Tuple_type<_Rank>>::value, bool>::type
822 operator==(const _Tuple_type<_Rank>& _Lhs, const _Tuple_type<_Rank>& _Rhs) __GPU
823 {
825 }
826 
827 template <int _Rank, template <int> class _Tuple_type>
828 typename std::enable_if<details::_Is_extent_or_index<_Tuple_type<_Rank>>::value, bool>::type
829 operator!=(const _Tuple_type<_Rank>& _Lhs, const _Tuple_type<_Rank>& _Rhs) __GPU
830 {
831  return !(_Lhs == _Rhs);
832 }
833 
834 template <int _Rank, template <int> class _Tuple_type>
835 typename std::enable_if<details::_Is_extent_or_index<_Tuple_type<_Rank>>::value, _Tuple_type<_Rank>>::type
836 operator+(const _Tuple_type<_Rank>& _Lhs, const _Tuple_type<_Rank>& _Rhs) __GPU
837 {
838  _Tuple_type<_Rank> new_Tuple = details::_Create_uninitialized_tuple<_Tuple_type<_Rank>>();
839  details::_arithmetic_op_loop_helper<_Tuple_type<_Rank>, opAdd>::func(new_Tuple, _Lhs, _Rhs);
840  return new_Tuple;
841 }
842 
843 template <int _Rank, template <int> class _Tuple_type>
844 typename std::enable_if<details::_Is_extent_or_index<_Tuple_type<_Rank>>::value, _Tuple_type<_Rank>>::type
845 operator-(const _Tuple_type<_Rank>& _Lhs, const _Tuple_type<_Rank>& _Rhs) __GPU
846 {
847  _Tuple_type<_Rank> new_Tuple = details::_Create_uninitialized_tuple<_Tuple_type<_Rank>>();
848  details::_arithmetic_op_loop_helper<_Tuple_type<_Rank>, opSub>::func(new_Tuple, _Lhs, _Rhs);
849  return new_Tuple;
850 }
851 
852 template <int _Rank, template <int> class _Tuple_type>
853 typename std::enable_if<details::_Is_extent_or_index<_Tuple_type<_Rank>>::value, _Tuple_type<_Rank>>::type
854 operator+(const _Tuple_type<_Rank>& _Lhs, typename _Tuple_type<_Rank>::value_type _Rhs) __GPU
855 {
856  _Tuple_type<_Rank> new_Tuple = details::_Create_uninitialized_tuple<_Tuple_type<_Rank>>();
857  details::_arithmetic_op_loop_helper<_Tuple_type<_Rank>, opAdd>::func(new_Tuple, _Lhs, _Rhs);
858  return new_Tuple;
859 }
860 
861 template <int _Rank, template <int> class _Tuple_type>
862 typename std::enable_if<details::_Is_extent_or_index<_Tuple_type<_Rank>>::value, _Tuple_type<_Rank>>::type
863 operator+(typename _Tuple_type<_Rank>::value_type _Lhs, const _Tuple_type<_Rank>& _Rhs) __GPU
864 {
865  _Tuple_type<_Rank> new_Tuple = details::_Create_uninitialized_tuple<_Tuple_type<_Rank>>();
866  details::_arithmetic_op_loop_helper<_Tuple_type<_Rank>, opAdd>::func(new_Tuple, _Lhs, _Rhs);
867  return new_Tuple;
868 }
869 
870 template <int _Rank, template <int> class _Tuple_type>
871 typename std::enable_if<details::_Is_extent_or_index<_Tuple_type<_Rank>>::value, _Tuple_type<_Rank>>::type
872 operator-(const _Tuple_type<_Rank>& _Lhs, typename _Tuple_type<_Rank>::value_type _Rhs) __GPU
873 {
874  _Tuple_type<_Rank> new_Tuple = details::_Create_uninitialized_tuple<_Tuple_type<_Rank>>();
875  details::_arithmetic_op_loop_helper<_Tuple_type<_Rank>, opSub>::func(new_Tuple, _Lhs, _Rhs);
876  return new_Tuple;
877 }
878 
879 template <int _Rank, template <int> class _Tuple_type>
880 typename std::enable_if<details::_Is_extent_or_index<_Tuple_type<_Rank>>::value, _Tuple_type<_Rank>>::type
881 operator-(typename _Tuple_type<_Rank>::value_type _Lhs, const _Tuple_type<_Rank>& _Rhs) __GPU
882 {
883  _Tuple_type<_Rank> new_Tuple = details::_Create_uninitialized_tuple<_Tuple_type<_Rank>>();
884  details::_arithmetic_op_loop_helper<_Tuple_type<_Rank>, opSub>::func(new_Tuple, _Lhs, _Rhs);
885  return new_Tuple;
886 }
887 
888 template <int _Rank, template <int> class _Tuple_type>
889 typename std::enable_if<details::_Is_extent_or_index<_Tuple_type<_Rank>>::value, _Tuple_type<_Rank>>::type
890 operator*(const _Tuple_type<_Rank>& _Lhs, typename _Tuple_type<_Rank>::value_type _Rhs) __GPU
891 {
892  _Tuple_type<_Rank> new_Tuple = details::_Create_uninitialized_tuple<_Tuple_type<_Rank>>();
893  details::_arithmetic_op_loop_helper<_Tuple_type<_Rank>, opMul>::func(new_Tuple, _Lhs, _Rhs);
894  return new_Tuple;
895 }
896 
897 template <int _Rank, template <int> class _Tuple_type>
898 typename std::enable_if<details::_Is_extent_or_index<_Tuple_type<_Rank>>::value, _Tuple_type<_Rank>>::type
899 operator*(typename _Tuple_type<_Rank>::value_type _Lhs, const _Tuple_type<_Rank>& _Rhs) __GPU
900 {
901  _Tuple_type<_Rank> new_Tuple = details::_Create_uninitialized_tuple<_Tuple_type<_Rank>>();
902  details::_arithmetic_op_loop_helper<_Tuple_type<_Rank>, opMul>::func(new_Tuple, _Lhs, _Rhs);
903  return new_Tuple;
904 }
905 
906 template <int _Rank, template <int> class _Tuple_type>
907 typename std::enable_if<details::_Is_extent_or_index<_Tuple_type<_Rank>>::value, _Tuple_type<_Rank>>::type
908 operator/(const _Tuple_type<_Rank>& _Lhs, typename _Tuple_type<_Rank>::value_type _Rhs) __GPU
909 {
910  _Tuple_type<_Rank> new_Tuple = details::_Create_uninitialized_tuple<_Tuple_type<_Rank>>();
911  details::_arithmetic_op_loop_helper<_Tuple_type<_Rank>, opDiv>::func(new_Tuple, _Lhs, _Rhs);
912  return new_Tuple;
913 }
914 
915 template <int _Rank, template <int> class _Tuple_type>
916 typename std::enable_if<details::_Is_extent_or_index<_Tuple_type<_Rank>>::value, _Tuple_type<_Rank>>::type
917 operator/(typename _Tuple_type<_Rank>::value_type _Lhs, const _Tuple_type<_Rank>& _Rhs) __GPU
918 {
919  _Tuple_type<_Rank> new_Tuple = details::_Create_uninitialized_tuple<_Tuple_type<_Rank>>();
920  details::_arithmetic_op_loop_helper<_Tuple_type<_Rank>, opDiv>::func(new_Tuple, _Lhs, _Rhs);
921  return new_Tuple;
922 }
923 
924 template <int _Rank, template <int> class _Tuple_type>
925 typename std::enable_if<details::_Is_extent_or_index<_Tuple_type<_Rank>>::value, _Tuple_type<_Rank>>::type
926 operator%(const _Tuple_type<_Rank>& _Lhs, typename _Tuple_type<_Rank>::value_type _Rhs) __GPU
927 {
928  _Tuple_type<_Rank> new_Tuple = details::_Create_uninitialized_tuple<_Tuple_type<_Rank>>();
929  details::_arithmetic_op_loop_helper<_Tuple_type<_Rank>, opMod>::func(new_Tuple, _Lhs, _Rhs);
930  return new_Tuple;
931 }
932 
933 template <int _Rank, template <int> class _Tuple_type>
934 typename std::enable_if<details::_Is_extent_or_index<_Tuple_type<_Rank>>::value, _Tuple_type<_Rank>>::type
935 operator%(typename _Tuple_type<_Rank>::value_type _Lhs, const _Tuple_type<_Rank>& _Rhs) __GPU
936 {
937  _Tuple_type<_Rank> new_Tuple = details::_Create_uninitialized_tuple<_Tuple_type<_Rank>>();
938  details::_arithmetic_op_loop_helper<_Tuple_type<_Rank>, opMod>::func(new_Tuple, _Lhs, _Rhs);
939  return new_Tuple;
940 }
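These free operators give index and extent value semantics for element-wise arithmetic; the enable_if gate restricts them to exactly those two tuple types. A short sketch (illustrative, not part of amp.h):

    #include <amp.h>
    using namespace concurrency;

    void demo() {
        index<2> a(1, 2), b(3, 4);
        index<2> sum = a + b;      // (4, 6): element-wise addition
        index<2> scaled = a * 2;   // (2, 4): the scalar is applied per element
        extent<2> e(8, 8);
        extent<2> smaller = e - 2; // (6, 6)
        bool equal = (a == b);     // false: all elements must match
        (void)sum; (void)scaled; (void)smaller; (void)equal;
    }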
948 class tile_barrier
949 {
950 public:
958 #pragma warning( suppress : 4100 ) // unreferenced formal parameter
959  tile_barrier(const tile_barrier& _Other) __GPU {}
960 
965  void wait() const __GPU_ONLY
966  {
968  }
969 
974  void wait_with_all_memory_fence() const __GPU_ONLY
975  {
977  }
978 
983  void wait_with_global_memory_fence() const __GPU_ONLY
984  {
986  }
987 
992  void wait_with_tile_static_memory_fence() const __GPU_ONLY
993  {
995  }
996 };
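A tile_barrier cannot be constructed by user code; it arrives through the tiled_index passed into a tiled parallel_for_each, and wait() synchronizes the threads of one tile, typically around tile_static traffic. A sketch (illustrative, not part of amp.h; assumes the input length is an exact multiple of the tile size):

    #include <amp.h>
    using namespace concurrency;

    void tile_sums(const array_view<const int, 1>& in, const array_view<int, 1>& out) {
        parallel_for_each(in.extent.tile<64>(), [=](tiled_index<64> tidx) restrict(amp) {
            tile_static int cache[64];
            cache[tidx.local[0]] = in[tidx.global];
            tidx.barrier.wait();   // every thread stores before any thread reads
            if (tidx.local[0] == 0) {
                int s = 0;
                for (int i = 0; i < 64; ++i) s += cache[i];
                out[tidx.tile[0]] = s;  // one partial sum per tile
            }
        });
    }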
997 
1002 template <int _Rank> class _Tiled_index_base
1003 {
1004 public:
1005 
1007 
1008  static const int rank = _Rank;
1009 
1013  const index<rank> global;
1014 
1018  const index<rank> local;
1019 
1023  const index<rank> tile;
1024 
1028  const index<rank> tile_origin;
1029 
1033  const tile_barrier barrier;
1034 
1053  _Tiled_index_base(const index<rank>& _Global,
1054  const index<rank>& _Local,
1055  const index<rank>& _Tile,
1056  const index<rank>& _Tile_origin,
1057  const tile_barrier& _Barrier) __GPU
1058  : global(_Global), local(_Local), tile(_Tile), tile_origin(_Tile_origin), barrier(_Barrier)
1059  {}
1060 
1067  _Tiled_index_base(const _Tiled_index_base& _Other) __GPU
1068  : global(_Other.global),
1069  local(_Other.local),
1070  tile(_Other.tile),
1071  tile_origin(_Other.tile_origin),
1072  barrier(_Other.barrier)
1073  {}
1074 
1079  operator const index<rank>() const __GPU
1080  {
1081  return global;
1082  }
1083 
1084 private:
1085  _Tiled_index_base& operator=(const _Tiled_index_base&) __GPU;
1086 };
1087 
1096 template <int _Dim0, int _Dim1 = 0, int _Dim2 = 0> class tiled_index : public _Tiled_index_base<3>
1097 {
1098 public:
1117  tiled_index(const index<rank>& _Global,
1118  const index<rank>& _Local,
1119  const index<rank>& _Tile,
1120  const index<rank>& _Tile_origin,
1121  const tile_barrier& _Barrier) __GPU
1122  : _Tiled_index_base(_Global, _Local, _Tile, _Tile_origin, _Barrier)
1123  {}
1124 
1131  tiled_index(const tiled_index& _Other) __GPU
1132  : _Tiled_index_base(_Other)
1133  {}
1134 
1139  __declspec(property(get=get_tile_extent)) extent<rank> tile_extent;
1140  extent<rank> get_tile_extent() const __GPU { return extent<rank>(_Dim0, _Dim1, _Dim2); }
1141 
1145  static const int tile_dim0 = _Dim0;
1146  static const int tile_dim1 = _Dim1;
1147  static const int tile_dim2 = _Dim2;
1148 
1149 private:
1150  tiled_index& operator=(const tiled_index&) __GPU;
1151 };
1152 
1153 template <int _Dim0, int _Dim1>
1154 class tiled_index<_Dim0, _Dim1, 0> : public _Tiled_index_base<2>
1155 {
1156 public:
1175  tiled_index(const index<rank>& _Global,
1176  const index<rank>& _Local,
1177  const index<rank>& _Tile,
1178  const index<rank>& _Tile_origin,
1179  const tile_barrier& _Barrier) __GPU
1180  : _Tiled_index_base(_Global, _Local, _Tile, _Tile_origin, _Barrier)
1181  {}
1182 
1189  tiled_index(const tiled_index& _Other) __GPU
1190  : _Tiled_index_base(_Other)
1191  {}
1192 
1197  __declspec(property(get=get_tile_extent)) extent<rank> tile_extent;
1198  extent<rank> get_tile_extent() const __GPU { return extent<rank>(_Dim0, _Dim1); }
1199 
1203  static const int tile_dim0 = _Dim0;
1204  static const int tile_dim1 = _Dim1;
1205 
1206 private:
1207  tiled_index& operator=(const tiled_index&) __GPU;
1208 };
1209 
1210 template <int _Dim0>
1211 class tiled_index<_Dim0, 0, 0> : public _Tiled_index_base<1>
1212 {
1213 public:
1232  tiled_index(const index<rank>& _Global,
1233  const index<rank>& _Local,
1234  const index<rank>& _Tile,
1235  const index<rank>& _Tile_origin,
1236  const tile_barrier& _Barrier) __GPU
1237  : _Tiled_index_base(_Global, _Local, _Tile, _Tile_origin, _Barrier)
1238  {}
1239 
1246  tiled_index(const tiled_index& _Other) __GPU
1247  : _Tiled_index_base(_Other)
1248  {}
1249 
1254  __declspec(property(get=get_tile_extent)) extent<rank> tile_extent;
1255  extent<rank> get_tile_extent() const __GPU { return extent<rank>(_Dim0); }
1256 
1260  static const int tile_dim0 = _Dim0;
1261 
1262 private:
1263  tiled_index& operator=(const tiled_index&) __GPU;
1264 };
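The members of a tiled_index are related by two invariants: tile_origin == tile * tile_extent, and global == tile_origin + local. A sketch that checks the second one on the accelerator (illustrative, not part of amp.h):

    #include <amp.h>
    using namespace concurrency;

    void check_invariant(const array_view<int, 2>& flags) {
        parallel_for_each(flags.extent.tile<8, 8>(), [=](tiled_index<8, 8> tidx) restrict(amp) {
            index<2> recomputed = tidx.tile_origin + tidx.local;
            flags[tidx.global] = (recomputed == tidx.global) ? 1 : 0;  // always 1
        });
    }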
1265 
1266 
1274 template <int _Dim0, int _Dim1 /*=0*/, int _Dim2 /*=0*/> class tiled_extent : public Concurrency::extent<3>
1275 {
1276 public:
1277 
1278  static_assert(_Dim0>0, "_Dim0 must be positive");
1279  static_assert(_Dim1>0, "_Dim1 must be positive");
1280  static_assert(_Dim2>0, "_Dim2 must be positive");
1281 
1285  tiled_extent() __GPU {}
1286 
1290  tiled_extent(const Concurrency::extent<rank>& _Other) __GPU : Concurrency::extent<rank>(_Other)
1291  {}
1292 
1296  tiled_extent(const tiled_extent& _Other) __GPU : Concurrency::extent<rank>(_Other)
1297  {}
1298 
1302  tiled_extent& operator=(const tiled_extent& _Other) __GPU
1303  {
1304  Concurrency::extent<rank>::operator=(_Other);
1305  return *this;
1306  }
1307 
1312  __declspec(property(get=get_tile_extent)) Concurrency::extent<rank> tile_extent;
1313  Concurrency::extent<rank> get_tile_extent() const __GPU
1314  {
1315  return Concurrency::extent<rank>(_Dim0, _Dim1, _Dim2);
1316  }
1317 
1321  tiled_extent pad() const __GPU
1322  {
1323  Concurrency::extent<rank> _New_extent(((static_cast<unsigned int>((*this)[0]) + _Dim0 - 1)/_Dim0) * _Dim0,
1324  ((static_cast<unsigned int>((*this)[1]) + _Dim1 - 1)/_Dim1) * _Dim1,
1325  ((static_cast<unsigned int>((*this)[2]) + _Dim2 - 1)/_Dim2) * _Dim2);
1326 
1327  return tiled_extent<_Dim0,_Dim1,_Dim2>(_New_extent);
1328  }
1329 
1333  tiled_extent truncate() const __GPU
1334  {
1335  Concurrency::extent<rank> _New_extent(((*this)[0]/_Dim0) * _Dim0, ((*this)[1]/_Dim1) * _Dim1, ((*this)[2]/_Dim2) * _Dim2);
1336  return tiled_extent<_Dim0,_Dim1,_Dim2>(_New_extent);
1337  }
1338 
1342  static const int tile_dim0 = _Dim0;
1343  static const int tile_dim1 = _Dim1;
1344  static const int tile_dim2 = _Dim2;
1345 
1346  // implementation details (compiler helpers) - begin
1347 
1348  // Given the local index, the tile index, the global index, in the 0-based domain that
1349  // has same extents as 'this', and a barrier object, return a tiled_index<_Dim0, _Dim1, _Dim2> into
1350  // the 'this' tiled_extent domain.
1351  tiled_index<_Dim0, _Dim1, _Dim2> _map_index(const index<rank>& _Local, const index<rank>& _Tile, const index<rank>& _Global, tile_barrier& _Barrier) const __GPU
1352  {
1353  index<rank> _Tile_origin = details::_Create_uninitialized_tuple<index<rank>>();
1354  details::_arithmetic_op_loop_helper<index<rank>, details::opMul>::func(_Tile_origin, _Tile, tile_extent);
1355  return tiled_index<_Dim0, _Dim1, _Dim2>(_Global, _Local, _Tile, _Tile_origin, _Barrier);
1356  }
1357  // implementation details (compiler helpers) - end
1358 };
1359 
1360 
1361 template <int _Dim0, int _Dim1>
1362 class tiled_extent<_Dim0, _Dim1, 0> : public Concurrency::extent<2>
1363 {
1364 public:
1365 
1366  static_assert(_Dim0>0, "_Dim0 must be positive");
1367  static_assert(_Dim1>0, "_Dim1 must be positive");
1368 
1372  tiled_extent() __GPU {}
1373 
1377  tiled_extent(const Concurrency::extent<rank>& _Other) __GPU : Concurrency::extent<rank>(_Other)
1378  {}
1379 
1383  tiled_extent(const tiled_extent& _Other) __GPU : Concurrency::extent<rank>(_Other)
1384  {}
1385 
1389  tiled_extent& operator=(const tiled_extent& _Other) __GPU
1390  {
1391  Concurrency::extent<rank>::operator=(_Other);
1392  return *this;
1393  }
1394 
1399  __declspec(property(get=get_tile_extent)) Concurrency::extent<rank> tile_extent;
1400  Concurrency::extent<rank> get_tile_extent() const __GPU
1401  {
1402  return Concurrency::extent<rank>(_Dim0, _Dim1);
1403  }
1404 
1408  tiled_extent pad() const __GPU
1409  {
1410  Concurrency::extent<rank> _New_extent(((static_cast<unsigned int>((*this)[0]) + _Dim0 - 1)/_Dim0) * _Dim0,
1411  ((static_cast<unsigned int>((*this)[1]) + _Dim1 - 1)/_Dim1) * _Dim1);
1412  return tiled_extent<_Dim0,_Dim1>(_New_extent);
1413  }
1414 
1418  tiled_extent truncate() const __GPU
1419  {
1420  Concurrency::extent<rank> _New_extent(((*this)[0]/_Dim0) * _Dim0, ((*this)[1]/_Dim1) * _Dim1);
1421  return tiled_extent<_Dim0,_Dim1>(_New_extent);
1422  }
1423 
1427  static const int tile_dim0 = _Dim0;
1428  static const int tile_dim1 = _Dim1;
1429 
1430  // implementation details (compiler helpers) - begin
1431 
1432  // Given the local index, the tile index, the global index, in the 0-based domain that
1433  // has same extents as 'this', and a barrier object, return a tiled_index<_Dim0, _Dim1> into
1434  // the 'this' tiled_extent domain.
1435  tiled_index<_Dim0, _Dim1> _map_index(const index<rank>& _Local, const index<rank>& _Tile, const index<rank>& _Global, tile_barrier& _Barrier) const __GPU
1436  {
1437  index<rank> _Tile_origin = details::_Create_uninitialized_tuple<index<rank>>();
1438  details::_arithmetic_op_loop_helper<index<rank>, details::opMul>::func(_Tile_origin, _Tile, tile_extent);
1439  return tiled_index<_Dim0, _Dim1>(_Global, _Local, _Tile, _Tile_origin, _Barrier);
1440  }
1441  // implementation details (compiler helpers) - end
1442 };
1443 
1444 template <int _Dim0>
1445 class tiled_extent<_Dim0, 0, 0> : public Concurrency::extent<1>
1446 {
1447 public:
1448 
1449  static_assert(_Dim0>0, "_Dim0 must be positive");
1450 
1454  tiled_extent() __GPU {}
1455 
1459  tiled_extent(const Concurrency::extent<rank>& _Other) __GPU : Concurrency::extent<rank>(_Other)
1460  {}
1461 
1465  tiled_extent(const tiled_extent& _Other) __GPU : Concurrency::extent<rank>(_Other)
1466  {}
1467 
1471  tiled_extent& operator=(const tiled_extent& _Other) __GPU
1472  {
1473  Concurrency::extent<rank>::operator=(_Other);
1474  return *this;
1475  }
1476 
1481  __declspec(property(get=get_tile_extent)) Concurrency::extent<rank> tile_extent;
1482  Concurrency::extent<rank> get_tile_extent() const __GPU
1483  {
1484  return Concurrency::extent<rank>(_Dim0);
1485  }
1486 
1490  tiled_extent pad() const __GPU
1491  {
1492  Concurrency::extent<rank> _New_extent(((static_cast<unsigned int>((*this)[0]) + _Dim0 - 1)/_Dim0) * _Dim0);
1493  return tiled_extent<_Dim0>(_New_extent);
1494  }
1495 
1499  tiled_extent truncate() const __GPU
1500  {
1501  Concurrency::extent<rank> _New_extent(((*this)[0]/_Dim0) * _Dim0);
1502  return tiled_extent<_Dim0>(_New_extent);
1503  }
1504 
1508  static const int tile_dim0 = _Dim0;
1509 
1510  // implementation details (compiler helpers) - begin
1511 
1512  // Given the local index, the tile index, the global index, in the 0-based domain that
1513  // has same extents as 'this', and a barrier object, return a tiled_index<_Dim0> into
1514  // the 'this' tiled_extent domain.
1515  tiled_index<_Dim0> _map_index(const index<rank>& _Local, const index<rank>& _Tile, const index<rank>& _Global, tile_barrier& _Barrier) const __GPU
1516  {
1517  index<rank> _Tile_origin = details::_Create_uninitialized_tuple<index<rank>>();
1518  details::_arithmetic_op_loop_helper<index<rank>, details::opMul>::func(_Tile_origin, _Tile, tile_extent);
1519  return tiled_index<_Dim0>(_Global, _Local, _Tile, _Tile_origin, _Barrier);
1520  }
1521 };
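pad() and truncate() resolve the common case where the global extent is not a multiple of the tile size: pad() rounds each dimension up to the next tile multiple, truncate() rounds it down. Worked numbers (illustrative, not part of amp.h):

    #include <amp.h>
    #include <cassert>
    using namespace concurrency;

    int main() {
        tiled_extent<64> te = extent<1>(1000).tile<64>();
        assert(te.pad()[0] == 1024);      // ((1000 + 64 - 1) / 64) * 64
        assert(te.truncate()[0] == 960);  // (1000 / 64) * 64
    }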
1522 
1523 namespace details
1524 {
1525 
1526 template <int _Old_element_size, int _New_element_size>
1527 int _Calculate_reinterpreted_size(int _Old_size) __GPU_ONLY
1528 {
1529  int _Total_size = _Old_element_size * _Old_size;
1530  int _New_size = (_Total_size + _New_element_size - 1)/ _New_element_size;
1531 
1532  return _New_size;
1533 }
1534 
1535 
1536 template <int _Old_element_size, int _New_element_size>
1537 int _Calculate_reinterpreted_size(int _Old_size) __CPU_ONLY
1538 {
1539  int _Total_size = _Old_element_size * _Old_size;
1540  int _New_size = (_Total_size + _New_element_size - 1)/ _New_element_size;
1541 
1542  if (_New_size * _New_element_size > _Total_size)
1543  throw runtime_exception("Element type of reinterpret_as does not evenly divide into extent", E_INVALIDARG);
1544 
1545  return _New_size;
1546 }
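The sizes here are measured in ints, and the rounding-up division makes the __GPU_ONLY overload permissive while the __CPU_ONLY overload rejects reinterpretations that do not divide evenly. Worked numbers (illustrative comment, not part of amp.h):

    // 10 doubles (_Old_element_size == 2) viewed as ints (_New_element_size == 1):
    //   _Total_size = 2 * 10 = 20;  _New_size = (20 + 1 - 1) / 1 = 20  -> fits exactly
    // 5 ints viewed as doubles:
    //   _Total_size = 5;  _New_size = (5 + 2 - 1) / 2 = 3
    //   3 * 2 = 6 > 5, so the __CPU_ONLY overload throws runtime_exception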
1547 
1548 
1549 // This class defines the shape of an array view and provides
1550 // the functionality of translating dimensional indices into
1551 // flat offsets into the underlying buffer
1552 template <int _Rank, int _Element_size /* in number of ints */>
1553 class _Array_view_shape
1554 {
1555  typedef _Array_flatten_helper<_Rank, typename Concurrency::extent<_Rank>::value_type, typename Concurrency::index<_Rank>::value_type> _Flatten_helper;
1556  friend class _Array_view_shape<_Rank+1, _Element_size>;
1557 
1558 public:
1562  __declspec(property(get=get_extent)) Concurrency::extent<_Rank> extent;
1563  Concurrency::extent<_Rank> get_extent() const __GPU
1564  {
1565  return _M_view_extent;
1566  }
1567 
1569 
1570 protected:
1571  int _Base_linear_offset() const __GPU
1572  {
1573  return (_M_total_linear_offset - (_Element_size * _Flatten_helper::func(_M_array_multiplier._M_base, _M_view_offset._M_base)));
1574  }
1575 
1576  _Array_view_shape(const _Array_view_shape& _Other) __GPU
1577  :
1578  _M_array_extent(_Other._M_array_extent),
1579  _M_array_multiplier(_Other._M_array_multiplier),
1580  _M_view_offset(_Other._M_view_offset),
1581  _M_total_linear_offset(_Other._M_total_linear_offset),
1582  _M_view_extent(_Other._M_view_extent)
1583  {
1584  }
1585 
1586  // For "section"
1587  _Array_view_shape(const _Array_view_shape& _Other, const Concurrency::index<_Rank>& _Section_origin, const Concurrency::extent<_Rank>& _Section_extent) __GPU
1588  :
1589  _M_array_extent(_Other._M_array_extent),
1590  _M_array_multiplier(_Other._M_array_multiplier),
1591  _M_view_offset(_Other._M_view_offset + _Section_origin),
1592  _M_view_extent(_Section_extent)
1593  {
1594  _Is_valid_section(_Other._M_view_extent, _Section_origin, _Section_extent);
1595 
1596  _M_total_linear_offset = _Other._Base_linear_offset() + (_Element_size * _Flatten_helper::func(_M_array_multiplier._M_base, _M_view_offset._M_base));
1597  }
1598 
1599  _Array_view_shape(int _Base_linear_offset, const Concurrency::extent<_Rank>& _Array_extent) __GPU
1600  :
1601  _M_array_extent(_Array_extent),
1602  _M_view_offset(index<_Rank>()),
1603  _M_total_linear_offset(_Base_linear_offset),
1604  _M_view_extent(_Array_extent)
1605  {
1606  _Initialize_multiplier();
1607  }
1608 
1609  _Array_view_shape(int _Base_linear_offset, const Concurrency::extent<_Rank>& _Array_extent,
1610  const Concurrency::index<_Rank>& _Section_origin, const Concurrency::extent<_Rank>& _Section_extent) __GPU
1611  :
1612  _M_array_extent(_Array_extent),
1613  _M_view_offset(_Section_origin),
1614  _M_total_linear_offset(_Base_linear_offset),
1615  _M_view_extent(_Section_extent)
1616  {
1617  _Is_valid_section(_Array_extent, _Section_origin, _Section_extent);
1618 
1619  _Initialize_multiplier();
1620  _M_total_linear_offset += (_Element_size * _Flatten_helper::func(_M_array_multiplier._M_base, _M_view_offset._M_base));
1621  }
1622 
1623  _Array_view_shape& operator=(const _Array_view_shape& _Other) __GPU
1624  {
1625  _M_array_extent = _Other._M_array_extent;
1626  _M_array_multiplier = _Other._M_array_multiplier;
1627  _M_view_offset = _Other._M_view_offset;
1628  _M_total_linear_offset = _Other._M_total_linear_offset;
1629  _M_view_extent = _Other._M_view_extent;
1630  return *this;
1631  }
1632 
1633  void _Project0(int _I, _Array_view_shape<_Rank-1,_Element_size>& _Projected_shape) const __GPU
1634  {
1635  static_assert(_Rank > 1, "Projection is only supported on array_views with a rank of 2 or higher");
1636 
1637  _Is_valid_projection(_I, this->_M_view_extent);
1638 
1639  typedef Concurrency::extent<_Rank-1> _RES_EXT;
1640  typedef Concurrency::extent<_Rank> _SRC_EXT;
1641  typedef Concurrency::index<_Rank-1> _RES_IDX;
1642  typedef Concurrency::index<_Rank> _SRC_IDX;
1644  _Projected_shape._M_array_extent, this->_M_array_extent,
1645  _Projected_shape._M_array_multiplier, this->_M_array_multiplier,
1646  _Projected_shape._M_view_offset, this->_M_view_offset,
1647  _Projected_shape._M_view_extent, this->_M_view_extent);
1648 
1649  _Projected_shape._M_total_linear_offset = _M_total_linear_offset + (_Element_size * _I * _M_array_multiplier[0]);
1650  }
1651 
1653  : _M_array_extent(details::_do_not_initialize), _M_array_multiplier(details::_do_not_initialize),
1654  _M_view_offset(details::_do_not_initialize), _M_view_extent(details::_do_not_initialize)
1655  {
1656  }
1657 
1658 private:
1659 
1660  void _Initialize_multiplier() __GPU
1661  {
1662  details::_Is_valid_extent(_M_array_extent);
1663  unsigned int _Ext = _M_array_extent[_Rank-1];
1664  details::_Array_init_helper<Concurrency::extent<_Rank>, Concurrency::extent<_Rank>>::func(_Ext, _M_array_multiplier, _M_array_extent);
1665  }
1666 
1667 protected:
1668  Concurrency::extent<_Rank> _M_array_extent;
1669  Concurrency::extent<_Rank> _M_array_multiplier;
1670  Concurrency::index<_Rank> _M_view_offset;
1671  int _M_total_linear_offset; // in number of units
1672  Concurrency::extent<_Rank> _M_view_extent;
1673 };
1674 
1675 template <int _Rank, int _Element_size>
1676 class _Array_view_base : public _Array_view_shape<_Rank,_Element_size /* in number of ints */>
1677 {
1678  typedef _Array_flatten_helper<_Rank, typename Concurrency::extent<_Rank>::value_type, typename Concurrency::index<_Rank>::value_type> _Flatten_helper;
1679 
1680  template <int _R, int _S>
1681  friend class _Array_view_base;
1682 
1683 public:
1684 
1686 
1687  ~_Array_view_base() __GPU
1688  {
1689  // Unregister the view; Do not throw exception
1690  _Unregister(false);
1691  }
1692 
1693 protected:
1694 
1695  _Array_view_base() __GPU {}
1696 
1697  _Array_view_base(const _Buffer_descriptor& _Buffer_desc, const _Array_view_shape<_Rank, _Element_size>& _Shape) __GPU
1698  :
1699  _M_buffer_descriptor(_Buffer_desc),
1700  _Array_view_shape<_Rank, _Element_size>(_Shape)
1701  {
1702  // Register the view
1703  _Register();
1704  }
1705 
1706  _Array_view_base(const _Array_view_base& _Other) __GPU
1707  :
1708  _M_buffer_descriptor(_Other._M_buffer_descriptor),
1709  _Array_view_shape<_Rank, _Element_size>(_Other)
1710  {
1711  // Register the view
1712  _Register_copy(_Other);
1713 
1714  // update this buffer descriptor in case _Register_copy was late and missed the update opportunity.
1715  _M_buffer_descriptor = _Other._M_buffer_descriptor;
1716  }
1717 
1718  _Array_view_base(const _Array_view_base& _Other, const Concurrency::extent<_Rank>& _Array_extent) __GPU
1719  :
1720  _M_buffer_descriptor(_Other._M_buffer_descriptor),
1721  _Array_view_shape<_Rank, _Element_size>(_Other._Base_linear_offset(), _Array_extent)
1722  {
1723  // Register the view
1724  _Register();
1725  }
1726 
1727  _Array_view_base(const _Array_view_base& _Other, const Concurrency::index<_Rank>& _Section_origin, const Concurrency::extent<_Rank>& _Section_extent) __GPU
1728  :
1729  _M_buffer_descriptor(_Other._M_buffer_descriptor),
1730  _Array_view_shape<_Rank, _Element_size>(_Other, _Section_origin, _Section_extent)
1731  {
1732  // Register the view
1733  _Register();
1734  }
1735 
1736  _Array_view_base(const _Buffer_descriptor& _Buffer_desc, const Concurrency::extent<_Rank>& _Array_extent) __GPU
1737  :
1738  _M_buffer_descriptor(_Buffer_desc),
1739  _Array_view_shape<_Rank, _Element_size>(0, _Array_extent)
1740  {
1741  // Register the view
1742  _Register();
1743  }
1744 
1745  _Array_view_base(const _Buffer_descriptor& _Buffer_desc, int _Base_linear_offset, const Concurrency::extent<_Rank>& _Array_extent) __GPU
1746  :
1747  _M_buffer_descriptor(_Buffer_desc),
1748  _Array_view_shape<_Rank, _Element_size>(_Base_linear_offset,_Array_extent)
1749  {
1750  // Register the view
1751  _Register();
1752  }
1753 
1754  _Array_view_base(
1755  const _Buffer_descriptor& _Buffer_desc,
1756  int _Base_linear_offset,
1757  const Concurrency::extent<_Rank>& _Array_extent,
1758  const Concurrency::index<_Rank>& _View_offset,
1759  const Concurrency::extent<_Rank>& _View_extent
1760  ) __CPU_ONLY
1761  :
1762  _M_buffer_descriptor(_Buffer_desc),
1763  _Array_view_shape<_Rank, _Element_size>(_Base_linear_offset,_Array_extent,_View_offset,_View_extent)
1764  {
1765  // Register the view
1766  _Register(_Buffer_desc._Get_view_key());
1767  }
1768 
1769  _Array_view_base(
1770  const _Buffer_descriptor& _Buffer_desc,
1771  int _Base_linear_offset,
1772  const Concurrency::extent<_Rank>& _Array_extent,
1773  const Concurrency::index<_Rank>& _View_offset,
1774  const Concurrency::extent<_Rank>& _View_extent
1775  ) __GPU_ONLY
1776  :
1777  _M_buffer_descriptor(_Buffer_desc),
1778  _Array_view_shape<_Rank, _Element_size>(_Base_linear_offset,_Array_extent,_View_offset,_View_extent)
1779  {
1780  // Register the view
1781  _Register();
1782  }
1783 
1784  _Array_view_base(const _Buffer_descriptor& _Buffer_desc, const Concurrency::extent<_Rank>& _Array_extent,
1785  const Concurrency::index<_Rank>& _Section_origin, const Concurrency::extent<_Rank>& _Section_extent) __GPU
1786  :
1787  _M_buffer_descriptor(_Buffer_desc),
1788  _Array_view_shape<_Rank, _Element_size>(0,_Array_extent,_Section_origin,_Section_extent)
1789  {
1790  // Register the view
1791  _Register();
1792  }
1793 
1794  _Array_view_base(const Concurrency::extent<_Rank>& _Array_extent) __CPU_ONLY
1795  :
1796  _Array_view_shape<_Rank, _Element_size>(0, _Array_extent)
1797  {
1798  _Ubiquitous_buffer_ptr _PUBuf = _Ubiquitous_buffer::_Create_ubiquitous_buffer(_Array_extent.size(), _Element_size * sizeof(int));
1799  _M_buffer_descriptor = _Buffer_descriptor(NULL, _PUBuf, _No_access, _No_access);
1800 
1801  // Register the view
1802  _Register();
1803  }
1804 
1805  _Array_view_base(_In_ void * _Data, const Concurrency::extent<_Rank>& _Array_extent) __CPU_ONLY
1806  :
1807  _Array_view_shape<_Rank, _Element_size>(0, _Array_extent)
1808  {
1809  if (_Data == NULL) {
1810  throw runtime_exception("Invalid pointer argument (NULL) to array_view constructor", E_INVALIDARG);
1811  }
1812 
1813  _Buffer_ptr _PBuf = _Buffer::_Create_buffer(_Data, accelerator(accelerator::cpu_accelerator).default_view, _Array_extent.size(), _Element_size * sizeof(int));
1814  _Ubiquitous_buffer_ptr _PUBuf = _Ubiquitous_buffer::_Create_ubiquitous_buffer(_PBuf);
1815  _M_buffer_descriptor = _Buffer_descriptor(_Data, _PUBuf, _Read_write_access, _Read_write_access);
1816 
1817  // Register the view
1818  _Register();
1819  }
1820 
1821  _Array_view_base(_In_ void * _Data, const Concurrency::extent<_Rank>& _Array_extent) __GPU_ONLY
1822  :
1823  _Array_view_shape<_Rank, _Element_size>(0,_Array_extent), _M_buffer_descriptor(_Data, NULL, _Read_write_access, _Read_write_access)
1824  {
1825  }
1826 
1827  _Array_view_base(const void * _Data, const Concurrency::extent<_Rank>& _Array_extent) __CPU_ONLY
1828  :
1829  _Array_view_shape<_Rank, _Element_size>(0, _Array_extent)
1830  {
1831  if (_Data == NULL) {
1832  throw runtime_exception("Invalid pointer argument (NULL) to array_view constructor", E_INVALIDARG);
1833  }
1834 
1835  _Buffer_ptr _PBuf = _Buffer::_Create_buffer(const_cast<void*>(_Data), accelerator(accelerator::cpu_accelerator).default_view, _Array_extent.size(), _Element_size * sizeof(int));
1836  _Ubiquitous_buffer_ptr _PUBuf = _Ubiquitous_buffer::_Create_ubiquitous_buffer(_PBuf);
1837  _M_buffer_descriptor = _Buffer_descriptor(const_cast<void*>(_Data), _PUBuf, _Read_access, _Read_access);
1838 
1839  // Register the view
1840  _Register();
1841  }
1842 
1843  _Array_view_base(const void * _Data, const Concurrency::extent<_Rank>& _Array_extent) __GPU_ONLY
1844  :
1845 #pragma warning( push )
1846 #pragma warning( disable : 4880 )
1847  // Casting away constness in amp restricted scope might result in
1848  // undefined behavior; therefore, the compiler reports a level 1 warning
1849  // for it. The following const_cast is harmless, though, so we suppress
1850  // the warning just for this line.
1851  _Array_view_shape<_Rank, _Element_size>(0,_Array_extent), _M_buffer_descriptor(const_cast<void*>(_Data), NULL, _Read_access, _Read_access)
1852 #pragma warning( pop )
1853  {
1854  }
1855 
1856  _Array_view_base& operator=(const _Array_view_base& _Other) __GPU
1857  {
1858  if (this != &_Other)
1859  {
1860  // Unregister the current view
1861  _Unregister();
1862 
1863  _M_buffer_descriptor = _Other._M_buffer_descriptor;
1864  _Array_view_shape<_Rank, _Element_size>::operator=(_Other);
1865 
1866  // Register the new view
1867  _Register_copy(_Other);
1868 
1869  // update this buffer descriptor in case _Register_copy was late and missed the update opportunity.
1870  _M_buffer_descriptor = _Other._M_buffer_descriptor;
1871  }
1872 
1873  return *this;
1874  }
1875 
1876  _Ret_ void * _Access(const index<_Rank>& _Index) const __GPU
1877  {
1878  int * _Ptr = reinterpret_cast<int *>(_M_buffer_descriptor._M_data_ptr);
1879  return &_Ptr[this->_M_total_linear_offset + (_Element_size * _Flatten_helper::func(this->_M_array_multiplier._M_base, _Index._M_base))];
1880  }
1881 
1882  _Ret_ void * _Access(_Access_mode _Requested_mode, const index<_Rank>& _Index) const __CPU_ONLY
1883  {
1884  // Refresh the data ptr if we do not have requested access
1885  if ((_M_buffer_descriptor._M_curr_cpu_access_mode & _Requested_mode) != _Requested_mode) {
1886  _M_buffer_descriptor._Get_CPU_access(_Requested_mode);
1887  }
1888 
1889  return _Access(_Index);
1890  }
1891 
1892  _Ret_ void * _Access(_Access_mode /*_Requested_mode*/, const index<_Rank>& _Index) const __GPU_ONLY
1893  {
1894  return _Access(_Index);
1895  }
1896 
1897  _Array_view_base _Section(const Concurrency::index<_Rank>& _Section_origin, const Concurrency::extent<_Rank>& _Section_extent) const __GPU
1898  {
1899  auto _View = _Array_view_base(*this, _Section_origin, _Section_extent);
1900 
1901  // Register the constructed view with the section buffer view shape
1902  _View._Register(_Array_view_base::_Create_section_buffer_shape(this->_M_buffer_descriptor, _Section_origin, _Section_extent));
1903 
1904  return _View;
1905  }
1906 
1907  _Array_view_base _Section(const index<_Rank>& _Idx) const __GPU
1908  {
1909  return _Section(_Idx, this->extent - _Idx);
1910  }
1911 
1912  void _Project0(int _I, _Array_view_base<_Rank-1,_Element_size>& _Projected_view) const __GPU
1913  {
1914  _Projected_view._M_buffer_descriptor = this->_M_buffer_descriptor;
1915  _Array_view_shape<_Rank, _Element_size>::_Project0(_I, _Projected_view);
1916 
1917  // Register the constructed view with the projection buffer view shape
1918  _Projected_view._Register(_Array_view_base::_Create_projection_buffer_shape(this->_M_buffer_descriptor, 0, _I));
1919  }
1920 
1921  template <int _New_element_size>
1922  _Array_view_base<_Rank, _New_element_size> _Reinterpret_as() const __GPU
1923  {
1924  static_assert(_Rank==1, "reinterpret_as is only permissible on array views of rank 1");
1925  int _New_size = _Calculate_reinterpreted_size<_Element_size,_New_element_size>(this->_M_view_extent.size());
1926  return _Array_view_base<_Rank,_New_element_size>(this->_M_buffer_descriptor,
1927  this->_M_total_linear_offset,
1928  Concurrency::extent<_Rank>(_New_size));
1929  }
1930 
1931  template <int _New_rank>
1932  _Array_view_base<_New_rank, _Element_size> _View_as(const Concurrency::extent<_New_rank>& _View_extent) const __GPU
1933  {
1934  static_assert(_Rank==1, "view_as is only permissible on array views of rank 1");
1935  return _Array_view_base<_New_rank, _Element_size>(this->_M_buffer_descriptor,
1936  this->_M_total_linear_offset,
1937  _View_extent,
1938  index<_New_rank>(),
1939  _View_extent);
1940  }
1941 
1942  _Ret_ _View_shape* _Create_buffer_view_shape() const __CPU_ONLY
1943  {
1944  unsigned int bufElemSize = static_cast<unsigned int>(_M_buffer_descriptor._Get_buffer_ptr()->_Get_master_buffer_elem_size());
1945  unsigned int elemSize = _Element_size * sizeof(int);
1946 
1947  size_t linearOffsetInBytes = this->_Base_linear_offset() * sizeof(int);
1948 
1949  size_t baseLSDExtentInBytes = this->_M_array_extent[_Rank - 1];
1950  baseLSDExtentInBytes *= elemSize;
1951 
1952  size_t viewLSDOffsetInBytes = this->_M_view_offset[_Rank - 1];
1953  viewLSDOffsetInBytes *= elemSize;
1954 
1955  size_t viewLSDExtentInBytes = this->_M_view_extent[_Rank - 1];
1956  viewLSDExtentInBytes *= elemSize;
1957 
1958  // The base array extent, view extent, and view offset must be compatible with the underlying
1959  // buffer's element size
1960  if (((linearOffsetInBytes % bufElemSize) != 0) ||
1961  ((baseLSDExtentInBytes % bufElemSize) != 0) ||
1962  ((viewLSDOffsetInBytes % bufElemSize) != 0) ||
1963  ((viewLSDExtentInBytes % bufElemSize) != 0))
1964  {
1965  throw runtime_exception("The array_view base extent, view offset and/or view extent is incompatible with the underlying buffer", E_FAIL);
1966  }
1967 
1968  // The shape to be passed to the underlying buffer for registration must be in terms of
1969  // the element size of the buffer
1970  _ASSERTE((linearOffsetInBytes / bufElemSize) <= UINT_MAX);
1971  unsigned int linearOffset = static_cast<unsigned int>(linearOffsetInBytes / bufElemSize);
1972 
1973  unsigned int baseExtent[_Rank];
1974  unsigned int viewOffset[_Rank];
1975  unsigned int viewExtent[_Rank];
1976 #pragma warning( push )
1977 #pragma warning( disable : 6294 )
1978 #pragma warning( disable : 6201 ) // Index '-1' is out of valid index range '0' to '0' for possibly stack allocated buffer 'baseExtent'.
1979  for (int i = 0; i < _Rank - 1; ++i) {
1980  baseExtent[i] = this->_M_array_extent[i];
1981  viewOffset[i] = this->_M_view_offset[i];
1982  viewExtent[i] = this->_M_view_extent[i];
1983  }
1984 #pragma warning( pop )
1985 
1986  // The extent in the least significant dimension needs to be adjusted for
1987  // difference in element size between the buffer and ourselves
1988  _ASSERTE((baseLSDExtentInBytes / bufElemSize) <= UINT_MAX);
1989  baseExtent[_Rank - 1] = static_cast<unsigned int>(baseLSDExtentInBytes / bufElemSize);
1990 
1991  _ASSERTE((viewLSDOffsetInBytes / bufElemSize) <= UINT_MAX);
1992  viewOffset[_Rank - 1] = static_cast<unsigned int>(viewLSDOffsetInBytes / bufElemSize);
1993 
1994  _ASSERTE((viewLSDExtentInBytes / bufElemSize) <= UINT_MAX);
1995  viewExtent[_Rank - 1] = static_cast<unsigned int>(viewLSDExtentInBytes / bufElemSize);
1996 
1997  return _View_shape::_Create_view_shape(_Rank, linearOffset, baseExtent, viewOffset, viewExtent);
1998  }
1999 
2000 protected:
2001 
2002  // Underlying storage
2003  _Buffer_descriptor _M_buffer_descriptor;
2004 
2005 private:
2006 
2007  void _Register(_In_opt_ const _View_key _Source_view_key = nullptr) __CPU_ONLY
2008  {
2009  _M_buffer_descriptor._Get_buffer_ptr()->_Register_view(_M_buffer_descriptor._Get_view_key(),
2011  _Create_buffer_view_shape(),
2012  _Source_view_key);
2013 
2014  if (_M_buffer_descriptor._M_curr_cpu_access_mode != _No_access)
2015  {
2016  _Buffer_ptr _PBuf;
2017  _Get_access_async(_M_buffer_descriptor._Get_view_key(),
2019  _M_buffer_descriptor._M_curr_cpu_access_mode,
2020  _PBuf)._Get();
2021 
2022  _M_buffer_descriptor._M_data_ptr = _PBuf->_Get_host_ptr();
2023  }
2024  }
2025 
2027  {
2028  _M_buffer_descriptor._Get_buffer_ptr()->_Register_view_copy(_M_buffer_descriptor._Get_view_key(), _Other._M_buffer_descriptor._Get_view_key());
2029  }
2030 
2031  void _Register(_In_ void* _Shape) __CPU_ONLY
2032  {
2033  if (_Shape == NULL) {
2034  return;
2035  }
2036 
2037  // Unregister and register with the right shape
2038  _Unregister();
2039 
2040  _M_buffer_descriptor._Get_buffer_ptr()->_Register_view(_M_buffer_descriptor._Get_view_key(),
2042  reinterpret_cast<_View_shape*>(_Shape));
2043 
2044  if (_M_buffer_descriptor._M_curr_cpu_access_mode != _No_access)
2045  {
2046  _Buffer_ptr _PBuf;
2047  _Get_access_async(_M_buffer_descriptor._Get_view_key(),
2049  _M_buffer_descriptor._M_curr_cpu_access_mode,
2050  _PBuf)._Get();
2051 
2052  _M_buffer_descriptor._M_data_ptr = _PBuf->_Get_host_ptr();
2053  }
2054  }
2055 
2056  void _Unregister(bool _Throw_exception = true) __CPU_ONLY
2057  {
2058  if (!_Throw_exception && (std::current_exception() == nullptr)) {
2059  _Throw_exception = true;
2060  }
2061 
2062  try
2063  {
2064  _M_buffer_descriptor._Get_buffer_ptr()->_Unregister_view(_M_buffer_descriptor._Get_view_key());
2065  }
2066  catch(...)
2067  {
2068  if (_Throw_exception) {
2069  throw;
2070  }
2071  }
2072  }
2073 
2074  static _Ret_ void* _Create_projection_buffer_shape(const _Buffer_descriptor& _Descriptor, unsigned int _Dim, int _Dim_offset) __CPU_ONLY
2075  {
2076  _View_shape* _Base_shape = _Get_buffer_view_shape(_Descriptor);
2077 
2078  std::vector<unsigned int> _New_view_extent(_Base_shape->_Get_rank());
2079  std::vector<unsigned int> _New_view_offset(_Base_shape->_Get_rank());
2080  bool *_New_projection_info = new bool[_Base_shape->_Get_rank()];
2081  for (unsigned int _I = 0; _I < _Base_shape->_Get_rank(); ++_I)
2082  {
2083  _New_view_extent[_I] = _Base_shape->_Get_view_extent()[_I];
2084  _New_view_offset[_I] = _Base_shape->_Get_view_offset()[_I];
2085  _New_projection_info[_I] = _Base_shape->_Get_projection_info()[_I];
2086  }
2087 
2088  // The _Dim'th non-projected dimension needs to be found
2089  unsigned int _UnProjectedDimCount = 0;
2090  for (unsigned int _I = 0; _I < _Base_shape->_Get_rank(); ++_I)
2091  {
2092  if (_Base_shape->_Get_projection_info()[_I]) {
2093  continue;
2094  }
2095 
2096  if (_UnProjectedDimCount == _Dim) {
2097  _New_view_extent[_I] = 1;
2098  _New_view_offset[_I] += _Dim_offset;
2099  _New_projection_info[_I] = true;
2100  break;
2101  }
2102  else {
2103  _UnProjectedDimCount++;
2104  }
2105  }
2106 
2107  auto _PView_shape = _View_shape::_Create_view_shape(_Base_shape->_Get_rank(),
2108  _Base_shape->_Get_linear_offset(),
2109  _Base_shape->_Get_base_extent(),
2110  _New_view_offset.data(),
2111  _New_view_extent.data(),
2112  _New_projection_info);
2113 
2114  delete [] _New_projection_info;
2115 
2116  return _PView_shape;
2117  }
2118 
2119  static _Ret_ void* _Create_section_buffer_shape(const _Buffer_descriptor& _Descriptor,
2120  const Concurrency::index<_Rank>& _Section_origin, const Concurrency::extent<_Rank>& _Section_extent) __CPU_ONLY
2121  {
2122  _View_shape* _Base_shape = _Get_buffer_view_shape(_Descriptor);
2123  if (_Base_shape->_Get_rank() == _Rank) {
2124  return NULL;
2125  }
2126 
2127  std::vector<unsigned int> _New_view_extent(_Base_shape->_Get_rank());
2128  std::vector<unsigned int> _New_view_offset(_Base_shape->_Get_rank());
2129  unsigned int _I = 0, _J = 0;
2130  while (_I < _Base_shape->_Get_rank())
2131  {
2132  if (_Base_shape->_Get_projection_info()[_I])
2133  {
2134  _New_view_extent[_I] = _Base_shape->_Get_view_extent()[_I];
2135  _New_view_offset[_I] = _Base_shape->_Get_view_offset()[_I];
2136  }
2137  else
2138  {
2139  // If _J is the least significant dimension, then we need to adjust the
2140  // offset and extent for the underlying buffer's element size
2141  if (_J == (_Rank - 1))
2142  {
2143  unsigned int bufElemSize = static_cast<unsigned int>(_Descriptor._Get_buffer_ptr()->_Get_master_buffer_elem_size());
2144  unsigned int elemSize = _Element_size * sizeof(int);
2145 
2146  size_t sectionLSDOriginInBytes = _Section_origin[_J];
2147  sectionLSDOriginInBytes *= elemSize;
2148 
2149  size_t sectionLSDExtentInBytes = _Section_extent[_J];
2150  sectionLSDExtentInBytes *= elemSize;
2151 
2152  // The section offset and extent must be compatible with the underlying
2153  // buffer's element size
2154  if (((sectionLSDOriginInBytes % bufElemSize) != 0) ||
2155  ((sectionLSDExtentInBytes % bufElemSize) != 0))
2156  {
2157  throw runtime_exception("The array_view section origin and/or extent is incompatible with the underlying buffer", E_FAIL);
2158  }
2159 
2160  // The extent in the least significant dimension needs to be adjusted for
2161  // difference in element size between the buffer and ourselves
2162  _ASSERTE((sectionLSDOriginInBytes / bufElemSize) <= UINT_MAX);
2163  _New_view_offset[_I] = _Base_shape->_Get_view_offset()[_I] + static_cast<unsigned int>(sectionLSDOriginInBytes / bufElemSize);
2164 
2165  _ASSERTE((sectionLSDExtentInBytes / bufElemSize) <= UINT_MAX);
2166  _New_view_extent[_I] = static_cast<unsigned int>(sectionLSDExtentInBytes / bufElemSize);
2167  }
2168  else
2169  {
2170  _New_view_extent[_I] = _Section_extent[_J];
2171  _New_view_offset[_I] = _Base_shape->_Get_view_offset()[_I] + _Section_origin[_J];
2172  }
2173 
2174  _J++;
2175  }
2176 
2177  _I++;
2178  }
2179 
2180  _ASSERTE(_J == _Rank);
2181 
2182  return _View_shape::_Create_view_shape(_Base_shape->_Get_rank(),
2183  _Base_shape->_Get_linear_offset(),
2184  _Base_shape->_Get_base_extent(),
2185  _New_view_offset.data(),
2186  _New_view_extent.data(),
2187  _Base_shape->_Get_projection_info());
2188  }
2189 
2190  void _Register() __GPU_ONLY {}
2191 
2192  void _Register_copy(const _Array_view_base &/*_Other*/) __GPU_ONLY
2193  {
2194  }
2195 
2196  void _Register(_In_ void* /*_Shape*/) __GPU_ONLY
2197  {
2198  }
2199 
2200  void _Unregister(bool /*_Throw_exception*/ = true) __GPU_ONLY
2201  {
2202  }
2203 
2204  static _Ret_ void* _Create_projection_buffer_shape(const _Buffer_descriptor& /*_Descriptor*/, int /*_Dim*/, int /*_I*/) __GPU_ONLY
2205  {
2206  return NULL;
2207  }
2208 
2209  static _Ret_ void* _Create_section_buffer_shape(const _Buffer_descriptor& /*_Descriptor*/, const Concurrency::index<_Rank>& /*_Section_origin*/, const Concurrency::extent<_Rank>& /*_Section_extent*/) __GPU_ONLY
2210  {
2211  return NULL;
2212  }
2213 };
2214 
2215 template<typename _Container>
2216 struct _Is_container
2217 {
2218  template<class _Uty> static auto _Fn(_Uty _Val, decltype(_Val.size(), _Val.data(), 0)) -> std::true_type;
2219  template<class _Uty> static auto _Fn(_Uty _Val, ...) -> std::false_type;
2220  typedef decltype(_Fn(std::declval<_Container>(),0)) type;
2221 };
2222 
2223 } // namespace details
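_Is_container is a classic expression-SFINAE detector: the first _Fn overload participates in overload resolution only when _Val.size() and _Val.data() are both well-formed, otherwise the variadic overload is chosen and type is std::false_type. A sketch of how it behaves (illustrative only; the trait is an internal detail):

    #include <vector>

    static_assert(Concurrency::details::_Is_container<std::vector<int>>::type::value,
                  "std::vector has data() and size()");
    static_assert(!Concurrency::details::_Is_container<int>::type::value,
                  "int has neither");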
2224 
2225 
2236 template <typename _Value_type, int _Rank = 1> class array_view : public _Array_view_base<_Rank, sizeof(_Value_type)/sizeof(int)>
2237 {
2238  typedef _Array_view_base<_Rank, sizeof(_Value_type)/sizeof(int)> _Base;
2239 
2241  static_assert(0 == (sizeof(_Value_type) % sizeof(int)), "only value types whose size is a multiple of the size of an integer are allowed in array views");
2242 
2243  friend class details::_Array_view_projection_helper<_Value_type,_Rank>;
2244  friend class details::_Array_view_projection_helper<_Value_type,_Rank+1>;
2245 
2246  friend class array_view<_Value_type, _Rank>;
2247  friend class array_view<const _Value_type, _Rank>;
2248 
2249  friend class array_view<_Value_type, _Rank+1>;
2250  friend class array_view<const _Value_type, _Rank+1>;
2251 
2252  template <typename _T, int _R>
2253  friend class array;
2254 
2255  friend const _Buffer_descriptor& details::_Get_buffer_descriptor<array_view<_Value_type, _Rank>>(const array_view<_Value_type, _Rank>& _Array) __GPU;
2256 
2257 public:
2258  static const int rank = _Rank;
2259  typedef _Value_type value_type;
2260 
2261 
2265  ~array_view() __GPU {}
2266 
2274  array_view(array<_Value_type, _Rank>& _Src) __GPU
2275  : _Base(_Get_buffer_descriptor(_Src), _Src.extent)
2276  {
2277  _Initialize();
2278  }
2279 
2283  array_view(const array_view& _Other) __GPU
2284  : _Base(_Other)
2285  {
2286  _Initialize();
2287  }
2288 
2295  explicit array_view(const Concurrency::extent<_Rank>& _Extent) __CPU_ONLY
2296  :_Base(_Extent)
2297  {
2298  _Initialize(_Extent.size(), true);
2299  }
2300 
2310  template <typename _Container> array_view(const Concurrency::extent<_Rank>& _Extent, _Container& _Src) __CPU_ONLY
2311  :_Base(_Src.data(),_Extent)
2312  {
2313  static_assert( std::is_same<decltype(_Src.data()), _Value_type*>::value, "container element type and array view element type must match");
2314  _Initialize(_Src.size());
2315  }
2316 
2327  array_view(const Concurrency::extent<_Rank>& _Extent, _Value_type * _Src) __GPU
2328  :_Base(_Src,_Extent)
2329  {
2330  _Initialize();
2331  }
2332 
2339  explicit array_view(int _E0) __CPU_ONLY
2340  :_Base(Concurrency::extent<1>(_E0))
2341  {
2342  static_assert(_Rank == 1, "rank must be 1");
2343  _Initialize(this->get_extent().size(), true);
2344  }
2345 
2353  template <typename _Container> explicit array_view(_Container& _Src, typename std::enable_if<details::_Is_container<_Container>::type::value,void **>::type = 0) __CPU_ONLY
2354  :_Base(_Src.data(), Concurrency::extent<1>(static_cast<int>(_Src.size())))
2355  {
2356  if (_Src.size() > INT_MAX) {
2357  throw runtime_exception("Invalid _Src container argument - _Src size is greater than INT_MAX", E_INVALIDARG);
2358  }
2359  static_assert( std::is_same<decltype(_Src.data()), _Value_type*>::value, "container element type and array view element type must match");
2360  static_assert(_Rank == 1, "rank must be 1");
2361  _Initialize(_Src.size());
2362  }
2363 
2373  template <typename _Container> explicit array_view(int _E0, _Container& _Src) __CPU_ONLY
2374  :_Base(_Src.data(), Concurrency::extent<1>(_E0))
2375  {
2376  static_assert( std::is_same<decltype(_Src.data()), _Value_type*>::value, "container element type and array view element type must match");
2377  static_assert(_Rank == 1, "rank must be 1");
2378  _Initialize(_Src.size());
2379  }
2380 
2390  explicit array_view(int _E0, int _E1) __CPU_ONLY
2391  :_Base(Concurrency::extent<2>(_E0,_E1))
2392  {
2393  static_assert(_Rank == 2, "rank must be 2");
2394  _Initialize(this->get_extent().size(), true);
2395  }
2396 
2409  template <typename _Container> explicit array_view(int _E0, int _E1, _Container& _Src) __CPU_ONLY
2410  :_Base(_Src.data(), Concurrency::extent<2>(_E0,_E1))
2411  {
2412  static_assert( std::is_same<decltype(_Src.data()), _Value_type*>::value, "container element type and array view element type must match");
2413  static_assert(_Rank == 2, "rank must be 2");
2414  _Initialize(_Src.size());
2415  }
2416 
2429  explicit array_view(int _E0, int _E1, int _E2) __CPU_ONLY
2430  :_Base(Concurrency::extent<3>(_E0,_E1,_E2))
2431  {
2432  static_assert(_Rank == 3, "rank must be 3");
2433  _Initialize(this->get_extent().size(), true);
2434  }
2435 
2451  template <typename _Container> explicit array_view(int _E0, int _E1, int _E2, _Container& _Src) __CPU_ONLY
2452  :_Base(_Src.data(), Concurrency::extent<3>(_E0,_E1,_E2))
2453  {
2454  static_assert( std::is_same<decltype(_Src.data()), _Value_type*>::value, "container element type and array view element type must match");
2455  static_assert(_Rank == 3, "rank must be 3");
2456  _Initialize(_Src.size());
2457  }
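Typical host-side construction (illustrative, not part of amp.h): wrap existing container storage in an array_view, compute on the accelerator, then synchronize back. No copy is made at construction; data moves on demand.

    #include <amp.h>
    #include <vector>
    using namespace concurrency;

    int main() {
        std::vector<int> data(12 * 10, 0);
        array_view<int, 2> av(12, 10, data);   // 12 rows, 10 columns over 'data'
        parallel_for_each(av.extent, [=](index<2> idx) restrict(amp) {
            av[idx] = idx[0] * 10 + idx[1];
        });
        av.synchronize();                      // results visible in 'data' again
    }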
2458 
2469  explicit array_view(int _E0, _In_ _Value_type * _Src) __GPU
2470  :_Base(_Src, Concurrency::extent<1>(_E0))
2471  {
2472  static_assert(_Rank == 1, "rank must be 1");
2473  _Initialize();
2474  }
2475 
2482  template <int _Size> explicit array_view(_In_ _Value_type (&_Src) [_Size]) __GPU
2483  :_Base(_Src, Concurrency::extent<1>(_Size))
2484  {
2485  static_assert(_Rank == 1, "rank must be 1");
2486  _Initialize();
2487  }
2488 
2502  explicit array_view(int _E0, int _E1, _In_ _Value_type * _Src) __GPU
2503  :_Base(_Src, Concurrency::extent<2>(_E0,_E1))
2504  {
2505  static_assert(_Rank == 2, "rank must be 2");
2506  _Initialize();
2507  }
2508 
2525  explicit array_view(int _E0, int _E1, int _E2, _In_ _Value_type * _Src) __GPU
2526  :_Base(_Src, Concurrency::extent<3>(_E0,_E1,_E2))
2527  {
2528  static_assert(_Rank == 3, "rank must be 3");
2529  _Initialize();
2530  }
2531 
2535  array_view& operator=(const array_view& _Other) __GPU
2536  {
2537  _Base::operator=(_Other);
2538  return *this;
2539  }
2540 
2544  void copy_to(array<_Value_type,_Rank>& _Dest) const __CPU_ONLY
2545  {
2546  copy(*this,_Dest);
2547  }
2548 
2552  void copy_to(const array_view& _Dest) const __CPU_ONLY
2553  {
2554  copy(*this,_Dest);
2555  }
2556 
2568  {
2570  }
2571 
2585  _Value_type& get_ref(const index<_Rank>& _Index) const __GPU
2586  {
2587  void *_Ptr = _Access(_Index);
2588  return *reinterpret_cast<value_type*>(_Ptr);
2589  }
2590 
2600  _Value_type& operator[] (const index<_Rank>& _Index) const __GPU
2601  {
2602  return this->operator()(_Index);
2603  }
2604 
2614  _Value_type& operator() (const index<_Rank>& _Index) const __GPU
2615  {
2616  void * _Ptr = _Access(_Read_write_access, _Index);
2617  return *reinterpret_cast<_Value_type*>(_Ptr);
2618  }
2619 
2631  {
2633  }
2634 
2647  _Value_type& operator() (int _I0, int _I1) const __GPU
2648  {
2649  static_assert(_Rank == 2, "value_type& array_view::operator()(int,int) is only permissible on array_view<T, 2>");
2650  return this->operator()(index<2>(_I0,_I1));
2651  }
2652 
2668  _Value_type& operator() (int _I0, int _I1, int _I2) const __GPU
2669  {
2670  static_assert(_Rank == 3, "value_type& array_view::operator()(int,int,int) is only permissible on array_view<T, 3>");
2671  return this->operator()(index<3>(_I0,_I1,_I2));
2672  }
2673 
2686  array_view section(const Concurrency::index<_Rank>& _Section_origin, const Concurrency::extent<_Rank>& _Section_extent) const __GPU
2687  {
2688  return _Convert<_Value_type>(_Section(_Section_origin, _Section_extent));
2689  }
2690 
2701  array_view section(const Concurrency::index<_Rank>& _Idx) const __GPU
2702  {
2703  return section(_Idx, this->extent - _Idx);
2704  }
2705 
2716  array_view section(const Concurrency::extent<_Rank>& _Ext) const __GPU
2717  {
2718  return section(Concurrency::index<_Rank>(), _Ext);
2719  }
2720 
2734  array_view section(int _I0, int _E0) const __GPU
2735  {
2736  static_assert(_Rank == 1, "rank must be 1");
2737  return section(Concurrency::index<1>(_I0), Concurrency::extent<1>(_E0));
2738  }
2739 
2759  array_view section(int _I0, int _I1, int _E0, int _E1) const __GPU
2760  {
2761  static_assert(_Rank == 2, "rank must be 2");
2762  return section(Concurrency::index<2>(_I0,_I1), Concurrency::extent<2>(_E0,_E1));
2763  }
2764 
2790  array_view section(int _I0, int _I1, int _I2, int _E0, int _E1, int _E2) const __GPU
2791  {
2792  static_assert(_Rank == 3, "rank must be 3");
2793  return section(Concurrency::index<3>(_I0,_I1,_I2), Concurrency::extent<3>(_E0,_E1,_E2));
2794  }
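A section is a window into the same storage, not a copy; writes through the section are visible through the original view. Sketch (illustrative, not part of amp.h):

    #include <amp.h>
    using namespace concurrency;

    void windows(const array_view<float, 2>& av) {   // assume av is at least 6x7
        array_view<float, 2> inner = av.section(2, 3, 4, 4);   // origin (2,3), extent 4x4
        // the same section spelled with index/extent objects:
        array_view<float, 2> same = av.section(index<2>(2, 3), extent<2>(4, 4));
        (void)inner; (void)same;
    }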
2795 
2804  template <typename _Value_type2> array_view<_Value_type2, _Rank> reinterpret_as() const __GPU
2805  {
2806  return _Convert<_Value_type2>(this->template _Reinterpret_as<sizeof(_Value_type2)/sizeof(int)>());
2807  }
2808 
2818  template <int _New_rank> array_view<_Value_type,_New_rank> view_as(const Concurrency::extent<_New_rank>& _View_extent) const __GPU
2819  {
2820  return _Convert<_Value_type>(_View_as(_View_extent));
2821  }
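reinterpret_as retypes the underlying storage of a rank-1 view (element sizes must stay multiples of sizeof(int)), while view_as re-shapes a rank-1 view to a higher rank. Sketch (illustrative, not part of amp.h; float2 is a hypothetical 8-byte POD):

    #include <amp.h>
    using namespace concurrency;

    struct float2 { float x, y; };   // 8 bytes = 2 ints

    void reshape(const array_view<float2, 1>& av) {   // assume 16 elements
        array_view<float, 1> flat = av.reinterpret_as<float>();    // 32 floats
        array_view<float, 2> grid = flat.view_as(extent<2>(4, 8)); // 4x8 window
        (void)grid;
    }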
2822 
2826  _Ret_ _Value_type* data() const __GPU
2827  {
2828  static_assert(_Rank == 1, "array_view::data() is only permissible on array_view<T, 1>");
2829  return &this->operator[](index<_Rank>());
2830  }
2831 
2836  void refresh() const __CPU_ONLY
2837  {
2838  // If the array_view corresponds to a ubiquitous buffer with no data source,
2839  // then refresh is a no-op
2840  if (!this->_M_buffer_descriptor._Get_buffer_ptr()->_Has_data_source()) {
2841  return;
2842  }
2843 
2844  _Buffer_ptr _PBuf;
2845  _Get_access_async(this->_M_buffer_descriptor._Get_view_key(), this->_M_buffer_descriptor._Get_buffer_ptr()->_Get_master_accelerator_view(), _Write_access, _PBuf)._Get();
2846  }
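
refresh covers the case where the host memory underlying the view is modified directly, bypassing the array_view; it tells the runtime to treat its cached copies as stale. A sketch:

    std::vector<int> v(100, 0);
    array_view<int, 1> av(100, v);
    v[0] = 7;          // write to the container, not through av
    av.refresh();      // invalidate cached copies so av observes the new value
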
2847 
2861  concurrency::completion_future synchronize_to_async(const accelerator_view& _Accl_view, access_type _Access_type = access_type_read) const __CPU_ONLY
2862  {
2863  auto _Async_op_id = details::_Get_amp_trace()->_Launch_array_view_synchronize_event_helper(this->_M_buffer_descriptor);
2864 
2865  _Buffer_ptr _PBuf;
2866  _Event _Ev;
2867 
2868  if (_Access_type != access_type_none) {
2869  _Ev = _Get_access_async(this->_M_buffer_descriptor._Get_view_key(), _Accl_view, _Get_synchronize_access_mode(_Access_type), _PBuf);
2870  }
2871 
2872  return details::_Get_amp_trace()->_Start_async_op_wait_event_helper(_Async_op_id, _Ev);
2873  }
2874 
2885  concurrency::completion_future synchronize_async(access_type _Access_type = access_type_read) const __CPU_ONLY
2886  {
2887  auto _Async_op_id = details::_Get_amp_trace()->_Launch_array_view_synchronize_event_helper(this->_M_buffer_descriptor);
2888 
2889  _Buffer_ptr _PBuf;
2890  _Event _Ev;
2891 
2892  // If the array_view corresponds to a ubiquitous buffer with no data source, then synchronize is a no-op
2893  if ((_Access_type != access_type_none) && this->_M_buffer_descriptor._Get_buffer_ptr()->_Has_data_source())
2894  {
2895  _Ev = _Get_access_async(this->_M_buffer_descriptor._Get_view_key(),
2896  this->_M_buffer_descriptor._Get_buffer_ptr()->_Get_master_accelerator_view(),
2897  _Get_synchronize_access_mode(_Access_type),
2898  _PBuf);
2899  }
2900 
2901  return details::_Get_amp_trace()->_Start_async_op_wait_event_helper(_Async_op_id, _Ev);
2902  }
2903 
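
synchronize_async returns a concurrency::completion_future so the copy back to the data source can overlap other host work (the synchronize overloads below are the blocking equivalents). A sketch:

    std::vector<int> v(64);
    array_view<int, 1> av(64, v);
    parallel_for_each(av.extent, [=](index<1> i) restrict(amp) { av[i] = i[0]; });
    completion_future f = av.synchronize_async();   // begin copying results back to v
    // ... unrelated host work ...
    f.get();                                        // v now holds the results
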
2914  void synchronize_to(const accelerator_view& _Accl_view, access_type _Access_type = access_type_read) const __CPU_ONLY
2915  {
2916  auto _Span_id = details::_Get_amp_trace()->_Start_array_view_synchronize_event_helper(this->_M_buffer_descriptor);
2917 
2918  _Buffer_ptr _PBuf;
2919 
2920  if (_Access_type != access_type_none) {
2921  _Get_access_async(this->_M_buffer_descriptor._Get_view_key(), _Accl_view, _Get_synchronize_access_mode(_Access_type), _PBuf)._Get();
2922  }
2923 
2925  }
2926 
2934  void synchronize(access_type _Access_type = access_type_read) const __CPU_ONLY
2935  {
2936  auto _Span_id = details::_Get_amp_trace()->_Start_array_view_synchronize_event_helper(this->_M_buffer_descriptor);
2937 
2938  _Buffer_ptr _PBuf;
2939 
2940  // If the array_view corresponds to a ubiquitous buffer with no data source, then synchronize is a no-op
2941  if ((_Access_type != access_type_none) && this->_M_buffer_descriptor._Get_buffer_ptr()->_Has_data_source())
2942  {
2943  _Get_access_async(this->_M_buffer_descriptor._Get_view_key(),
2944  this->_M_buffer_descriptor._Get_buffer_ptr()->_Get_master_accelerator_view(),
2945  _Get_synchronize_access_mode(_Access_type),
2946  _PBuf)._Get();
2947  }
2948 
2949  details::_Get_amp_trace()->_Write_end_event(_Span_id);
2950  }
2951 
2959  void discard_data() const __CPU_ONLY
2960  {
2961  this->_M_buffer_descriptor._Get_buffer_ptr()->_Discard(this->_M_buffer_descriptor._Get_view_key());
2962  }
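
discard_data is an optimization hint for write-only uses: the view's current contents need not be transferred to the accelerator before a kernel overwrites them. A sketch:

    std::vector<float> v(256);
    array_view<float, 1> av(256, v);
    av.discard_data();                               // contents are about to be overwritten
    parallel_for_each(av.extent, [=](index<1> i) restrict(amp) { av[i] = 0.0f; });
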
2963 
2968  accelerator_view get_source_accelerator_view() const __CPU_ONLY
2969  {
2970  if (this->_M_buffer_descriptor._Get_buffer_ptr()->_Has_data_source()) {
2971  return this->_M_buffer_descriptor._Get_buffer_ptr()->_Get_master_accelerator_view();
2972  }
2973  else {
2974  throw runtime_exception("Cannot query source accelerator_view for an array_view without a data source.", E_INVALIDARG);
2975  }
2976  }
2977 
2978  __declspec(property(get=get_source_accelerator_view)) accelerator_view source_accelerator_view;
2979 
2980 private:
2981  template <typename _T, int _R>
2982  static array_view<_T,_R> _Convert(const _Array_view_base<_R,sizeof(_T)/sizeof(int)>& _Other) __GPU
2983  {
2984  static_assert(sizeof(array_view<_T,_R>) == sizeof(_Array_view_base<_R,sizeof(_T)/sizeof(int)>), "ASSERT FAILURE: implementation relies on binary conversion between the two");
2985  return (*reinterpret_cast<const array_view<_T,_R>*>(&_Other));
2986  }
2987 
2988  void _Project0(int _I, array_view<_Value_type, _Rank-1> &_Projected_view) const __GPU
2989  {
2990  _Base::_Project0(_I, _Projected_view);
2991  _Projected_view._Initialize();
2992  }
2993 
2994  array_view() __GPU {}
2995 
2996  array_view(const array_view& _Other, const Concurrency::index<_Rank>& _Section_origin, const Concurrency::extent<_Rank>& _Section_extent) __GPU
2997  :_Base(_Other, _Section_origin, _Section_extent)
2998  {
2999  _Initialize();
3000  }
3001 
3002  array_view(_Buffer_descriptor& _Src_buffer, const Concurrency::extent<_Rank>& _Extent) __GPU
3003  :_Base(_Src_buffer,_Extent)
3004  {
3005  _Initialize();
3006  }
3007 
3008  void _Initialize() __GPU
3009  {
3010  // Set the type access mode
3011  this->_M_buffer_descriptor._M_type_access_mode = _Read_write_access;
3012  }
3013 
3014  void _Initialize(size_t _Src_data_size, bool _Discard_data = false) __CPU_ONLY
3015  {
3016  // Ensure that the _Src_data_size is at least as big as the size
3017  // of the array_view
3018  if (_Src_data_size < this->extent.size()) {
3019  throw runtime_exception("Invalid _Src container argument - _Src size is less than the size of the array_view.", E_INVALIDARG);
3020  }
3021 
3022  _Initialize();
3023 
3024  if (_Discard_data) {
3025  discard_data();
3026  }
3027  }
3028 
3029 }; // class array_view<T,R>
3030 
3031 // array_view<const T,R>
3032 template <typename _Value_type, int _Rank>
3033 class array_view<const _Value_type, _Rank> : public _Array_view_base<_Rank, sizeof(_Value_type)/sizeof(int)>
3034 {
3035  _CPP_AMP_VERIFY_RANK(_Rank, array_view);
3036  static_assert(0 == (sizeof(_Value_type) % sizeof(int)), "only value types whose size is a multiple of the size of an integer are allowed in array views");
3037 
3038  typedef _Array_view_base<_Rank, sizeof(_Value_type)/sizeof(int)> _Base;
3039 
3040  friend class details::_Const_array_view_projection_helper<_Value_type,_Rank>;
3041  friend class details::_Const_array_view_projection_helper<_Value_type,_Rank+1>;
3042 
3043  friend class array_view<_Value_type, _Rank>;
3044  friend class array_view<const _Value_type, _Rank>;
3045 
3046  friend class array_view<_Value_type, _Rank+1>;
3047  friend class array_view<const _Value_type, _Rank+1>;
3048 
3049  friend const _Buffer_descriptor& details::_Get_buffer_descriptor<array_view<const _Value_type, _Rank>>(const array_view<const _Value_type, _Rank>& _Array) __GPU;
3050 
3051 public:
3052  static const int rank = _Rank;
3053  typedef const _Value_type value_type;
3054 
3058  ~array_view() __GPU {}
3059 
3067  array_view(const array<_Value_type,_Rank>& _Src) __GPU
3068  :_Base(_Get_buffer_descriptor(_Src), _Src.extent)
3069  {
3070  _Initialize();
3071  }
3072 
3076  array_view(const array_view<_Value_type,_Rank>& _Src) __GPU
3077  :_Base(_Src)
3078  {
3079  _Initialize();
3080  }
3081 
3085  array_view(const array_view& _Src) __GPU
3086  :_Base(_Src)
3087  {
3088  }
3089 
3099  template <typename _Container> array_view(const Concurrency::extent<_Rank>& _Extent, const _Container& _Src) __CPU_ONLY
3100  :_Base(_Src.data(),_Extent)
3101  {
3102  static_assert( std::is_same<typename std::remove_const<typename std::remove_reference<decltype(*_Src.data())>::type>::type, _Value_type>::value, "container element type and array view element type must match");
3103  _Initialize(_Src.size());
3104  }
3105 
3116  template <typename _Container> explicit array_view(const _Container& _Src, typename std::enable_if<details::_Is_container<_Container>::type::value,void **>::type = 0) __CPU_ONLY
3117  :_Base(_Src.data(), Concurrency::extent<1>(static_cast<int>(_Src.size())))
3118  {
3119  if (_Src.size() > INT_MAX) {
3120  throw runtime_exception("Invalid _Src container argument - _Src size is greater than INT_MAX", E_INVALIDARG);
3121  }
3122  static_assert( std::is_same<decltype(_Src.data()), const _Value_type*>::value, "container element type and array view element type must match");
3123  static_assert(_Rank == 1, "rank must be 1");
3124  _Initialize(_Src.size());
3125  }
3126 
3136  template <typename _Container> array_view(const Concurrency::extent<_Rank>& _Extent, _Container& _Src) __CPU_ONLY
3137  :_Base(_Src.data(),_Extent)
3138  {
3139  static_assert( std::is_same<typename std::remove_const<typename std::remove_reference<decltype(*_Src.data())>::type>::type, _Value_type>::value, "container element type and array view element type must match");
3140  _Initialize(_Src.size());
3141  }
3142 
3153  array_view(const Concurrency::extent<_Rank>& _Extent, const _Value_type * _Src) __GPU
3154  :_Base(_Src,_Extent)
3155  {
3156  _Initialize();
3157  }
3158 
3169  array_view(const Concurrency::extent<_Rank>& _Extent, _In_ _Value_type * _Src) __GPU
3170  :_Base(_Src,_Extent)
3171  {
3172  _Initialize();
3173  }
3174 
3184  template <typename _Container> array_view(int _E0, const _Container& _Src) __CPU_ONLY
3185  :_Base(_Src.data(), Concurrency::extent<1>(_E0))
3186  {
3187  static_assert( std::is_same<typename std::remove_const<typename std::remove_reference<decltype(*_Src.data())>::type>::type, _Value_type>::value, "container element type and array view element type must match");
3188  static_assert(_Rank == 1, "rank must be 1");
3189  _Initialize(_Src.size());
3190  }
3191 
3199  template <int _Size> explicit array_view(const _In_ _Value_type (&_Src) [_Size]) __GPU
3200  :_Base(_Src, Concurrency::extent<1>(_Size))
3201  {
3202  static_assert(_Rank == 1, "rank must be 1");
3203  _Initialize();
3204  }
3205 
3218  template <typename _Container> array_view(int _E0, int _E1, const _Container& _Src) __CPU_ONLY
3219  :_Base(_Src.data(), Concurrency::extent<2>(_E0,_E1))
3220  {
3221  static_assert( std::is_same<typename std::remove_const<typename std::remove_reference<decltype(*_Src.data())>::type>::type, _Value_type>::value, "container element type and array view element type must match");
3222  static_assert(_Rank == 2, "rank must be 2");
3223  _Initialize(_Src.size());
3224  }
3225 
3241  template <typename _Container> array_view(int _E0, int _E1, int _E2, const _Container& _Src) __CPU_ONLY
3242  :_Base(_Src.data(), Concurrency::extent<3>(_E0,_E1,_E2))
3243  {
3244  static_assert( std::is_same<typename std::remove_const<typename std::remove_reference<decltype(*_Src.data())>::type>::type, _Value_type>::value, "container element type and array view element type must match");
3245  static_assert(_Rank == 3, "rank must be 3");
3246  _Initialize(_Src.size());
3247  }
3248 
3259  array_view(int _E0, const _Value_type * _Src) __GPU
3260  :_Base(_Src, Concurrency::extent<1>(_E0))
3261  {
3262  static_assert(_Rank == 1, "rank must be 1");
3263  _Initialize();
3264  }
3265 
3279  array_view(int _E0, int _E1, const _Value_type * _Src) __GPU
3280  :_Base(_Src, Concurrency::extent<2>(_E0,_E1))
3281  {
3282  static_assert(_Rank == 2, "rank must be 2");
3283  _Initialize();
3284  }
3285 
3302  array_view(int _E0, int _E1, int _E2, const _Value_type * _Src) __GPU
3303  :_Base(_Src, Concurrency::extent<3>(_E0,_E1,_E2))
3304  {
3305  static_assert(_Rank == 3, "rank must be 3");
3306  _Initialize();
3307  }
3308 
3319  array_view(int _E0, _In_ _Value_type * _Src) __GPU
3320  :_Base(_Src, Concurrency::extent<1>(_E0))
3321  {
3322  static_assert(_Rank == 1, "rank must be 1");
3323  _Initialize();
3324  }
3325 
3339  array_view(int _E0, int _E1, _In_ _Value_type * _Src) __GPU
3340  :_Base(_Src, Concurrency::extent<2>(_E0,_E1))
3341  {
3342  static_assert(_Rank == 2, "rank must be 2");
3343  _Initialize();
3344  }
3345 
3362  array_view(int _E0, int _E1, int _E2, _In_ _Value_type * _Src) __GPU
3363  :_Base(_Src, Concurrency::extent<3>(_E0,_E1,_E2))
3364  {
3365  static_assert(_Rank == 3, "rank must be 3");
3366  _Initialize();
3367  }
3368 
3372  array_view& operator=(const array_view& _Other) __GPU
3373  {
3374  _Base::operator=(_Other);
3375  return *this;
3376  }
3377 
3381  array_view& operator=(const array_view<_Value_type, _Rank>& _Other) __GPU
3382  {
3383  _Base::operator=(_Other);
3384  return *this;
3385  }
3386 
3390  void copy_to(array<_Value_type,_Rank>& _Dest) const __CPU_ONLY
3391  {
3392  copy(*this,_Dest);
3393  }
3394 
3398  void copy_to(const array_view<_Value_type,_Rank>& _Dest) const __CPU_ONLY
3399  {
3400  copy(*this,_Dest);
3401  }
3402 
3413  typename details::_Projection_result_type<_Value_type,_Rank>::_Const_result_type operator[] (int _I) const __GPU
3414  {
3415  return details::_Const_array_view_projection_helper<_Value_type,_Rank>::_Project0(this, _I);
3416  }
3417 
3431  const _Value_type& get_ref(const index<_Rank>& _Index) const __GPU
3432  {
3433  void *_Ptr = _Access(_Index);
3434  return *reinterpret_cast<value_type*>(_Ptr);
3435  }
3436 
3446  const _Value_type& operator[] (const index<_Rank>& _Index) const __GPU
3447  {
3448  return this->operator()(_Index);
3449  }
3450 
3460  const _Value_type& operator() (const index<_Rank>& _Index) const __GPU
3461  {
3462  void * _Ptr = _Access(_Read_access, _Index);
3463  return *reinterpret_cast<value_type*>(_Ptr);
3464  }
3465 
3476  typename details::_Projection_result_type<_Value_type,_Rank>::_Const_result_type operator() (int _I) const __GPU
3477  {
3478  return this->operator[](_I);
3479  }
3480 
3493  const _Value_type& operator() (int _I0, int _I1) const __GPU
3494  {
3495  static_assert(_Rank == 2, "value_type& array_view::operator()(int,int) is only permissible on array_view<T, 2>");
3496  return this->operator()(index<2>(_I0,_I1));
3497  }
3498 
3514  const _Value_type& operator() (int _I0, int _I1, int _I2) const __GPU
3515  {
3516  static_assert(_Rank == 3, "value_type& array_view::operator()(int,int,int) is only permissible on array_view<T, 3>");
3517  return this->operator()(index<3>(_I0,_I1,_I2));
3518  }
3519 
3532  array_view section(const Concurrency::index<_Rank>& _Section_origin, const Concurrency::extent<_Rank>& _Section_extent) const __GPU
3533  {
3534  return _Convert<_Value_type>(_Section(_Section_origin, _Section_extent));
3535  }
3536 
3547  array_view section(const Concurrency::extent<_Rank>& _Ext) const __GPU
3548  {
3549  return section(Concurrency::index<_Rank>(), _Ext);
3550  }
3551 
3562  array_view section(const Concurrency::index<_Rank>& _Idx) const __GPU
3563  {
3564  return section(_Idx, this->extent - _Idx);
3565  }
3566 
3580  array_view section(int _I0, int _E0) const __GPU
3581  {
3582  static_assert(_Rank == 1, "rank must be 1");
3583  return section(Concurrency::index<1>(_I0), Concurrency::extent<1>(_E0));
3584  }
3585 
3605  array_view section(int _I0, int _I1, int _E0, int _E1) const __GPU
3606  {
3607  static_assert(_Rank == 2, "rank must be 2");
3608  return section(Concurrency::index<2>(_I0,_I1), Concurrency::extent<2>(_E0,_E1));
3609  }
3610 
3636  array_view section(int _I0, int _I1, int _I2, int _E0, int _E1, int _E2) const __GPU
3637  {
3638  static_assert(_Rank == 3, "rank must be 3");
3639  return section(Concurrency::index<3>(_I0,_I1,_I2), Concurrency::extent<3>(_E0,_E1,_E2));
3640  }
3641 
3650  template <typename _Value_type2> array_view<const _Value_type2, _Rank> reinterpret_as() const __GPU
3651  {
3652  return _Convert<_Value_type2>(this->template _Reinterpret_as<sizeof(_Value_type2)/sizeof(int)>());
3653  }
3654 
3664  template <int _New_rank> array_view<const _Value_type,_New_rank> view_as(const Concurrency::extent<_New_rank>& _View_extent) const __GPU
3665  {
3666  return _Convert<_Value_type>(_View_as(_View_extent));
3667  }
3668 
3672  const _Value_type* data() const __GPU
3673  {
3674  static_assert(_Rank == 1, "array_view::data() is only permissible on array_view<T, 1>");
3675  return &this->operator[](index<_Rank>());
3676  }
3677 
3682  void refresh() const __CPU_ONLY
3683  {
3684  _Buffer_ptr _PBuf;
3685  _Get_access_async(this->_M_buffer_descriptor._Get_view_key(), this->_M_buffer_descriptor._Get_buffer_ptr()->_Get_master_accelerator_view(), _Write_access, _PBuf)._Get();
3686  }
3687 
3697  concurrency::completion_future synchronize_to_async(const accelerator_view& _Accl_view) const __CPU_ONLY
3698  {
3699  auto _Async_op_id = details::_Get_amp_trace()->_Launch_array_view_synchronize_event_helper(this->_M_buffer_descriptor);
3700 
3701  _Buffer_ptr _PBuf;
3702  _Event _Ev;
3703 
3704  _Ev = _Get_access_async(this->_M_buffer_descriptor._Get_view_key(), _Accl_view, _Read_access, _PBuf);
3705 
3706  return details::_Get_amp_trace()->_Start_async_op_wait_event_helper(_Async_op_id, _Ev);
3707  }
3708 
3715  concurrency::completion_future synchronize_async() const __CPU_ONLY
3716  {
3717  auto _Async_op_id = details::_Get_amp_trace()->_Launch_array_view_synchronize_event_helper(this->_M_buffer_descriptor);
3718 
3719  _Buffer_ptr _PBuf;
3720  _Event _Ev;
3721 
3722  // If the array_view corresponds to a ubiquitous buffer with no data source,
3723  // then synchronize is a no-op
3724  if (this->_M_buffer_descriptor._Get_buffer_ptr()->_Has_data_source()) {
3725  _Ev = _Get_access_async(this->_M_buffer_descriptor._Get_view_key(), this->_M_buffer_descriptor._Get_buffer_ptr()->_Get_master_accelerator_view(), _Read_access, _PBuf);
3726  }
3727 
3728  return details::_Get_amp_trace()->_Start_async_op_wait_event_helper(_Async_op_id, _Ev);
3729  }
3730 
3737  void synchronize_to(const accelerator_view& _Accl_view) const __CPU_ONLY
3738  {
3739  auto _Span_id = details::_Get_amp_trace()->_Start_array_view_synchronize_event_helper(this->_M_buffer_descriptor);
3740 
3741  _Buffer_ptr _PBuf;
3742 
3743  _Get_access_async(this->_M_buffer_descriptor._Get_view_key(), _Accl_view, _Read_access, _PBuf)._Get();
3744 
3745  details::_Get_amp_trace()->_Write_end_event(_Span_id);
3746  }
3747 
3751  void synchronize() const __CPU_ONLY
3752  {
3753  auto _Span_id = details::_Get_amp_trace()->_Start_array_view_synchronize_event_helper(this->_M_buffer_descriptor);
3754 
3755  _Buffer_ptr _PBuf;
3756 
3757  // If the array_view corresponds to a ubiquitous buffer with no data source,
3758  // then synchronize is a no-op
3759  if (this->_M_buffer_descriptor._Get_buffer_ptr()->_Has_data_source()) {
3760  _Get_access_async(this->_M_buffer_descriptor._Get_view_key(), this->_M_buffer_descriptor._Get_buffer_ptr()->_Get_master_accelerator_view(), _Read_access, _PBuf)._Get();
3761  }
3762 
3763  details::_Get_amp_trace()->_Write_end_event(_Span_id);
3764  }
3765 
3770  accelerator_view get_source_accelerator_view() const __CPU_ONLY
3771  {
3772  if (this->_M_buffer_descriptor._Get_buffer_ptr()->_Has_data_source()) {
3773  return this->_M_buffer_descriptor._Get_buffer_ptr()->_Get_master_accelerator_view();
3774  }
3775  else {
3776  throw runtime_exception("Cannot query source accelerator_view for an array_view without a data source.", E_INVALIDARG);
3777  }
3778  }
3779 
3780  __declspec(property(get=get_source_accelerator_view)) accelerator_view source_accelerator_view;
3781 
3782 private:
3783  template <typename _T, int _R>
3784  static array_view<const _T,_R> _Convert(const _Array_view_base<_R,sizeof(_T)/sizeof(int)>& _Other) __GPU
3785  {
3786  static_assert(sizeof(array_view<const _T,_R>) == sizeof(_Array_view_base<_R,sizeof(_T)/sizeof(int)>), "ASSERT FAILURE: implementation relies on binary conversion between the two");
3787  return (*reinterpret_cast<const array_view<const _T,_R>*>(&_Other));
3788  }
3789 
3790  void _Project0(int _I, array_view<const _Value_type, _Rank-1> &_Projected_view) const __GPU
3791  {
3792  _Base::_Project0(_I, _Projected_view);
3793  _Projected_view._Initialize();
3794  }
3795 
3796  array_view() __GPU {}
3797 
3798  array_view(const array_view& _Other, const Concurrency::index<_Rank>& _Section_origin, const Concurrency::extent<_Rank>& _Section_extent) __GPU
3799  :
3800  _Base(_Other, _Section_origin, _Section_extent)
3801  {
3802  _Initialize();
3803  }
3804 
3805  void _Initialize() __GPU
3806  {
3807  // Set the type access mode
3808  this->_M_buffer_descriptor._M_type_access_mode = _Read_access;
3809  }
3810 
3811  void _Initialize(size_t _Src_data_size) __CPU_ONLY
3812  {
3813  // Ensure that the _Src_data_size is at least as big as the size
3814  // of the array_view
3815  if (_Src_data_size < this->extent.size()) {
3816  throw runtime_exception("Invalid _Src container argument - _Src size is less than the size of the array_view.", E_INVALIDARG);
3817  }
3818 
3819  _Initialize();
3820  }
3821 
3822 }; // class array_view<const T,R>
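
An array_view<const T, N> is the idiomatic way to mark a kernel input as read-only, which lets the runtime skip copying results back to the source. A sketch:

    std::vector<float> in(128, 1.0f), out(128);
    array_view<const float, 1> src(128, in);         // read-only input
    array_view<float, 1> dst(128, out);
    dst.discard_data();
    parallel_for_each(dst.extent, [=](index<1> i) restrict(amp) {
        dst[i] = 2.0f * src[i];                      // src is never synchronized back
    });
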
3823 
3824 // Forward declarations for copy functions
3825 template <typename _Value_type, int _Rank> concurrency::completion_future copy_async(const array<_Value_type,_Rank>& _Src, array<_Value_type,_Rank>& _Dest);
3826 template <typename _Value_type, int _Rank> void copy(const array<_Value_type,_Rank>& _Src, array<_Value_type,_Rank>& _Dest);
3827 template <typename InputIterator, typename _Value_type, int _Rank> concurrency::completion_future copy_async(InputIterator _SrcFirst, InputIterator _SrcLast, array<_Value_type, _Rank> &_Dest);
3828 template <typename InputIterator, typename _Value_type, int _Rank> void copy(InputIterator _SrcFirst, InputIterator _SrcLast, array<_Value_type, _Rank> &_Dest);
3829 template <typename InputIterator, typename _Value_type, int _Rank> concurrency::completion_future copy_async(InputIterator _SrcFirst, array<_Value_type, _Rank> &_Dest);
3830 template <typename InputIterator, typename _Value_type, int _Rank> void copy(InputIterator _SrcFirst, array<_Value_type, _Rank> &_Dest);
3831 template <typename OutputIterator, typename _Value_type, int _Rank> concurrency::completion_future copy_async(const array<_Value_type, _Rank> &_Src, OutputIterator _DestIter);
3832 template <typename OutputIterator, typename _Value_type, int _Rank> void copy(const array<_Value_type, _Rank> &_Src, OutputIterator _DestIter);
3833 template <typename _Value_type, int _Rank> concurrency::completion_future copy_async(const array<_Value_type, _Rank>& _Src, const array_view<_Value_type, _Rank>& _Dest);
3834 template <typename _Value_type, int _Rank> void copy(const array<_Value_type, _Rank>& _Src, const array_view<_Value_type, _Rank>& _Dest);
3835 template <typename _Value_type, int _Rank> concurrency::completion_future copy_async(const array_view<const _Value_type, _Rank>& _Src, array<_Value_type, _Rank>& _Dest);
3836 template <typename _Value_type, int _Rank> void copy(const array_view<const _Value_type, _Rank>& _Src, array<_Value_type, _Rank>& _Dest);
3837 template <typename _Value_type, int _Rank> concurrency::completion_future copy_async(const array_view<_Value_type, _Rank>& _Src, array<_Value_type, _Rank>& _Dest);
3838 template <typename _Value_type, int _Rank> void copy(const array_view<_Value_type, _Rank>& _Src, array<_Value_type, _Rank>& _Dest);
3839 template <typename _Value_type, int _Rank> concurrency::completion_future copy_async(const array_view<const _Value_type, _Rank>& _Src, const array_view<_Value_type, _Rank>& _Dest);
3840 template <typename _Value_type, int _Rank> void copy(const array_view<const _Value_type, _Rank>& _Src, const array_view<_Value_type, _Rank>& _Dest);
3841 template <typename _Value_type, int _Rank> concurrency::completion_future copy_async(const array_view<_Value_type, _Rank>& _Src, const array_view<_Value_type, _Rank>& _Dest);
3842 template <typename _Value_type, int _Rank> void copy(const array_view<_Value_type, _Rank>& _Src, const array_view<_Value_type, _Rank>& _Dest);
3843 template <typename InputIterator, typename _Value_type, int _Rank> concurrency::completion_future copy_async(InputIterator _SrcFirst, InputIterator _SrcLast, const array_view<_Value_type, _Rank> &_Dest);
3844 template <typename InputIterator, typename _Value_type, int _Rank> concurrency::completion_future copy_async(InputIterator _SrcFirst, const array_view<_Value_type, _Rank> &_Dest);
3845 template <typename InputIterator, typename _Value_type, int _Rank> void copy(InputIterator _SrcFirst, InputIterator _SrcLast, const array_view<_Value_type, _Rank> &_Dest);
3846 template <typename InputIterator, typename _Value_type, int _Rank> void copy(InputIterator _SrcFirst, const array_view<_Value_type, _Rank> &_Dest);
3847 template <typename OutputIterator, typename _Value_type, int _Rank> concurrency::completion_future copy_async(const array_view<_Value_type, _Rank> &_Src, OutputIterator _DestIter);
3848 template <typename OutputIterator, typename _Value_type, int _Rank> void copy(const array_view<_Value_type, _Rank> &_Src, OutputIterator _DestIter);
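
The copy overloads block until the transfer completes; the copy_async forms return a concurrency::completion_future instead. A sketch exercising two of the overloads declared above:

    std::vector<int> host(1000, 1);
    array<int, 1> a(1000);
    copy(host.begin(), host.end(), a);               // blocking host-to-device copy
    array<int, 1> b(1000);
    completion_future f = copy_async(a, b);          // non-blocking device-to-device copy
    f.get();
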
3849 
3850 namespace direct3d
3851 {
3852  template<typename _Value_type, int _Rank>
3853  array<_Value_type,_Rank> make_array(const Concurrency::extent<_Rank>& _Extent, const Concurrency::accelerator_view& _Av, _In_ IUnknown* _D3D_buffer) __CPU_ONLY;
3854 }
3855 
3865 template <typename _Value_type, int _Rank = 1> class array
3866 {
3867  // internal storage abstraction
3868  typedef details::_Buffer_descriptor _Buffer_descriptor;
3869  typedef _Array_flatten_helper<_Rank, typename Concurrency::extent<_Rank>::value_type, typename Concurrency::index<_Rank>::value_type> _Flatten_helper;
3870 
3871  _CPP_AMP_VERIFY_RANK(_Rank, array);
3872  static_assert(!std::is_const<_Value_type>::value, "array<const _Value_type> is not supported");
3873  static_assert(0 == (sizeof(_Value_type) % sizeof(int)), "only value types whose size is a multiple of the size of an integer are allowed in array");
3874 
3875  // Friends
3876  template<typename _Value_type, int _Rank>
3877  friend class array;
3878  friend const _Buffer_descriptor& details::_Get_buffer_descriptor<array<_Value_type,_Rank>>(const array<_Value_type,_Rank>& _Array) __GPU;
3879  friend _Ret_ _Ubiquitous_buffer* details::_Get_buffer<array<_Value_type,_Rank>>(const array<_Value_type,_Rank>& _Array) __CPU_ONLY;
3880  friend _Event details::_Get_access_async<array<_Value_type,_Rank>>(const array<_Value_type,_Rank>& _Array, _Access_mode _Mode, _Buffer_ptr &_Buf_ptr) __CPU_ONLY;
3881 
3882  public:
3883  static const int rank = _Rank;
3884  typedef _Value_type value_type;
3885 
3892  explicit array(const Concurrency::extent<_Rank> & _Extent) __CPU_ONLY
3893  : _M_extent(_Extent)
3894  {
3895  _Initialize(details::_Select_default_accelerator().default_view, access_type_auto);
3896  }
3897 
3904  explicit array(int _E0) __CPU_ONLY
3905  : _M_extent(Concurrency::extent<_Rank>(_E0))
3906  {
3907  static_assert(_Rank == 1, "array(int) is only permissible on array<T, 1>");
3908  _Initialize(details::_Select_default_accelerator().default_view, access_type_auto);
3909  }
3910 
3920  explicit array(int _E0, int _E1) __CPU_ONLY
3921  : _M_extent(Concurrency::extent<_Rank>(_E0, _E1))
3922  {
3923  static_assert(_Rank == 2, "array(int, int) is only permissible on array<T, 2>");
3924  _Initialize(details::_Select_default_accelerator().default_view, access_type_auto);
3925  }
3926 
3939  explicit array(int _E0, int _E1, int _E2) __CPU_ONLY
3940  : _M_extent(Concurrency::extent<_Rank>(_E0, _E1, _E2))
3941  {
3942  static_assert(_Rank == 3, "array(int, int, int) is only permissible on array<T, 3>");
3943  _Initialize(details::_Select_default_accelerator().default_view, access_type_auto);
3944  }
3945 
3962  array(const Concurrency::extent<_Rank>& _Extent, Concurrency::accelerator_view _Av, access_type _Cpu_access_type = access_type_auto) __CPU_ONLY
3963  : _M_extent(_Extent)
3964  {
3965  _Initialize(_Av, _Cpu_access_type);
3966  }
3967 
3984  array(int _E0, Concurrency::accelerator_view _Av, access_type _Cpu_access_type = access_type_auto) __CPU_ONLY
3985  : _M_extent(Concurrency::extent<_Rank>(_E0))
3986  {
3987  static_assert(_Rank == 1, "array(int, accelerator_view) is only permissible on array<T, 1>");
3988  _Initialize(_Av, _Cpu_access_type);
3989  }
3990 
4010  array(int _E0, int _E1, Concurrency::accelerator_view _Av, access_type _Cpu_access_type = access_type_auto) __CPU_ONLY
4011  : _M_extent(Concurrency::extent<_Rank>(_E0, _E1))
4012  {
4013  static_assert(_Rank == 2, "array(int, int, accelerator_view) is only permissible on array<T, 2>");
4014  _Initialize(_Av, _Cpu_access_type);
4015  }
4016 
4039  array(int _E0, int _E1, int _E2, Concurrency::accelerator_view _Av, access_type _Cpu_access_type = access_type_auto) __CPU_ONLY
4040  : _M_extent(Concurrency::extent<_Rank>(_E0, _E1, _E2))
4041  {
4042  static_assert(_Rank == 3, "array(int, int, int, accelerator_view) is only permissible on array<T, 3>");
4043  _Initialize(_Av, _Cpu_access_type);
4044  }
4045 
4058  array(const Concurrency::extent<_Rank>& _Extent, Concurrency::accelerator_view _Av, Concurrency::accelerator_view _Associated_Av) __CPU_ONLY
4059  : _M_extent(_Extent)
4060  {
4061  _Initialize(_Av, _Associated_Av);
4062  }
4063 
4076  array(int _E0, accelerator_view _Av, Concurrency::accelerator_view _Associated_Av) __CPU_ONLY
4077  : _M_extent(Concurrency::extent<_Rank>(_E0))
4078  {
4079  static_assert(_Rank == 1, "array(int, accelerator_view, accelerator_view) is only permissible on array<T, 1>");
4080  _Initialize(_Av, _Associated_Av);
4081  }
4082 
4098  array(int _E0, int _E1, Concurrency::accelerator_view _Av, Concurrency::accelerator_view _Associated_Av) __CPU_ONLY
4099  : _M_extent(Concurrency::extent<_Rank>(_E0, _E1))
4100  {
4101  static_assert(_Rank == 2, "array(int, int, accelerator_view, accelerator_view) is only permissible on array<T, 2>");
4102  _Initialize(_Av, _Associated_Av);
4103  }
4104 
4123  array(int _E0, int _E1, int _E2, Concurrency::accelerator_view _Av, Concurrency::accelerator_view _Associated_Av) __CPU_ONLY
4124  : _M_extent(Concurrency::extent<_Rank>(_E0, _E1, _E2))
4125  {
4126  static_assert(_Rank == 3, "array(int, int, int, accelerator_view, accelerator_view) is only permissible on array<T, 3>");
4127  _Initialize(_Av, _Associated_Av);
4128  }
4129 
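
When _Av is the CPU accelerator's view and _Associated_Av is a device view, the result is a staging array: host-visible memory laid out for fast transfers to the associated accelerator. A sketch (assumes a default device accelerator exists):

    accelerator gpu;                                     // default accelerator
    accelerator cpu(accelerator::cpu_accelerator);
    array<float, 1> staging(1024, cpu.default_view, gpu.default_view);
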
4142  template <typename _InputIterator> array(const Concurrency::extent<_Rank>& _Extent, _InputIterator _Src_first, _InputIterator _Src_last) __CPU_ONLY
4143  : _M_extent(_Extent)
4144  {
4145  _Initialize(details::_Select_default_accelerator().default_view, _Src_first, _Src_last, access_type_auto);
4146  }
4147 
4158  template <typename _InputIterator> array(const Concurrency::extent<_Rank>& _Extent, _InputIterator _Src_first) __CPU_ONLY
4159  : _M_extent(_Extent)
4160  {
4161  _InputIterator _Src_last = _Src_first;
4162  std::advance(_Src_last, this->extent.size());
4163 
4164  _Initialize(details::_Select_default_accelerator().default_view, _Src_first, _Src_last, access_type_auto);
4165  }
4166 
4179  template <typename _InputIterator> array(int _E0, _InputIterator _Src_first, _InputIterator _Src_last) __CPU_ONLY
4180  : _M_extent(Concurrency::extent<_Rank>(_E0))
4181  {
4182  static_assert(_Rank == 1, "array(int, iterator, iterator) is only permissible on array<T, 1>");
4183  _Initialize(details::_Select_default_accelerator().default_view, _Src_first, _Src_last, access_type_auto);
4184  }
4185 
4196  template <typename _InputIterator> array(int _E0, _InputIterator _Src_first) __CPU_ONLY
4197  : _M_extent(Concurrency::extent<_Rank>(_E0))
4198  {
4199  static_assert(_Rank == 1, "array(int, iterator) is only permissible on array<T, 1>");
4200 
4201  _InputIterator _Src_last = _Src_first;
4202  std::advance(_Src_last, this->extent.size());
4203 
4204  _Initialize(details::_Select_default_accelerator().default_view, _Src_first, _Src_last, access_type_auto);
4205  }
4206 
4222  template <typename _InputIterator> array(int _E0, int _E1, _InputIterator _Src_first, _InputIterator _Src_last) __CPU_ONLY
4223  : _M_extent(Concurrency::extent<_Rank>(_E0, _E1))
4224  {
4225  static_assert(_Rank == 2, "array(int, int, iterator, iterator) is only permissible on array<T, 2>");
4226  _Initialize(details::_Select_default_accelerator().default_view, _Src_first, _Src_last, access_type_auto);
4227  }
4228 
4242  template <typename _InputIterator> array(int _E0, int _E1, _InputIterator _Src_first) __CPU_ONLY
4243  : _M_extent(Concurrency::extent<_Rank>(_E0, _E1))
4244  {
4245  static_assert(_Rank == 2, "array(int, int, iterator) is only permissible on array<T, 2>");
4246 
4247  _InputIterator _Src_last = _Src_first;
4248  std::advance(_Src_last, this->extent.size());
4249 
4250  _Initialize(details::_Select_default_accelerator().default_view, _Src_first, _Src_last, access_type_auto);
4251  }
4252 
4269  template <typename _InputIterator> array(int _E0, int _E1, int _E2, _InputIterator _Src_first, _InputIterator _Src_last) __CPU_ONLY
4270  : _M_extent(Concurrency::extent<_Rank>(_E0, _E1, _E2))
4271  {
4272  static_assert(_Rank == 3, "array(int, int, int, iterator, iterator) is only permissible on array<T, 3>");
4273  _Initialize(details::_Select_default_accelerator().default_view, _Src_first, _Src_last, access_type_auto);
4274  }
4275 
4292  template <typename _InputIterator> array(int _E0, int _E1, int _E2, _InputIterator _Src_first) __CPU_ONLY
4293  : _M_extent(Concurrency::extent<_Rank>(_E0, _E1, _E2))
4294  {
4295  static_assert(_Rank == 3, "array(int, int, int, iterator) is only permissible on array<T, 3>");
4296 
4297  _InputIterator _Src_last = _Src_first;
4298  std::advance(_Src_last, this->extent.size());
4299 
4300  _Initialize(details::_Select_default_accelerator().default_view, _Src_first, _Src_last, access_type_auto);
4301  }
4302 
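
For the iterator constructors, the extent determines how many elements are read; the two-iterator forms additionally bound the source range. A sketch:

    std::vector<float> init(2 * 3 * 4, 1.0f);
    array<float, 3> a(2, 3, 4, init.begin(), init.end());
    array<float, 2> b(extent<2>(3, 4), init.begin());   // reads extent.size() elements
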
4325  template <typename _InputIterator> array(const Concurrency::extent<_Rank>& _Extent, _InputIterator _Src_first, _InputIterator _Src_last, Concurrency::accelerator_view _Av, access_type _Cpu_access_type = access_type_auto) __CPU_ONLY
4326  : _M_extent(_Extent)
4327  {
4328  _Initialize(_Av, _Src_first, _Src_last, _Cpu_access_type);
4329  }
4330 
4351  template <typename _InputIterator> array(const Concurrency::extent<_Rank>& _Extent, _InputIterator _Src_first, Concurrency::accelerator_view _Av, access_type _Cpu_access_type = access_type_auto) __CPU_ONLY
4352  : _M_extent(_Extent)
4353  {
4354  _InputIterator _Src_last = _Src_first;
4355  std::advance(_Src_last, this->extent.size());
4356 
4357  _Initialize(_Av, _Src_first, _Src_last, _Cpu_access_type);
4358  }
4359 
4382  template <typename _InputIterator> array(int _E0, _InputIterator _Src_first, _InputIterator _Src_last, Concurrency::accelerator_view _Av, access_type _Cpu_access_type = access_type_auto) __CPU_ONLY
4383  : _M_extent(Concurrency::extent<_Rank>(_E0))
4384  {
4385  static_assert(_Rank == 1, "array(int, iterator, iterator) is only permissible on array<T, 1>");
4386  _Initialize(_Av, _Src_first, _Src_last, _Cpu_access_type);
4387  }
4388 
4409  template <typename _InputIterator> array(int _E0, _InputIterator _Src_first, Concurrency::accelerator_view _Av, access_type _Cpu_access_type = access_type_auto) __CPU_ONLY
4410  : _M_extent(Concurrency::extent<_Rank>(_E0))
4411  {
4412  static_assert(_Rank == 1, "array(int, iterator) is only permissible on array<T, 1>");
4413 
4414  _InputIterator _Src_last = _Src_first;
4415  std::advance(_Src_last, this->extent.size());
4416 
4417  _Initialize(_Av, _Src_first, _Src_last, _Cpu_access_type);
4418  }
4419 
4445  template <typename _InputIterator> array(int _E0, int _E1, _InputIterator _Src_first, _InputIterator _Src_last, Concurrency::accelerator_view _Av, access_type _Cpu_access_type = access_type_auto) __CPU_ONLY
4446  : _M_extent(Concurrency::extent<_Rank>(_E0, _E1))
4447  {
4448  static_assert(_Rank == 2, "array(int, int, iterator, iterator) is only permissible on array<T, 2>");
4449  _Initialize(_Av, _Src_first, _Src_last, _Cpu_access_type);
4450  }
4451 
4475  template <typename _InputIterator> array(int _E0, int _E1, _InputIterator _Src_first, Concurrency::accelerator_view _Av, access_type _Cpu_access_type = access_type_auto) __CPU_ONLY
4476  : _M_extent(Concurrency::extent<_Rank>(_E0, _E1))
4477  {
4478  static_assert(_Rank == 2, "array(int, int, iterator) is only permissible on array<T, 2>");
4479 
4480  _InputIterator _Src_last = _Src_first;
4481  std::advance(_Src_last, this->extent.size());
4482 
4483  _Initialize(_Av, _Src_first, _Src_last, _Cpu_access_type);
4484  }
4485 
4514  template <typename _InputIterator> array(int _E0, int _E1, int _E2, _InputIterator _Src_first, _InputIterator _Src_last, Concurrency::accelerator_view _Av, access_type _Cpu_access_type = access_type_auto) __CPU_ONLY
4515  : _M_extent(Concurrency::extent<_Rank>(_E0, _E1, _E2))
4516  {
4517  static_assert(_Rank == 3, "array(int, int, int, iterator, iterator) is only permissible on array<T, 3>");
4518  _Initialize(_Av, _Src_first, _Src_last, _Cpu_access_type);
4519  }
4520 
4547  template <typename _InputIterator> array(int _E0, int _E1, int _E2, _InputIterator _Src_first, Concurrency::accelerator_view _Av, access_type _Cpu_access_type = access_type_auto) __CPU_ONLY
4548  : _M_extent(Concurrency::extent<_Rank>(_E0, _E1, _E2))
4549  {
4550  static_assert(_Rank == 3, "array(int, int, int, iterator) is only permissible on array<T, 3>");
4551 
4552  _InputIterator _Src_last = _Src_first;
4553  std::advance(_Src_last, this->extent.size());
4554 
4555  _Initialize(_Av, _Src_first, _Src_last, _Cpu_access_type);
4556  }
4557 
4576  template <typename _InputIterator> array(const Concurrency::extent<_Rank>& _Extent, _InputIterator _Src_first, _InputIterator _Src_last, Concurrency::accelerator_view _Av, Concurrency::accelerator_view _Associated_Av) __CPU_ONLY
4577  : _M_extent(_Extent)
4578  {
4579  _Initialize(_Av, _Associated_Av, _Src_first, _Src_last);
4580  }
4581 
4598  template <typename _InputIterator> array(const Concurrency::extent<_Rank>& _Extent, _InputIterator _Src_first, Concurrency::accelerator_view _Av, Concurrency::accelerator_view _Associated_Av) __CPU_ONLY
4599  : _M_extent(_Extent)
4600  {
4601  _InputIterator _Src_last = _Src_first;
4602  std::advance(_Src_last, this->extent.size());
4603 
4604  _Initialize(_Av, _Associated_Av, _Src_first, _Src_last);
4605  }
4606 
4625  template <typename _InputIterator> array(int _E0, _InputIterator _Src_first, _InputIterator _Src_last, Concurrency::accelerator_view _Av, Concurrency::accelerator_view _Associated_Av) __CPU_ONLY
4626  : _M_extent(Concurrency::extent<_Rank>(_E0))
4627  {
4628  static_assert(_Rank == 1, "array(int, iterator, iterator, accelerator_view, accelerator_view) is only permissible on array<T, 1>");
4629  _Initialize(_Av, _Associated_Av, _Src_first, _Src_last);
4630  }
4631 
4648  template <typename _InputIterator> array(int _E0, _InputIterator _Src_first, Concurrency::accelerator_view _Av, Concurrency::accelerator_view _Associated_Av)
4649  : _M_extent(Concurrency::extent<_Rank>(_E0))
4650  {
4651  static_assert(_Rank == 1, "array(int, iterator, accelerator_view, accelerator_view) is only permissible on array<T, 1>");
4652 
4653  _InputIterator _Src_last = _Src_first;
4654  std::advance(_Src_last, this->extent.size());
4655 
4656  _Initialize(_Av, _Associated_Av, _Src_first, _Src_last);
4657  }
4658 
4680  template <typename _InputIterator> array(int _E0, int _E1, _InputIterator _Src_first, _InputIterator _Src_last, Concurrency::accelerator_view _Av, Concurrency::accelerator_view _Associated_Av) __CPU_ONLY
4681  : _M_extent(Concurrency::extent<_Rank>(_E0, _E1))
4682  {
4683  static_assert(_Rank == 2, "array(int, int, iterator, iterator, accelerator_view, accelerator_view) is only permissible on array<T, 2>");
4684  _Initialize(_Av, _Associated_Av, _Src_first, _Src_last);
4685  }
4686 
4706  template <typename _InputIterator> array(int _E0, int _E1, _InputIterator _Src_first, Concurrency::accelerator_view _Av, Concurrency::accelerator_view _Associated_Av) __CPU_ONLY
4707  : _M_extent(Concurrency::extent<_Rank>(_E0, _E1))
4708  {
4709  static_assert(_Rank == 2, "array(int, int, iterator, accelerator_view, accelerator_view) is only permissible on array<T, 2>");
4710 
4711  _InputIterator _Src_last = _Src_first;
4712  std::advance(_Src_last, this->extent.size());
4713 
4714  _Initialize(_Av, _Associated_Av, _Src_first, _Src_last);
4715  }
4716 
4741  template <typename _InputIterator> array(int _E0, int _E1, int _E2, _InputIterator _Src_first, _InputIterator _Src_last, Concurrency::accelerator_view _Av, Concurrency::accelerator_view _Associated_Av) __CPU_ONLY
4742  : _M_extent(Concurrency::extent<_Rank>(_E0, _E1, _E2))
4743  {
4744  static_assert(_Rank == 3, "array(int, int, int, iterator, iterator, accelerator_view, accelerator_view) is only permissible on array<T, 3>");
4745  _Initialize(_Av, _Associated_Av, _Src_first, _Src_last);
4746  }
4747 
4770  template <typename _InputIterator> array(int _E0, int _E1, int _E2, _InputIterator _Src_first, Concurrency::accelerator_view _Av, Concurrency::accelerator_view _Associated_Av) __CPU_ONLY
4771  : _M_extent(Concurrency::extent<_Rank>(_E0, _E1, _E2))
4772  {
4773  static_assert(_Rank == 3, "array(int, int, int, iterator, accelerator_view, accelerator_view) is only permissible on array<T, 3>");
4774 
4775  _InputIterator _Src_last = _Src_first;
4776  std::advance(_Src_last, this->extent.size());
4777 
4778  _Initialize(_Av, _Associated_Av, _Src_first, _Src_last);
4779  }
4780 
4787  explicit array(const array_view<const _Value_type,_Rank>& _Src) __CPU_ONLY
4788  :_M_extent(_Src.extent)
4789  {
4790  _Initialize(details::_Select_default_accelerator().default_view, access_type_auto);
4791  Concurrency::copy(_Src,*this);
4792  }
4793 
4810  array(const array_view<const _Value_type,_Rank>& _Src, Concurrency::accelerator_view _Av, access_type _Cpu_access_type = access_type_auto) __CPU_ONLY
4811  :_M_extent(_Src.extent)
4812  {
4813  _Initialize(_Av, _Cpu_access_type);
4814  Concurrency::copy(_Src,*this);
4815  }
4816 
4829  array(const array_view<const _Value_type,_Rank>& _Src, Concurrency::accelerator_view _Av, Concurrency::accelerator_view _Associated_Av) __CPU_ONLY
4830  :_M_extent(_Src.extent)
4831  {
4832  _Initialize(_Av, _Associated_Av);
4833  Concurrency::copy(_Src,*this);
4834  }
4835 
4839  array(const array& _Other) __CPU_ONLY
4840  : _M_extent(_Other._M_extent)
4841  {
4842  _Initialize(_Other.accelerator_view, _Other.associated_accelerator_view);
4843  Concurrency::copy(_Other, *this);
4844  }
4845 
4849  array(array && _Other) __CPU_ONLY
4850  : _M_extent(_Other._M_extent), _M_multiplier(_Other._M_multiplier)
4851  , _M_buffer_descriptor(_Other._M_buffer_descriptor)
4852  {
4853  // Register this
4854  this->_Register_copy(_Other);
4855 
4856  // Release the _Other array
4857  _Other._Unregister();
4858  _Other._M_buffer_descriptor._M_data_ptr = NULL;
4859  _Other._M_buffer_descriptor._Set_buffer_ptr(NULL);
4860  }
4861 
4865  array & operator= (const array & _Other) __CPU_ONLY
4866  {
4867  if (this != &_Other)
4868  {
4869  // First unregister myself from the current buffer
4870  _Unregister();
4871 
4872  _M_extent = _Other._M_extent;
4873  _Initialize(_Other.accelerator_view, _Other.associated_accelerator_view);
4874  Concurrency::copy(_Other, *this);
4875  }
4876  return *this;
4877  }
4878 
4882  array & operator= (array && _Other) __CPU_ONLY
4883  {
4884  if (this != &_Other)
4885  {
4886  // First unregister myself from the current buffer
4887  _Unregister();
4888 
4889  _M_extent = _Other._M_extent;
4890  _M_multiplier = _Other._M_multiplier;
4891  _M_buffer_descriptor = _Other._M_buffer_descriptor;
4892  this->_Register_copy(_Other);
4893 
4894  // Release the _Other array
4895  _Other._Unregister();
4896  _Other._M_buffer_descriptor._M_data_ptr = NULL;
4897  _Other._M_buffer_descriptor._Set_buffer_ptr(NULL);
4898  }
4899  return *this;
4900  }
4901 
4905  array& operator=(const array_view<const _Value_type,_Rank>& _Src) __CPU_ONLY
4906  {
4907  Concurrency::copy(_Src,*this);
4908  return *this;
4909  }
4910 
4914  void copy_to(array<_Value_type,_Rank>& _Dest) const __CPU_ONLY
4915  {
4916  Concurrency::copy(*this, _Dest);
4917  }
4918 
4922  void copy_to(const array_view<_Value_type,_Rank>& _Dest) const __CPU_ONLY
4923  {
4924  Concurrency::copy(*this,_Dest);
4925  }
4926 
4930  __declspec(property(get=get_extent)) Concurrency::extent<_Rank> extent;
4931  Concurrency::extent<_Rank> get_extent() const __GPU
4932  {
4933  return _M_extent;
4934  }
4935 
4939  __declspec(property(get=get_accelerator_view)) Concurrency::accelerator_view accelerator_view;
4940  Concurrency::accelerator_view get_accelerator_view() const __CPU_ONLY
4941  {
4942  return _Get_buffer()->_Get_master_buffer()->_Get_access_on_accelerator_view();
4943  }
4944 
4948  __declspec(property(get=get_associated_accelerator_view)) Concurrency::accelerator_view associated_accelerator_view;
4949  Concurrency::accelerator_view get_associated_accelerator_view() const __CPU_ONLY
4950  {
4951  return _Get_buffer()->_Get_master_buffer()->_Get_accelerator_view();
4952  }
4953 
4957  __declspec(property(get=get_cpu_access_type)) access_type cpu_access_type;
4958  access_type get_cpu_access_type() const __CPU_ONLY
4959  {
4960  return _Get_buffer()->_Get_master_buffer()->_Get_allowed_host_access_type();
4961  }
4962 
4972  _Value_type& operator[] (const index<_Rank>& _Index) __GPU
4973  {
4974  // Refresh the data ptr if needed
4975  _Refresh_data_ptr(_Read_write_access);
4976 
4977  _Value_type * _Ptr = reinterpret_cast<_Value_type *>(_M_buffer_descriptor._M_data_ptr);
4978  return _Ptr[_Flatten_helper::func(_M_multiplier._M_base, _Index._M_base)];
4979  }
4980 
4990  const _Value_type& operator[] (const index<_Rank>& _Index) const __GPU
4991  {
4992  // Refresh the data ptr if needed
4993 #pragma warning( push )
4994 #pragma warning( disable : 4880 )
4995  // Casting away constness in amp restricted scope might result in
4996  // undefined behavior, therefore, the compiler will report a level 1 warning
4997  // for it. But the following const_cast is harmless thus we are suppressing
4998  // this warning just for this line.
4999  const_cast<array*>(this)->_Refresh_data_ptr(_Read_access);
5000 #pragma warning( pop )
5001 
5002  _Value_type * _Ptr = reinterpret_cast<_Value_type *>(_M_buffer_descriptor._M_data_ptr);
5003  return _Ptr[_Flatten_helper::func(_M_multiplier._M_base, _Index._M_base)];
5004  }
5005 
5016  typename details::_Projection_result_type<_Value_type,_Rank>::_Result_type operator[] (int _I) __GPU
5017  {
5018  return details::_Array_view_projection_helper<_Value_type,_Rank>::_Project0(this, _I);
5019  }
5020 
5031  typename details::_Projection_result_type<_Value_type,_Rank>::_Const_result_type operator[] (int _I) const __GPU
5032  {
5033  return details::_Const_array_view_projection_helper<_Value_type,_Rank>::_Project0(this, _I);
5034  }
5035 
5045  _Value_type& operator() (const index<_Rank>& _Index) __GPU
5046  {
5047  return this->operator[](_Index);
5048  }
5049 
5059  const _Value_type& operator() (const index<_Rank>& _Index) const __GPU
5060  {
5061  return this->operator[](_Index);
5062  }
5063 
5076  _Value_type& operator() (int _I0, int _I1) __GPU
5077  {
5078  static_assert(_Rank == 2, "value_type& array::operator()(int, int) is only permissible on array<T, 2>");
5079  return this->operator[](index<2>(_I0, _I1));
5080  }
5081 
5094  const _Value_type& operator() (int _I0, int _I1) const __GPU
5095  {
5096  static_assert(_Rank == 2, "const value_type& array::operator()(int, int) is only permissible on array<T, 2>");
5097  return this->operator[](index<2>(_I0, _I1));
5098  }
5099 
5115  _Value_type& operator() (int _I0, int _I1, int _I2) __GPU
5116  {
5117  static_assert(_Rank == 3, "value_type& array::operator()(int, int, int) is only permissible on array<T, 3>");
5118  return this->operator[](index<3>(_I0, _I1, _I2));
5119  }
5120 
5136  const _Value_type& operator() (int _I0, int _I1, int _I2) const __GPU
5137  {
5138  static_assert(_Rank == 3, "const value_type& array::operator()(int, int, int) const is only permissible on array<T, 3>");
5139  return this->operator[](index<3>(_I0, _I1, _I2));
5140  }
5141 
5152  typename details::_Projection_result_type<_Value_type,_Rank>::_Result_type operator() (int _I) __GPU
5153  {
5154  return this->operator[](_I);
5155  }
5156 
5167  typename details::_Projection_result_type<_Value_type,_Rank>::_Const_result_type operator() (int _I) const __GPU
5168  {
5169  return this->operator[](_I);
5170  }
5171 
5184  array_view<_Value_type,_Rank> section(const Concurrency::index<_Rank>& _Section_origin, const Concurrency::extent<_Rank>& _Section_extent) __GPU
5185  {
5186  array_view<_Value_type,_Rank> _T1(*this);
5187  return _T1.section(_Section_origin, _Section_extent);
5188  }
5189 
5202  array_view<const _Value_type,_Rank> section(const Concurrency::index<_Rank>& _Section_origin, const Concurrency::extent<_Rank>& _Section_extent) const __GPU
5203  {
5204  array_view<const _Value_type,_Rank> _T1(*this);
5205  return _T1.section(_Section_origin, _Section_extent);
5206  }
5207 
5218  array_view<_Value_type,_Rank> section(const Concurrency::extent<_Rank>& _Ext) __GPU
5219  {
5220  return section(Concurrency::index<_Rank>(), _Ext);
5221  }
5222 
5233  array_view<const _Value_type,_Rank> section(const Concurrency::extent<_Rank>& _Ext) const __GPU
5234  {
5235  return section(Concurrency::index<_Rank>(), _Ext);
5236  }
5237 
5248  array_view<_Value_type,_Rank> section(const Concurrency::index<_Rank>& _Idx) __GPU
5249  {
5250  array_view<_Value_type,_Rank> _T1(*this);
5251  return _T1.section(_Idx);
5252  }
5253 
5264  array_view<const _Value_type,_Rank> section(const Concurrency::index<_Rank>& _Idx) const __GPU
5265  {
5266  array_view<const _Value_type,_Rank> _T1(*this);
5267  return _T1.section(_Idx);
5268  }
5269 
5283  array_view<_Value_type,1> section(int _I0, int _E0) __GPU
5284  {
5285  array_view<_Value_type,_Rank> _T1(*this);
5286  return _T1.section(_I0,_E0);
5287  }
5288 
5302  array_view<const _Value_type,1> section(int _I0, int _E0) const __GPU
5303  {
5304  array_view<const _Value_type,_Rank> _T1(*this);
5305  return _T1.section(_I0,_E0);
5306  }
5307 
5327  array_view<_Value_type,2> section(int _I0, int _I1, int _E0, int _E1) __GPU
5328  {
5329  array_view<_Value_type,_Rank> _T1(*this);
5330  return _T1.section(_I0,_I1,_E0,_E1);
5331  }
5332 
5352  array_view<const _Value_type,2> section(int _I0, int _I1, int _E0, int _E1) const __GPU
5353  {
5354  array_view<const _Value_type,_Rank> _T1(*this);
5355  return _T1.section(_I0,_I1,_E0,_E1);
5356  }
5357 
5383  array_view<_Value_type,3> section(int _I0, int _I1, int _I2, int _E0, int _E1, int _E2) __GPU
5384  {
5385  array_view<_Value_type,_Rank> _T1(*this);
5386  return _T1.section(_I0,_I1,_I2,_E0,_E1,_E2);
5387  }
5388 
5414  array_view<const _Value_type,3> section(int _I0, int _I1, int _I2, int _E0, int _E1, int _E2) const __GPU
5415  {
5416  array_view<const _Value_type,_Rank> _T1(*this);
5417  return _T1.section(_I0,_I1,_I2,_E0,_E1,_E2);
5418  }
5419 
5427  template <typename _Value_type2> array_view<_Value_type2,1> reinterpret_as() __GPU
5428  {
5429  return array_view<_Value_type,1>(_M_buffer_descriptor, Concurrency::extent<1>(extent.size())).template reinterpret_as<_Value_type2>();
5430  }
5431 
5439  template <typename _Value_type2> array_view<const _Value_type2,1> reinterpret_as() const __GPU
5440  {
5441 #pragma warning( push )
5442 #pragma warning( disable : 4880 )
5443  // Casting away constness in amp restricted scope might result in
5444  // undefined behavior, therefore, the compiler will report a level 1 warning
5445  // for it. But the following const_cast is harmless thus we are suppressing
5446  // this warning just for this line.
5447  return const_cast<array*>(this)->reinterpret_as<_Value_type2>();
5448 #pragma warning( pop )
5449  }
5450 
5460  template <int _New_rank> array_view<_Value_type,_New_rank> view_as(const Concurrency::extent<_New_rank>& _View_extent) __GPU
5461  {
5462  return array_view<_Value_type,_New_rank>(_M_buffer_descriptor, _View_extent);
5463  }
5464 
5474  template <int _New_rank> array_view<const _Value_type,_New_rank> view_as(const Concurrency::extent<_New_rank>& _View_extent) const __GPU
5475  {
5476 #pragma warning( push )
5477 #pragma warning( disable : 4880 )
5478  // Casting away constness in amp restricted scope might result in
5479  // undefined behavior, therefore, the compiler will report a level 1 warning
5480  // for it. But the following const_cast is harmless thus we are suppressing
5481  // this warning just for this line.
5482  return const_cast<array*>(this)->view_as<_New_rank>(_View_extent);
5483 #pragma warning( pop )
5484  }
5485 
5489  operator std::vector<_Value_type>() const __CPU_ONLY
5490  {
5491  std::vector<_Value_type> _return_vector(extent.size());
5492  Concurrency::copy(*this, _return_vector.begin());
5493 
5494  return _return_vector;
5495  }
5496 
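
The conversion operator above performs a blocking copy of the whole array into a new host-side vector. A sketch:

    array<int, 1> a(10);
    // ... fill a, e.g. with parallel_for_each ...
    std::vector<int> v = a;    // implicit blocking copy to the host
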
5500  _Ret_ _Value_type* data() __GPU
5501  {
5502  _Refresh_data_ptr(_Read_write_access, false /* _Exception */);
5503  return reinterpret_cast<_Value_type*>(_M_buffer_descriptor._M_data_ptr);
5504  }
5505 
5509  const _Value_type* data() const __GPU
5510  {
5511 #pragma warning( push )
5512 #pragma warning( disable : 4880 )
5513  // Casting away constness in amp restricted scope might result in
5514  // undefined behavior, therefore, the compiler will report a level 1 warning
5515  // for it. But the following const_cast is harmless thus we are suppressing
5516  // this warning just for this line.
5517  const_cast<array*>(this)->_Refresh_data_ptr(_Read_access, false /* _Exception */);
5518 #pragma warning( pop )
5519  return reinterpret_cast<const _Value_type*>(_M_buffer_descriptor._M_data_ptr);
5520  }
5521 
5525  ~array() __CPU_ONLY noexcept(false)
5526  {
5527  bool _Can_throw = (std::current_exception() == nullptr);
5528 
5529  // The destructor should not throw if we are already processing
5530  // an exception, since a second exception would result in termination
5531  try {
5532  _Unregister();
5533  }
5534  catch(...)
5535  {
5536  if (_Can_throw) {
5537  throw;
5538  }
5539  }
5540  }
5541 
5542 private:
5543 
5544  // No default constructor
5545  array() __CPU_ONLY;
5546 
5547  // Private constructor used by direct3d::make_array
5548  array(const Concurrency::extent<_Rank>& _Extent, _Buffer_descriptor _Buffer_descriptor)
5549  : _M_extent(_Extent), _M_buffer_descriptor(_Buffer_descriptor)
5550  {
5551  _Initialize();
5552 
5553  // Register this
5554  this->_Register();
5555  }
5556 
5557  // Initialize
5558  unsigned int _Initialize() __CPU_ONLY
5559  {
5560  details::_Is_valid_extent(_M_extent);
5561 
5562  // Arrays always have a type access mode of '_Is_array_mode'
5563  // This is the mechanism for differentiating between arrays and array_views by the runtime
5564  _M_buffer_descriptor._M_type_access_mode = _Is_array_mode;
5565  unsigned int totalExtent = _M_extent[_Rank-1];
5566  details::_Array_init_helper<Concurrency::extent<_Rank>, Concurrency::extent<_Rank>>::func(totalExtent, _M_multiplier, _M_extent);
5567 
5568  return totalExtent;
5569  }
5570 
5571  // Initialize and allocate on specified accelerator_view
5572  void _Initialize(Concurrency::accelerator_view _Av, access_type _Cpu_access_type) __CPU_ONLY
5573  {
5574  unsigned int totalExtent = _Initialize();
5575  // release the existing buffer, if any, before allocating a new one
5576  _M_buffer_descriptor._Set_buffer_ptr(NULL);
5577 
5578  _Buffer_ptr _PBuf = _Buffer::_Create_buffer(_Av, _Av, totalExtent, sizeof(_Value_type), false /* _Is_temp */, _Cpu_access_type);
5579 
5580  _M_buffer_descriptor._Set_buffer_ptr(_Ubiquitous_buffer::_Create_ubiquitous_buffer(_PBuf));
5581  _Register();
5582  }
5583 
5584  // Initialize and allocate on specified accelerator_view and copy specified data
5585  template <typename _InputIterator>
5586  void _Initialize(Concurrency::accelerator_view _Av, _InputIterator _Src_first, _InputIterator _Src_last, access_type _Cpu_access_type) __CPU_ONLY
5587  {
5588  _Initialize(_Av, _Cpu_access_type);
5589  copy(_Src_first, _Src_last, *this);
5590  }
5591 
5592  // Initialize and allocate on specified accelerator_views
5593  void _Initialize(Concurrency::accelerator_view _Av, Concurrency::accelerator_view _Associated_Av) __CPU_ONLY
5594  {
5595  unsigned int totalExtent = _Initialize();
5596 
5597  // Staging arrays can only be created if the accelerator_view is on the cpu_accelerator
5598  _Buffer_ptr _PBuf = NULL;
5599 
5600  // release the existing buffer, if any, before allocating a new one
5601  _M_buffer_descriptor._Set_buffer_ptr(NULL);
5602 
5603  if (_Is_cpu_accelerator(_Av.accelerator))
5604  {
5605  // If the accelerator _Associated_Av supports zero-copy and the default cpu access type
5606  // for the accelerator is access_type_read_write, create a zero-copy buffer instead of a
5607  // staging buffer
5608  if (_Associated_Av.accelerator.supports_cpu_shared_memory && (_Get_recommended_buffer_host_access_mode(_Associated_Av) == _Read_write_access)) {
5609  _PBuf = _Buffer::_Create_buffer(_Associated_Av, _Av, totalExtent, sizeof(_Value_type), false /* _Is_temp */, access_type_read_write);
5610  }
5611  else {
5612  _PBuf = _Buffer::_Create_stage_buffer(_Associated_Av, _Av, totalExtent, sizeof(_Value_type));
5613  }
5614 
5615  _PBuf->_Map_buffer(_Read_write_access, true /* _Wait */);
5616  }
5617  else
5618  {
5619  _PBuf = _Buffer::_Create_buffer(_Av, _Av, totalExtent, sizeof(_Value_type), false /* _Is_temp */, access_type_auto);
5620  }
5621 
5622  _M_buffer_descriptor._Set_buffer_ptr(_Ubiquitous_buffer::_Create_ubiquitous_buffer(_PBuf));
5623  _Register();
5624  }
5625 
5626  // Initialize and allocate on specified accelerator_views
5627  template <typename _InputIterator>
5628  void _Initialize(Concurrency::accelerator_view _Av, Concurrency::accelerator_view _Associated_Av, _InputIterator _Src_first, _InputIterator _Src_last) __CPU_ONLY
5629  {
5630  _Initialize(_Av, _Associated_Av);
5631  copy(_Src_first, _Src_last, *this);
5632  }
5633 
5634  void _Register() __CPU_ONLY
5635  {
5636  accelerator_view cpuAv = _Is_cpu_accelerator(this->accelerator_view.accelerator) ?
5637  this->accelerator_view : accelerator(accelerator::cpu_accelerator).default_view;
5638  _M_buffer_descriptor._Get_buffer_ptr()->_Register_view(_M_buffer_descriptor._Get_view_key(), cpuAv, _Create_buffer_view_shape());
5639 
5640  _M_buffer_descriptor._Get_buffer_ptr()->_Discard(_M_buffer_descriptor._Get_view_key());
5641 
5642  // If the array is on the CPU accelerator then we will ensure that the descriptor
5643  // indicates CPU access
5644  if (_Is_cpu_accelerator(this->accelerator_view.accelerator))
5645  {
5646  _Buffer_ptr _PBuf = NULL;
5647  this->_Get_access_async(_Read_write_access, _PBuf, false)._Get();
5648  }
5649  }
5650 
5651  void _Register_copy(const array &_Other) __CPU_ONLY
5652  {
5653  _M_buffer_descriptor._Get_buffer_ptr()->_Register_view_copy(_M_buffer_descriptor._Get_view_key(), _Other._M_buffer_descriptor._Get_view_key());
5654  }
5655 
5656  void _Unregister() __CPU_ONLY
5657  {
5658  // No need to unregister if the array was moved causing the buffer ptr to be set to NULL
5659  if (_M_buffer_descriptor._Get_buffer_ptr() != NULL) {
5660  _M_buffer_descriptor._Get_buffer_ptr()->_Unregister_view(_M_buffer_descriptor._Get_view_key());
5661  }
5662  }
5663 
5664  _Ret_ _Ubiquitous_buffer* _Get_buffer() const __CPU_ONLY
5665  {
5666  return _M_buffer_descriptor._Get_buffer_ptr();
5667  }
5668 
5669  _Event _Get_access_async(_Access_mode _Mode, _Buffer_ptr &_Buf_ptr, bool _Zero_copy_cpu_access = false) const __CPU_ONLY
5670  {
5671  _ASSERTE(!_Zero_copy_cpu_access || (_Get_buffer()->_Get_master_buffer()->_Get_allowed_host_access_mode() != _No_access));
5672 
5673  _Buffer_ptr _PBuf;
5674  Concurrency::accelerator_view _Access_av = _Zero_copy_cpu_access ? accelerator(accelerator::cpu_accelerator).default_view : this->accelerator_view;
5675  _Event _Ev = details::_Get_access_async(_M_buffer_descriptor._Get_view_key(),
5676  _Access_av,
5677  _Mode, _PBuf);
5678  _Buf_ptr = _PBuf;
5679 
5680  if (_Is_cpu_accelerator(_Access_av.accelerator)) {
5681  _Ev = _Ev._Add_continuation(std::function<_Event()>([_PBuf, this]() mutable -> _Event {
5682  const_cast<array*>(this)->_M_buffer_descriptor._M_data_ptr = _PBuf->_Get_host_ptr();
5683  return _Event();
5684  }));
5685  }
5686 
5687  return _Ev;
5688  }
5689 
5690  _View_shape_ptr _Create_buffer_view_shape() const __CPU_ONLY
5691  {
5692  _ASSERTE(_Get_buffer()->_Get_master_buffer_elem_size() == sizeof(_Value_type));
5693 
5694  unsigned int _ZeroOffset[_Rank] = {0};
5695  unsigned int _View_extent[_Rank];
5696  for(int i=0; i<_Rank; ++i)
5697  {
5698  _View_extent[i] = static_cast<unsigned int>(this->_M_extent[i]);
5699  }
5700  return _View_shape::_Create_view_shape(static_cast<unsigned int>(_Rank), 0, &_View_extent[0], &_ZeroOffset[0], &_View_extent[0]);
5701  }
5702 
5703  bool _Has_cpu_access() const __CPU_ONLY
5704  {
5705  return (_Get_buffer()->_Get_master_buffer()->_Get_allowed_host_access_mode() != _No_access);
5706  }
5707 
5708  void _Refresh_data_ptr(_Access_mode _Requested_mode, bool _Exception = true) __CPU_ONLY
5709  {
5710  _ASSERTE(_Is_valid_access_mode(_Requested_mode));
5711 
5712  // For an array that has CPU access, the maximum CPU access allowed is that allowed by
5713  // the underlying _Buffer allocation
5714  _Requested_mode = static_cast<_Access_mode>(_Requested_mode & _Get_buffer()->_Get_master_buffer()->_Get_allowed_host_access_mode());
5715 
5716  // Refresh the data ptr if we do not have requested access
5717  if ((_Requested_mode == _No_access) || ((_M_buffer_descriptor._M_curr_cpu_access_mode & _Requested_mode) != _Requested_mode))
5718  {
5719  if (_Has_cpu_access() && (_Requested_mode != _No_access))
5720  {
5721  auto _Span_id = details::_Get_amp_trace()->_Start_array_view_synchronize_event_helper(_M_buffer_descriptor);
5722  _Buffer_ptr _PBuf;
5723  bool _Zero_copy_cpu_access = !_Is_cpu_accelerator(this->accelerator_view.accelerator);
5724  this->_Get_access_async(_Requested_mode, _PBuf, _Zero_copy_cpu_access)._Get();
5725  details::_Get_amp_trace()->_Write_end_event(_Span_id);
5726  }
5727  else
5728  {
5729  if (_Exception)
5730  {
5731  if (!_Has_cpu_access()) {
5732  throw runtime_exception("The array is not accessible on CPU.", E_FAIL);
5733  }
5734  else {
5735  throw runtime_exception("The array is not accessible for reading on CPU.", E_FAIL);
5736  }
5737  }
5738  }
5739  }
5740  }
5741 
5742  void _Refresh_data_ptr(_Access_mode /*_Requested_mode*/, bool /*_Exception*/ = true) __GPU_ONLY
5743  {
5744  }
5745 
5746 private:
5747  // Data members
5748 
5750  Concurrency::extent<_Rank> _M_extent;
5751  // Descriptor of the buffer underlying the array
5752  _Buffer_descriptor _M_buffer_descriptor;
5753 
5754  // The vector used for index calculation.
5755  Concurrency::extent<_Rank> _M_multiplier;
5756 };
5757 
5758 namespace details
5759 {
5760 template <typename _Value_type, int _Rank>
5761 _Event _Copy_async_impl(const array<_Value_type, _Rank>& _Src, array<_Value_type, _Rank>& _Dest)
5762 {
5763  if (_Src.extent.size() > _Dest.extent.size())
5764  {
5765  throw runtime_exception("Invalid _Src argument. _Src size exceeds total size of the _Dest.", E_INVALIDARG);
5766  }
5767 
5768  // We can obliterate the existing content of dest if it is about to be totally overwritten
5769  _Access_mode _Dest_access_mode = (_Src.extent.size() == _Dest.extent.size()) ? _Write_access : _Read_write_access;
5770 
5771  _Buffer_ptr _PBufSrc, _PBufDest;
5772  _Event _Ev = _Get_access_async(_Src, _Read_access, _PBufSrc);
5773  _Ev = _Ev._Add_event(_Get_access_async(_Dest, _Dest_access_mode, _PBufDest));
5774  size_t _NumElemsToCopy = (_Src.extent.size() * sizeof(_Value_type)) / _PBufSrc->_Get_elem_size();
5775  return _Ev._Add_continuation(std::function<_Event()>([_PBufSrc, _PBufDest, _NumElemsToCopy]() mutable -> _Event {
5776  return details::_Copy_impl(_PBufSrc, 0, _PBufDest, 0, _NumElemsToCopy);
5777  }));
5778 }
5779 
5780 template <typename InputIterator, typename _Value_type, int _Rank>
5781 _Event _Copy_async_impl(InputIterator _SrcFirst, InputIterator _SrcLast, array<_Value_type, _Rank> &_Dest)
5782 {
5783  size_t _NumElemsToCopy = std::distance(_SrcFirst, _SrcLast);
5784  // We can obliterate the existing content of dest if it is about to be totally overwritten
5785  _Access_mode _Dest_access_mode = (_NumElemsToCopy == _Dest.extent.size()) ? _Write_access : _Read_write_access;
5786  _Buffer_ptr _PDestBuf;
5787  _Event _Ev = _Get_access_async(_Dest, _Dest_access_mode, _PDestBuf);
5788 
5789  return _Ev._Add_continuation(std::function<_Event()>([_SrcFirst, _SrcLast, _PDestBuf, _NumElemsToCopy]() mutable -> _Event {
5790  return details::_Copy_impl<InputIterator, _Value_type>(_SrcFirst, _SrcLast, _NumElemsToCopy, _PDestBuf, 0);
5791  }));
5792 }
5793 
5794 template <typename OutputIterator, typename _Value_type, int _Rank>
5795 _Event _Copy_async_impl(const array<_Value_type, _Rank> &_Src, OutputIterator _DestIter)
5796 {
5797  _Buffer_ptr _PSrcBuf;
5798  _Event _Ev = _Get_access_async(_Src, _Read_access, _PSrcBuf);
5799  size_t _NumElemsToCopy = (_Src.extent.size() * sizeof(_Value_type)) / _PSrcBuf->_Get_elem_size();
5800  return _Ev._Add_continuation(std::function<_Event()>([_PSrcBuf, _NumElemsToCopy, _DestIter]() mutable -> _Event {
5801  return details::_Copy_impl<OutputIterator, _Value_type>(_PSrcBuf, 0, _NumElemsToCopy, _DestIter);
5802  }));
5803 }
5804 
5805 template <typename _Value_type, int _Rank>
5806 _Event _Copy_async_impl(const array<_Value_type, _Rank>& _Src, const array_view<_Value_type, _Rank>& _Dest)
5807 {
5808  const _Buffer_descriptor &_SrcBufDesc = _Get_buffer_descriptor(_Src);
5809  const _Buffer_descriptor &_DestBufDesc = _Get_buffer_descriptor(_Dest);
5810  if (_SrcBufDesc._Get_buffer_ptr() == _DestBufDesc._Get_buffer_ptr()) {
5811  throw runtime_exception("Cannot copy between overlapping regions of the same buffer.", E_INVALIDARG);
5812  }
5813 
5814  _Buffer_ptr _PSrcBuf, _PDestBuf;
5815  _Event _Ev = _Get_access_async(_Src, _Read_access, _PSrcBuf);
5816 
5817  // The source accelerator_view is driven by array's master location,
5818  // therefore we can pass nullptr to avoid unnecessary computation
5819  auto _AccelInfo = _Get_src_dest_accelerator_view(nullptr, &_DestBufDesc);
5820 
5821  _Ev = _Ev._Add_event(_Get_access_async(_DestBufDesc._Get_view_key(), _AccelInfo.second, _Write_access, _PDestBuf));
5822  _View_shape_ptr _PSrcShape = _Get_buffer_view_shape(_SrcBufDesc);
5823  _View_shape_ptr _PDestShape = _Get_buffer_view_shape(_DestBufDesc);
5824  return _Ev._Add_continuation(std::function<_Event()>([_PSrcBuf, _PSrcShape, _PDestBuf, _PDestShape]() mutable -> _Event {
5825  return details::_Copy_impl(_PSrcBuf, _PSrcShape, _PDestBuf, _PDestShape);
5826  }));
5827 }
5828 
5829 template <typename _Value_type, int _Rank>
5830 _Event _Copy_async_impl(const array_view<const _Value_type, _Rank>& _Src, array<_Value_type, _Rank>& _Dest)
5831 {
5832  const _Buffer_descriptor &_SrcBufDesc = _Get_buffer_descriptor(_Src);
5833  const _Buffer_descriptor &_DestBufDesc = _Get_buffer_descriptor(_Dest);
5834  if (_SrcBufDesc._Get_buffer_ptr() == _DestBufDesc._Get_buffer_ptr()) {
5835  throw runtime_exception("Cannot copy between overlapping regions of the same buffer.", E_INVALIDARG);
5836  }
5837 
5838  auto _AccelInfo = _Get_src_dest_accelerator_view(&_SrcBufDesc, &_DestBufDesc);
5839 
5840  _Buffer_ptr _PSrcBuf, _PDestBuf;
5841  _Event _Ev = _Get_access_async(_SrcBufDesc._Get_view_key(), _AccelInfo.first, _Read_access, _PSrcBuf);
5842  _Ev = _Ev._Add_event(_Get_access_async(_Dest, _Write_access, _PDestBuf));
5843  _View_shape_ptr _PSrcShape = _Get_buffer_view_shape(_SrcBufDesc);
5844  _View_shape_ptr _PDestShape = _Get_buffer_view_shape(_DestBufDesc);
5845  return _Ev._Add_continuation(std::function<_Event()>([_PSrcBuf, _PSrcShape, _PDestBuf, _PDestShape]() mutable -> _Event {
5846  return details::_Copy_impl(_PSrcBuf, _PSrcShape, _PDestBuf, _PDestShape);
5847  }));
5848 }
5849 
5850 template <typename _Value_type, int _Rank>
5851 _Event _Copy_async_impl(const array_view<const _Value_type, _Rank>& _Src, const array_view<_Value_type, _Rank>& _Dest)
5852 {
5853  const _Buffer_descriptor &_SrcBufDesc = _Get_buffer_descriptor(_Src);
5854  const _Buffer_descriptor &_DestBufDesc = _Get_buffer_descriptor(_Dest);
5855  _View_shape_ptr _PSrcShape = _Get_buffer_view_shape(_SrcBufDesc);
5856  _View_shape_ptr _PDestShape = _Get_buffer_view_shape(_DestBufDesc);
5857  if ((_SrcBufDesc._Get_buffer_ptr() == _DestBufDesc._Get_buffer_ptr()) && _PSrcShape->_Overlaps(_PDestShape)) {
5858  throw runtime_exception("Cannot copy between overlapping regions of the same buffer.", E_INVALIDARG);
5859  }
5860 
5861  auto _AccelInfo = _Get_src_dest_accelerator_view(&_SrcBufDesc, &_DestBufDesc);
5862 
5863  _Buffer_ptr _PSrcBuf, _PDestBuf;
5864  _Event _Ev = _Get_access_async(_SrcBufDesc._Get_view_key(), _AccelInfo.first, _Read_access, _PSrcBuf);
5865  _Ev = _Ev._Add_event(_Get_access_async(_DestBufDesc._Get_view_key(), _AccelInfo.second, _Write_access, _PDestBuf));
5866  return _Ev._Add_continuation(std::function<_Event()>([_PSrcBuf, _PSrcShape, _PDestBuf, _PDestShape]() mutable -> _Event {
5867  return details::_Copy_impl(_PSrcBuf, _PSrcShape, _PDestBuf, _PDestShape);
5868  }));
5869 }
5870 
5871 template <typename InputIterator, typename _Value_type, int _Rank>
5872 _Event _Copy_async_impl(InputIterator _SrcFirst, InputIterator _SrcLast, const array_view<_Value_type, _Rank> &_Dest)
5873 {
5874  static_assert(!std::is_const<_Value_type>::value, "Cannot copy to array_view<const _Value_type, _Rank>.");
5875 
5876  size_t _Src_size = std::distance(_SrcFirst, _SrcLast);
5877 
5878  // Source cannot be greater than destination
5879  if (_Src_size > _Dest.extent.size())
5880  {
5881  throw runtime_exception("Number of elements in range between [_SrcFirst, _SrcLast) exceeds total size of the _Dest.", E_INVALIDARG);
5882  }
5883 
5884 #pragma warning( push )
5885 #pragma warning( disable : 4127 ) // Disable warning about constant conditional expression
5886  // Higher ranks need to have as many elements as in _Dest array_view
5887  if ((_Rank > 1) && (_Src_size != _Dest.extent.size()))
5888  {
5889  throw runtime_exception("For _Rank > 1 the number of elements in range between [_SrcFirst, _SrcLast) has to be equal to total size of the _Dest.", E_INVALIDARG);
5890  }
5891 #pragma warning( pop )
5892 
5893  // We can obliterate the existing content of dest if it is about to be totally overwritten
5894  _Access_mode _Dest_access_mode = (_Src_size == _Dest.extent.size()) ? _Write_access : _Read_write_access;
5895 
5896  // Get read-write access for array_view on cpu_accelerator and take underlying pointer to data
5897  const _Buffer_descriptor &_DestBufDesc = _Get_buffer_descriptor(_Dest);
5898 
5899  auto _AccelInfo = _Get_src_dest_accelerator_view(nullptr, &_DestBufDesc);
5900 
5901  _Buffer_ptr _PDestBuf;
5902  _Event _Ev = _Get_access_async(_DestBufDesc._Get_view_key(), _AccelInfo.second, _Dest_access_mode, _PDestBuf);
5903 
5904  _View_shape_ptr _Dst_shape = _Get_buffer_view_shape(_DestBufDesc);
5905 
5906  // If the _Dst shape is linear then perform a linear copy
5907  unsigned int _Dst_linear_offset, _Dst_linear_size;
5908  if (_Dst_shape->_Is_view_linear(_Dst_linear_offset, _Dst_linear_size))
5909  {
5910  _Ev = _Ev._Add_continuation(std::function<_Event()>([_PDestBuf, _SrcFirst, _SrcLast, _Src_size, _Dst_linear_offset]() mutable -> _Event {
5911  return details::_Copy_impl<InputIterator, _Value_type>(_SrcFirst, _SrcLast, _Src_size, _PDestBuf, _Dst_linear_offset);
5912  }));
5913  }
5914  else
5915  {
5916  _View_shape_ptr _Reinterpreted_dst_shape = _Create_reinterpreted_shape(_Dst_shape, _PDestBuf->_Get_elem_size(), sizeof(_Value_type));
5917 
5918  // Source has as many elements as in destination, reshape source to match destination shape
5919  std::vector<unsigned int> _Src_offset(_Reinterpreted_dst_shape->_Get_rank(), 0);
5920  _View_shape_ptr _Src_shape = details::_View_shape::_Create_view_shape(_Reinterpreted_dst_shape->_Get_rank(), 0 /* linear offset*/,
5921  _Reinterpreted_dst_shape->_Get_view_extent(), _Src_offset.data(),
5922  _Reinterpreted_dst_shape->_Get_view_extent());
5923 
5924  _Ev = _Ev._Add_continuation(std::function<_Event()>([_PDestBuf, _SrcFirst, _Src_shape, _Dst_shape]() mutable -> _Event {
5925  return details::_Copy_impl<InputIterator, _Value_type>(_SrcFirst, _Src_shape, _PDestBuf, _Dst_shape);
5926  }));
5927  }
5928 
5929  return _Ev;
5930 }
5931 
5932 template <typename OutputIterator, typename _Value_type, int _Rank>
5933 _Event _Copy_async_impl(const array_view<_Value_type, _Rank> &_Src, OutputIterator _DestIter)
5934 {
5935  // Caller is responsible for passing valid _DestIter
5936 
5937  // Get read access for array_view on cpu_accelerator and take underlying pointer to data
5938  const _Buffer_descriptor &_SrcBufDesc = _Get_buffer_descriptor(_Src);
5939 
5940  auto _AccelInfo = _Get_src_dest_accelerator_view(&_SrcBufDesc, nullptr);
5941 
5942  _Buffer_ptr _PSrcBuf;
5943  _Event _Ev = _Get_access_async(_SrcBufDesc._Get_view_key(), _AccelInfo.first, _Read_access, _PSrcBuf);
5944 
5945  // Get source shape
5946  _View_shape_ptr _Src_shape = _Get_buffer_view_shape(_SrcBufDesc);
5947 
5948  // If the _Src_shape is linear then perform a linear copy
5949  unsigned int _Src_linear_offset, _Src_linear_size;
5950  if (_Src_shape->_Is_view_linear(_Src_linear_offset, _Src_linear_size))
5951  {
5952  _Ev = _Ev._Add_continuation(std::function<_Event()>([_PSrcBuf, _Src_linear_offset, _Src_linear_size, _DestIter]() mutable -> _Event {
5953  return details::_Copy_impl<OutputIterator, _Value_type>(_PSrcBuf, _Src_linear_offset, _Src_linear_size, _DestIter);
5954  }));
5955  }
5956  else
5957  {
5958  _View_shape_ptr _Reinterpreted_src_shape = _Create_reinterpreted_shape(_Src_shape, _PSrcBuf->_Get_elem_size(), sizeof(_Value_type));
5959 
5960  // Valid destination should have space for as many elements as in source array_view, reshape to match source view shape
5961  std::vector<unsigned int> _Dst_offset(_Reinterpreted_src_shape->_Get_rank(), 0);
5962  _View_shape_ptr _Dst_shape = details::_View_shape::_Create_view_shape(_Reinterpreted_src_shape->_Get_rank(), 0 /* linear offset*/,
5963  _Reinterpreted_src_shape->_Get_view_extent(), _Dst_offset.data(),
5964  _Reinterpreted_src_shape->_Get_view_extent());
5965 
5966  _Ev = _Ev._Add_continuation(std::function<_Event()>([_PSrcBuf, _Src_shape, _DestIter, _Dst_shape]() mutable -> _Event {
5967  return details::_Copy_impl<OutputIterator, _Value_type>(_PSrcBuf, _Src_shape, _DestIter, _Dst_shape);
5968  }));
5969  }
5970 
5971  return _Ev;
5972 }
5973 
5974 }
5975 
5988 template <typename _Value_type, int _Rank> concurrency::completion_future copy_async(const array<_Value_type,_Rank>& _Src, array<_Value_type,_Rank>& _Dest)
5989 {
5990  auto _Async_op_id = details::_Get_amp_trace()->_Launch_async_copy_event_helper(_Get_buffer_descriptor(_Src),
5991  _Get_buffer_descriptor(_Dest),
5992  sizeof(_Value_type) * _Src.extent.size());
5993 
5994  auto _Ev = _Copy_async_impl(_Src, _Dest);
5995 
5996  return details::_Get_amp_trace()->_Start_async_op_wait_event_helper(_Async_op_id, _Ev);
5997 }
5998 
6008 template <typename _Value_type, int _Rank> void copy(const array<_Value_type,_Rank>& _Src, array<_Value_type,_Rank>& _Dest)
6009 {
6010  auto _Span_id = details::_Get_amp_trace()->_Start_copy_event_helper(_Get_buffer_descriptor(_Src),
6011  _Get_buffer_descriptor(_Dest),
6012  sizeof(_Value_type) * _Src.extent.size());
6013 
6014  _Copy_async_impl(_Src, _Dest)._Get();
6015 
6016  details::_Get_amp_trace()->_Write_end_event(_Span_id);
6017 }
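// [Editorial usage sketch -- not part of amp.h] A minimal round trip through
// the copy overloads in this header, assuming a C++ AMP capable default
// accelerator; all names below are illustrative:
//
//   #include <amp.h>
//   #include <vector>
//   using namespace concurrency;
//
//   std::vector<float> host(1024, 1.0f);
//   array<float, 1> a(1024);
//   copy(host.begin(), host.end(), a);   // host -> device
//   array<float, 1> b(1024);
//   copy(a, b);                          // device -> device (blocks until done)
//   copy(b, host.begin());               // device -> host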
6018 
6034 template <typename InputIterator, typename _Value_type, int _Rank> concurrency::completion_future copy_async(InputIterator _SrcFirst, InputIterator _SrcLast, array<_Value_type, _Rank> &_Dest)
6035 {
6036  auto _Async_op_id = details::_Get_amp_trace()->_Launch_async_copy_event_helper(nullptr,
6037  _Get_buffer_descriptor(_Dest),
6038  sizeof(_Value_type) * std::distance(_SrcFirst, _SrcLast));
6039 
6040  _Event _Ev = _Copy_async_impl(_SrcFirst, _SrcLast, _Dest);
6041 
6042  return details::_Get_amp_trace()->_Start_async_op_wait_event_helper(_Async_op_id, _Ev);
6043 }
6044 
6057 template <typename InputIterator, typename _Value_type, int _Rank> void copy(InputIterator _SrcFirst, InputIterator _SrcLast, array<_Value_type, _Rank> &_Dest)
6058 {
6059  auto _Span_id = details::_Get_amp_trace()->_Start_copy_event_helper(nullptr,
6060  _Get_buffer_descriptor(_Dest),
6061  sizeof(_Value_type) * std::distance(_SrcFirst, _SrcLast));
6062 
6063  _Copy_async_impl(_SrcFirst, _SrcLast, _Dest)._Get();
6064 
6065  details::_Get_amp_trace()->_Write_end_event(_Span_id);
6066 }
6067 
6081 template <typename InputIterator, typename _Value_type, int _Rank> concurrency::completion_future copy_async(InputIterator _SrcFirst, array<_Value_type, _Rank> &_Dest)
6082 {
6083  InputIterator _SrcLast = _SrcFirst;
6084  std::advance(_SrcLast, _Dest.extent.size());
6085  return copy_async(_SrcFirst, _SrcLast, _Dest);
6086 }
6087 
6098 template <typename InputIterator, typename _Value_type, int _Rank> void copy(InputIterator _SrcFirst, array<_Value_type, _Rank> &_Dest)
6099 {
6100  InputIterator _SrcLast = _SrcFirst;
6101  std::advance(_SrcLast, _Dest.extent.size());
6102  copy(_SrcFirst, _SrcLast, _Dest);
6103 }
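// [Editorial note -- not part of amp.h] The single-iterator overloads above
// advance a copy of _SrcFirst by _Dest.extent.size(), so the source range
// must hold at least that many elements, e.g.:
//
//   std::vector<float> v(2048);
//   array<float, 2> a(32, 64);   // 32 * 64 == 2048 elements
//   copy(v.begin(), a);          // reads v[0] .. v[2047]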
6104 
6117 template <typename OutputIterator, typename _Value_type, int _Rank> concurrency::completion_future copy_async(const array<_Value_type, _Rank> &_Src, OutputIterator _DestIter)
6118 {
6119  _CPP_AMP_VERIFY_MUTABLE_ITERATOR(OutputIterator);
6120 
6121  auto _Async_op_id = details::_Get_amp_trace()->_Launch_async_copy_event_helper(_Get_buffer_descriptor(_Src),
6122  nullptr,
6123  sizeof(_Value_type) * _Src.extent.size());
6124  _Event _Ev = _Copy_async_impl(_Src, _DestIter);
6125 
6126  return details::_Get_amp_trace()->_Start_async_op_wait_event_helper(_Async_op_id, _Ev);
6127 }
6128 
6138 template <typename OutputIterator, typename _Value_type, int _Rank> void copy(const array<_Value_type, _Rank> &_Src, OutputIterator _DestIter)
6139 {
6140  _CPP_AMP_VERIFY_MUTABLE_ITERATOR(OutputIterator);
6141 
6142  auto _Span_id = details::_Get_amp_trace()->_Start_copy_event_helper(_Get_buffer_descriptor(_Src),
6143  nullptr,
6144  sizeof(_Value_type) * _Src.extent.size());
6145 
6146  _Copy_async_impl(_Src, _DestIter)._Get();
6147 
6148  details::_Get_amp_trace()->_Write_end_event(_Span_id);
6149 }
6150 
6163 template <typename _Value_type, int _Rank> concurrency::completion_future copy_async(const array<_Value_type, _Rank>& _Src, const array_view<_Value_type, _Rank>& _Dest)
6164 {
6165  auto _Async_op_id = details::_Get_amp_trace()->_Launch_async_copy_event_helper(_Get_buffer_descriptor(_Src),
6166  _Get_buffer_descriptor(_Dest),
6167  sizeof(_Value_type) * _Src.extent.size());
6168 
6169  _Event _Ev = _Copy_async_impl(_Src, _Dest);
6170 
6171  return details::_Get_amp_trace()->_Start_async_op_wait_event_helper(_Async_op_id, _Ev);
6172 }
6173 
6183 template <typename _Value_type, int _Rank> void copy(const array<_Value_type, _Rank>& _Src, const array_view<_Value_type, _Rank>& _Dest)
6184 {
6185  auto _Span_id = details::_Get_amp_trace()->_Start_copy_event_helper(_Get_buffer_descriptor(_Src),
6186  _Get_buffer_descriptor(_Dest),
6187  sizeof(_Value_type) * _Src.extent.size());
6188 
6189  _Copy_async_impl(_Src, _Dest)._Get();
6190 
6191  details::_Get_amp_trace()->_Write_end_event(_Span_id);
6192 }
6193 
6206 template <typename _Value_type, int _Rank> concurrency::completion_future copy_async(const array_view<const _Value_type, _Rank>& _Src, array<_Value_type, _Rank>& _Dest)
6207 {
6208  auto _Async_op_id = details::_Get_amp_trace()->_Launch_async_copy_event_helper(_Get_buffer_descriptor(_Src),
6209  _Get_buffer_descriptor(_Dest),
6210  sizeof(_Value_type) * _Src.extent.size());
6211 
6212  _Event _Ev = _Copy_async_impl(_Src, _Dest);
6213 
6214  return details::_Get_amp_trace()->_Start_async_op_wait_event_helper(_Async_op_id, _Ev);
6215 }
6216 
6226 template <typename _Value_type, int _Rank> void copy(const array_view<const _Value_type, _Rank>& _Src, array<_Value_type, _Rank>& _Dest)
6227 {
6228  auto _Span_id = details::_Get_amp_trace()->_Start_copy_event_helper(_Get_buffer_descriptor(_Src),
6229  _Get_buffer_descriptor(_Dest),
6230  sizeof(_Value_type) * _Src.extent.size());
6231 
6232  _Copy_async_impl(_Src, _Dest)._Get();
6233 
6234  details::_Get_amp_trace()->_Write_end_event(_Span_id);
6235 }
6236 
6249 template <typename _Value_type, int _Rank> concurrency::completion_future copy_async(const array_view<_Value_type, _Rank>& _Src, array<_Value_type, _Rank>& _Dest)
6250 {
6251  return copy_async<_Value_type, _Rank>(array_view<const _Value_type, _Rank>(_Src), _Dest);
6252 }
6253 
6263 template <typename _Value_type, int _Rank> void copy(const array_view<_Value_type, _Rank>& _Src, array<_Value_type, _Rank>& _Dest)
6264 {
6265  copy<_Value_type, _Rank>(array_view<const _Value_type, _Rank>(_Src), _Dest);
6266 }
6267 
6280 template <typename _Value_type, int _Rank> concurrency::completion_future copy_async(const array_view<const _Value_type, _Rank>& _Src, const array_view<_Value_type, _Rank>& _Dest)
6281 {
6282  auto _Async_op_id = details::_Get_amp_trace()->_Launch_async_copy_event_helper(_Get_buffer_descriptor(_Src),
6283  _Get_buffer_descriptor(_Dest),
6284  sizeof(_Value_type) * _Src.extent.size());
6285 
6286  _Event _Ev = _Copy_async_impl(_Src, _Dest);
6287 
6288  return details::_Get_amp_trace()->_Start_async_op_wait_event_helper(_Async_op_id, _Ev);
6289 }
6290 
6300 template <typename _Value_type, int _Rank> void copy(const array_view<const _Value_type, _Rank>& _Src, const array_view<_Value_type, _Rank>& _Dest)
6301 {
6302  auto _Span_id = details::_Get_amp_trace()->_Start_copy_event_helper(_Get_buffer_descriptor(_Src),
6303  _Get_buffer_descriptor(_Dest),
6304  sizeof(_Value_type) * _Src.extent.size());
6305 
6306  _Copy_async_impl(_Src, _Dest)._Get();
6307 
6308  details::_Get_amp_trace()->_Write_end_event(_Span_id);
6309 }
6310 
6323 template <typename _Value_type, int _Rank> concurrency::completion_future copy_async(const array_view<_Value_type, _Rank>& _Src, const array_view<_Value_type, _Rank>& _Dest)
6324 {
6325  return copy_async<_Value_type, _Rank>(array_view<const _Value_type, _Rank>(_Src), _Dest);
6326 }
6327 
6337 template <typename _Value_type, int _Rank> void copy(const array_view<_Value_type, _Rank>& _Src, const array_view<_Value_type, _Rank>& _Dest)
6338 {
6339  copy<_Value_type, _Rank>(array_view<const _Value_type, _Rank>(_Src), _Dest);
6340 }
6341 
6357 template <typename InputIterator, typename _Value_type, int _Rank> concurrency::completion_future copy_async(InputIterator _SrcFirst, InputIterator _SrcLast, const array_view<_Value_type, _Rank> &_Dest)
6358 {
6359  auto _Async_op_id = details::_Get_amp_trace()->_Launch_async_copy_event_helper(nullptr,
6360  _Get_buffer_descriptor(_Dest),
6361  sizeof(_Value_type) * std::distance(_SrcFirst, _SrcLast));
6362 
6363  _Event _Ev = _Copy_async_impl(_SrcFirst, _SrcLast, _Dest);
6364 
6365  return details::_Get_amp_trace()->_Start_async_op_wait_event_helper(_Async_op_id, _Ev);
6366 }
6367 
6381 template <typename InputIterator, typename _Value_type, int _Rank> concurrency::completion_future copy_async(InputIterator _SrcFirst, const array_view<_Value_type, _Rank> &_Dest)
6382 {
6383  InputIterator _SrcLast = _SrcFirst;
6384  std::advance(_SrcLast, _Dest.extent.size());
6385  return copy_async(_SrcFirst, _SrcLast, _Dest);
6386 }
6387 
6400 template <typename InputIterator, typename _Value_type, int _Rank> void copy(InputIterator _SrcFirst, InputIterator _SrcLast, const array_view<_Value_type, _Rank> &_Dest)
6401 {
6402  auto _Span_id = details::_Get_amp_trace()->_Start_copy_event_helper(nullptr,
6403  _Get_buffer_descriptor(_Dest),
6404  sizeof(_Value_type) * std::distance(_SrcFirst, _SrcLast));
6405 
6406  _Copy_async_impl(_SrcFirst, _SrcLast, _Dest)._Get();
6407 
6408  details::_Get_amp_trace()->_Write_end_event(_Span_id);
6409 }
6410 
6421 template <typename InputIterator, typename _Value_type, int _Rank> void copy(InputIterator _SrcFirst, const array_view<_Value_type, _Rank> &_Dest)
6422 {
6423  InputIterator _SrcLast = _SrcFirst;
6424  std::advance(_SrcLast, _Dest.extent.size());
6425  copy(_SrcFirst, _SrcLast, _Dest);
6426 }
6427 
6440 template <typename OutputIterator, typename _Value_type, int _Rank> concurrency::completion_future copy_async(const array_view<_Value_type, _Rank> &_Src, OutputIterator _DestIter)
6441 {
6442  _CPP_AMP_VERIFY_MUTABLE_ITERATOR(OutputIterator);
6443 
6444  // Caller is responsible for passing valid _DestIter
6445  auto _Async_op_id = details::_Get_amp_trace()->_Launch_async_copy_event_helper(_Get_buffer_descriptor(_Src),
6446  nullptr,
6447  sizeof(_Value_type) * _Src.extent.size());
6448 
6449  _Event _Ev = _Copy_async_impl(_Src, _DestIter);
6450 
6451  return details::_Get_amp_trace()->_Start_async_op_wait_event_helper(_Async_op_id, _Ev);
6452 }
6453 
6463 template <typename OutputIterator, typename _Value_type, int _Rank> void copy(const array_view<_Value_type, _Rank> &_Src, OutputIterator _DestIter)
6464 {
6465  _CPP_AMP_VERIFY_MUTABLE_ITERATOR(OutputIterator);
6466 
6467  auto _Span_id = details::_Get_amp_trace()->_Start_copy_event_helper(_Get_buffer_descriptor(_Src),
6468  nullptr,
6469  sizeof(_Value_type) * _Src.extent.size());
6470 
6471  _Copy_async_impl(_Src, _DestIter)._Get();
6472 
6473  details::_Get_amp_trace()->_Write_end_event(_Span_id);
6474 }
6475 
6476 // Namespace for Direct3D specific functionality
6477 namespace direct3d
6478 {
6494  template<typename _Value_type, int _Rank> _Ret_ IUnknown *get_buffer(const array<_Value_type, _Rank> &_Array) __CPU_ONLY
6495  {
6496  _Buffer_ptr _PBuf;
6497  _Get_access_async(_Array, _Read_write_access, _PBuf)._Get();
6498  return _Buffer::_Get_D3D_buffer(_PBuf);
6499  }
6500 
6522  template<typename _Value_type, int _Rank> array<_Value_type, _Rank> make_array(const Concurrency::extent<_Rank> &_Extent, const Concurrency::accelerator_view &_Av, _In_ IUnknown *_D3D_buffer) __CPU_ONLY
6523  {
6525  details::_Is_valid_extent(_Extent);
6526  if (_D3D_buffer == NULL)
6527  {
6528  throw runtime_exception("NULL D3D buffer pointer.", E_INVALIDARG);
6529  }
6530 
6531  if (!details::_Is_D3D_accelerator_view(_Av))
6532  {
6533  throw runtime_exception("Cannot create D3D buffer on a non-D3D accelerator_view.", E_INVALIDARG);
6534  }
6535 
6536  _Ubiquitous_buffer_ptr _PBuf = _Ubiquitous_buffer::_Create_ubiquitous_buffer(_Buffer::_Create_buffer(_D3D_buffer, _Av, _Extent.size(), sizeof(_Value_type)));
6537  return array<_Value_type, _Rank>(_Extent, _Buffer_descriptor(_PBuf->_Get_master_buffer()->_Get_host_ptr(), _PBuf, _Is_array_mode, _Read_write_access));
6538  }
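// [Editorial interop sketch -- not part of amp.h] Wrapping an existing
// Direct3D 11 buffer in an array; d3d_device and d3d_buffer stand for
// application-created ID3D11Device/ID3D11Buffer pointers (illustrative):
//
//   accelerator_view av = direct3d::create_accelerator_view(d3d_device);
//   array<float, 1> arr =
//       direct3d::make_array<float, 1>(extent<1>(1024), av, d3d_buffer);
//   IUnknown *raw = direct3d::get_buffer(arr);   // back to the D3D interface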
6539 
6540 } // namespace Concurrency::direct3d
6541 
6542 //=============================================================================
6543 // Atomic Operation Library
6544 //=============================================================================
6545 
6546 #define AS_UINT_PTR(p) reinterpret_cast<unsigned int *>(p)
6547 #define AS_UINT(v) *(reinterpret_cast<unsigned int *>(&(v)))
6548 #define AS_INT(v) *(reinterpret_cast<int *>(&(v)))
6549 #define AS_FLOAT(v) *(reinterpret_cast<float *>(&(v)))
6550 
6563 inline int atomic_fetch_add(_Inout_ int * _Dest, int _Value) __GPU_ONLY
6564 {
6565  unsigned int _Ret;
6566  _Ret = __dp_d3d_interlocked_add(AS_UINT_PTR(_Dest), AS_UINT(_Value));
6567  return AS_INT(_Ret);
6568 }
6569 
6582 inline unsigned int atomic_fetch_add(_Inout_ unsigned int * _Dest, unsigned int _Value) __GPU_ONLY
6583 {
6584  return __dp_d3d_interlocked_add(_Dest, _Value);
6585 }
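// [Editorial usage sketch -- not part of amp.h] atomic_fetch_add lets many
// GPU threads safely bump one shared counter (names illustrative):
//
//   std::vector<int> total(1, 0);
//   array_view<int, 1> counter(1, total);
//   parallel_for_each(extent<1>(4096), [=](index<1>) restrict(amp) {
//       atomic_fetch_add(&counter[0], 1);
//   });
//   counter.synchronize();   // total[0] is now 4096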
6586 
6599 inline int atomic_fetch_sub(_Inout_ int * _Dest, int _Value) __GPU_ONLY
6600 {
6601  unsigned int _Ret;
6602  int _Neg = -_Value;
6603  _Ret = __dp_d3d_interlocked_add(AS_UINT_PTR(_Dest), AS_UINT(_Neg));
6604  return AS_INT(_Ret);
6605 }
6606 
6619 
6620 inline unsigned int atomic_fetch_sub(_Inout_ unsigned int * _Dest, unsigned int _Value) __GPU_ONLY
6621 {
6622 #pragma warning( push )
6623 #pragma warning( disable : 4146 )
6624  // Warning 4146: unary minus operator applied to unsigned type, result
6625  // still unsigned.
6626  //
6627  // This is what we want here. The resulting unsigned value has the
6628  // right binary representation for achieving subtraction.
6629  return __dp_d3d_interlocked_add(_Dest, (-_Value));
6630 #pragma warning( pop )
6631 }
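// [Editorial note -- not part of amp.h] Worked example of the wrap-around
// relied on above: in 32-bit unsigned arithmetic -5u == 0xFFFFFFFB, so
// 100u + 0xFFFFFFFB == 95u (mod 2^32); adding the negation subtracts.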
6632 
6633 
6643 inline int atomic_fetch_inc(_Inout_ int * _Dest) __GPU_ONLY
6644 {
6645  unsigned int _Ret;
6646  _Ret = __dp_d3d_interlocked_add(AS_UINT_PTR(_Dest), 1U);
6647  return AS_INT(_Ret);
6648 }
6649 
6659 inline unsigned int atomic_fetch_inc(_Inout_ unsigned int * _Dest) __GPU_ONLY
6660 {
6661  return __dp_d3d_interlocked_add(_Dest, 1U);
6662 }
6663 
6673 inline int atomic_fetch_dec(_Inout_ int * _Dest) __GPU_ONLY
6674 {
6675 #pragma warning( push )
6676 #pragma warning( disable : 4146 )
6677  // Warning 4146: unary minus operator applied to unsigned type, result
6678  // still unsigned.
6679  unsigned int _Ret;
6680  _Ret = __dp_d3d_interlocked_add(AS_UINT_PTR(_Dest), (-(1U)));
6681  return AS_INT(_Ret);
6682 #pragma warning( pop )
6683 }
6684 
6694 inline unsigned int atomic_fetch_dec(_Inout_ unsigned int * _Dest) __GPU_ONLY
6695 {
6696 #pragma warning( push )
6697 #pragma warning( disable : 4146 )
6698  // Warning 4146: unary minus operator applied to unsigned type, result
6699  // still unsigned.
6700  return __dp_d3d_interlocked_add(_Dest, (-(1U)));
6701 #pragma warning( pop )
6702 }
6703 
6716 inline int atomic_exchange(_Inout_ int * _Dest, int _Value) __GPU_ONLY
6717 {
6718  unsigned int _Ret = __dp_d3d_interlocked_exchange(AS_UINT_PTR(_Dest), AS_UINT(_Value));
6719  return AS_INT(_Ret);
6720 }
6721 
6734 inline unsigned int atomic_exchange(_Inout_ unsigned int * _Dest, unsigned int _Value) __GPU_ONLY
6735 {
6736  return __dp_d3d_interlocked_exchange(_Dest, _Value);
6737 }
6738 
6751 inline float atomic_exchange(_Inout_ float * _Dest, float _Value) __GPU_ONLY
6752 {
6753  unsigned int _Ret = __dp_d3d_interlocked_exchange(AS_UINT_PTR(_Dest), AS_UINT(_Value));
6754  return AS_FLOAT(_Ret);
6755 }
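// [Editorial note -- not part of amp.h] atomic_exchange is the only atomic in
// this header with a float overload; it swaps raw bit patterns through the
// unsigned intrinsic. For an array_view<float, 1> av inside a restrict(amp)
// kernel (illustrative):
//
//   float prev = atomic_exchange(&av[0], 3.5f);   // returns the old value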
6756 
6775 inline bool atomic_compare_exchange(_Inout_ int * _Dest, _Inout_ int * _Expected_value, int _Value) __GPU_ONLY
6776 {
6777  int _Old = *_Expected_value;
6778  unsigned int _Ret = __dp_d3d_interlocked_compare_exchange(AS_UINT_PTR(_Dest), AS_UINT(_Value), AS_UINT(_Old));
6779  if (_Ret == AS_UINT(_Old))
6780  {
6781  return true;
6782  }
6783  else
6784  {
6785  *_Expected_value = AS_INT(_Ret);
6786  return false;
6787  }
6788 }
6789 
6808 inline bool atomic_compare_exchange(_Inout_ unsigned int * _Dest, _Inout_ unsigned int * _Expected_value, unsigned int _Value) __GPU_ONLY
6809 {
6810  unsigned int _Old = *_Expected_value;
6811  unsigned int _Ret = __dp_d3d_interlocked_compare_exchange(_Dest, _Value, _Old);
6812  if (_Ret == _Old)
6813  {
6814  return true;
6815  }
6816  else
6817  {
6818  *_Expected_value = _Ret;
6819  return false;
6820  }
6821 }
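// [Editorial usage sketch -- not part of amp.h] Because a failed
// atomic_compare_exchange writes the value it found into *_Expected_value,
// the usual retry loop needs no separate reload (inside restrict(amp);
// dest is an illustrative array_view<int, 1>):
//
//   int expected = dest[0];
//   while (!atomic_compare_exchange(&dest[0], &expected, expected * 2)) {
//       // expected now holds the current value; recompute and retry
//   }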
6822 
6836 inline int atomic_fetch_max(_Inout_ int * _Dest, int _Value) __GPU_ONLY
6837 {
6838  return __dp_d3d_interlocked_max_int(_Dest, _Value);
6839 }
6840 
6854 inline unsigned int atomic_fetch_max(_Inout_ unsigned int * _Dest, unsigned int _Value) __GPU_ONLY
6855 {
6856  return __dp_d3d_interlocked_max_uint(_Dest, _Value);
6857 }
6858 
6859 
6873 inline int atomic_fetch_min(_Inout_ int * _Dest, int _Value) __GPU_ONLY
6874 {
6875  return __dp_d3d_interlocked_min_int(_Dest, _Value);
6876 }
6877 
6891 inline unsigned int atomic_fetch_min(_Inout_ unsigned int * _Dest, unsigned int _Value) __GPU_ONLY
6892 {
6893  return __dp_d3d_interlocked_min_uint(_Dest, _Value);
6894 }
6895 
6908 inline int atomic_fetch_and(_Inout_ int * _Dest, int _Value) __GPU_ONLY
6909 {
6910  unsigned int _Ret;
6911  _Ret = __dp_d3d_interlocked_and(AS_UINT_PTR(_Dest), AS_UINT(_Value));
6912  return AS_INT(_Ret);
6913 }
6914 
6927 inline unsigned int atomic_fetch_and(_Inout_ unsigned int * _Dest, unsigned int _Value) __GPU_ONLY
6928 {
6929  return __dp_d3d_interlocked_and(_Dest, _Value);
6930 }
6931 
6932 
6945 inline int atomic_fetch_or(_Inout_ int * _Dest, int _Value) __GPU_ONLY
6946 {
6947  unsigned int _Ret;
6948  _Ret = __dp_d3d_interlocked_or(AS_UINT_PTR(_Dest), AS_UINT(_Value));
6949  return AS_INT(_Ret);
6950 }
6951 
6964 inline unsigned int atomic_fetch_or(_Inout_ unsigned int * _Dest, unsigned int _Value) __GPU_ONLY
6965 {
6966  return __dp_d3d_interlocked_or(_Dest, _Value);
6967 }
6968 
6981 inline int atomic_fetch_xor(_Inout_ int * _Dest, int _Value) __GPU_ONLY
6982 {
6983  unsigned int _Ret;
6984  _Ret = __dp_d3d_interlocked_xor(AS_UINT_PTR(_Dest), AS_UINT(_Value));
6985  return AS_INT(_Ret);
6986 }
6987 
7000 inline unsigned int atomic_fetch_xor(_Inout_ unsigned int * _Dest, unsigned int _Value) __GPU_ONLY
7001 {
7002  return __dp_d3d_interlocked_xor(_Dest, _Value);
7003 }
7004 
7005 //=============================================================================
7006 // parallel_for_each
7007 //=============================================================================
7008 
7020 template <int _Rank, typename _Kernel_type> void parallel_for_each(const extent<_Rank>& _Compute_domain, const _Kernel_type &_Kernel)
7021 {
7022  _Host_Scheduling_info _SchedulingInfo = {accelerator::get_auto_selection_view()};
7023  details::_Parallel_for_each(&_SchedulingInfo, _Compute_domain, _Kernel);
7024 }
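// [Editorial usage sketch -- not part of amp.h] Minimal dispatch over an
// extent, assuming a default accelerator (names illustrative):
//
//   std::vector<int> v(256);
//   array_view<int, 1> av(256, v);
//   parallel_for_each(av.extent, [=](index<1> idx) restrict(amp) {
//       av[idx] = idx[0] * 2;
//   });
//   av.synchronize();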
7025 
7037 template <int _Dim0, int _Dim1, int _Dim2, typename _Kernel_type> void parallel_for_each(const tiled_extent<_Dim0, _Dim1, _Dim2>& _Compute_domain, const _Kernel_type& _Kernel)
7038 {
7039  _Host_Scheduling_info _SchedulingInfo = {accelerator::get_auto_selection_view()};
7040  details::_Parallel_for_each(&_SchedulingInfo, _Compute_domain, _Kernel);
7041 }
7042 
7054 template <int _Dim0, int _Dim1, typename _Kernel_type> void parallel_for_each(const tiled_extent<_Dim0, _Dim1>& _Compute_domain, const _Kernel_type& _Kernel)
7055 {
7056  _Host_Scheduling_info _SchedulingInfo = {accelerator::get_auto_selection_view()};
7057  details::_Parallel_for_each(&_SchedulingInfo, _Compute_domain, _Kernel);
7058 }
7059 
7071 template <int _Dim0, typename _Kernel_type> void parallel_for_each(const tiled_extent<_Dim0>& _Compute_domain, const _Kernel_type& _Kernel)
7072 {
7073  _Host_Scheduling_info _SchedulingInfo = {accelerator::get_auto_selection_view()};
7074  details::_Parallel_for_each(&_SchedulingInfo, _Compute_domain, _Kernel);
7075 }
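// [Editorial usage sketch -- not part of amp.h] extent::tile<>() produces the
// tiled_extent consumed by the overloads above; the kernel then receives a
// tiled_index with global, local and tile coordinates (av illustrative):
//
//   extent<1> e(1024);
//   parallel_for_each(e.tile<256>(), [=](tiled_index<256> t) restrict(amp) {
//       av[t.global] = t.local[0];
//   });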
7076 
7089 template <int _Rank, typename _Kernel_type> void parallel_for_each(const accelerator_view& _Accl_view, const extent<_Rank>& _Compute_domain, const _Kernel_type& _Kernel)
7090 {
7091  _Host_Scheduling_info _SchedulingInfo = {_Accl_view};
7092  details::_Parallel_for_each(&_SchedulingInfo, _Compute_domain, _Kernel);
7093 }
7094 
7108 template <int _Dim0, int _Dim1, int _Dim2, typename _Kernel_type> void parallel_for_each(const accelerator_view& _Accl_view, const tiled_extent<_Dim0, _Dim1, _Dim2>& _Compute_domain, const _Kernel_type& _Kernel)
7109 {
7110  _Host_Scheduling_info _SchedulingInfo = {_Accl_view};
7111  details::_Parallel_for_each(&_SchedulingInfo, _Compute_domain, _Kernel);
7112 }
7113 
7127 template <int _Dim0, int _Dim1, typename _Kernel_type> void parallel_for_each(const accelerator_view& _Accl_view, const tiled_extent<_Dim0, _Dim1>& _Compute_domain, const _Kernel_type& _Kernel)
7128 {
7129  _Host_Scheduling_info _SchedulingInfo = {_Accl_view};
7130  details::_Parallel_for_each(&_SchedulingInfo, _Compute_domain, _Kernel);
7131 }
7132 
7146 template <int _Dim0, typename _Kernel_type> void parallel_for_each(const accelerator_view& _Accl_view, const tiled_extent<_Dim0>& _Compute_domain, const _Kernel_type& _Kernel)
7147 {
7148  _Host_Scheduling_info _SchedulingInfo = {_Accl_view};
7149  details::_Parallel_for_each(&_SchedulingInfo, _Compute_domain, _Kernel);
7150 }
7151 
7152 
7153 
7154 //=============================================================================
7155 
7156 extern "C"
7157 {
7158 
7159 // Debugging intrinsics
7160 void direct3d_abort() __GPU_ONLY;
7161 void direct3d_errorf(const char *, ...) __GPU_ONLY;
7162 void direct3d_printf(const char *, ...) __GPU_ONLY;
7163 
7164 }
7165 
7168 
7169 #pragma warning( push )
7170 #pragma warning( disable : 4100 ) // unreferenced formal parameter
7171 
7178 inline void all_memory_fence(const tile_barrier & _Barrier) __GPU_ONLY
7179 {
7180  __dp_d3d_all_memory_fence_with_tile_barrier();
7181 }
7182 
7189 inline void global_memory_fence(const tile_barrier & _Barrier) __GPU_ONLY
7190 {
7191  __dp_d3d_device_memory_fence_with_tile_barrier();
7192 }
7193 
7200 inline void tile_static_memory_fence(const tile_barrier & _Barrier) __GPU_ONLY
7201 {
7202  __dp_d3d_tile_static_memory_fence_with_tile_barrier();
7203 }
7204 
7205 #pragma warning( pop )
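// [Editorial usage sketch -- not part of amp.h] tile_static staging with the
// fences above; tile_barrier::wait() combines an all_memory_fence with a
// synchronization point, so the plain fences serve the lighter-weight cases
// (in, out and ext are illustrative captures):
//
//   parallel_for_each(ext.tile<64>(), [=](tiled_index<64> t) restrict(amp) {
//       tile_static float s[64];
//       s[t.local[0]] = in[t.global];
//       t.barrier.wait();                 // fence + barrier
//       if (t.local[0] == 0) {
//           float sum = 0.0f;
//           for (int i = 0; i < 64; ++i) sum += s[i];
//           out[t.tile[0]] = sum;
//       }
//   });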
7206 
7207 
7208 
7209 namespace direct3d
7210 {
7211 
7221 inline int abs(int _X) __GPU_ONLY
7222 {
7223  return __dp_d3d_absi(_X);
7224 }
7225 
7241 inline float clamp(float _X, float _Min, float _Max) __GPU_ONLY
7242 {
7243  return __dp_d3d_clampf(_X, _Min, _Max);
7244 }
7245 
7261 inline int clamp(int _X, int _Min, int _Max) __GPU_ONLY
7262 {
7263  return __dp_d3d_clampi(_X, _Min, _Max);
7264 }
7265 
7275 inline unsigned int countbits(unsigned int _X) __GPU_ONLY
7276 {
7277  return __dp_d3d_countbitsu(_X);
7278 }
7279 
7289 inline int firstbithigh(int _X) __GPU_ONLY
7290 {
7291  return __dp_d3d_firstbithighi(_X);
7292 }
7293 
7303 inline int firstbitlow(int _X) __GPU_ONLY
7304 {
7305  return __dp_d3d_firstbitlowi(_X);
7306 }
7307 
7320 inline int imax(int _X, int _Y) __GPU_ONLY
7321 {
7322  return __dp_d3d_maxi(_X, _Y);
7323 }
7324 
7337 inline int imin(int _X, int _Y) __GPU_ONLY
7338 {
7339  return __dp_d3d_mini(_X, _Y);
7340 }
7341 
7354 inline unsigned int umax(unsigned int _X, unsigned int _Y) __GPU_ONLY
7355 {
7356  return __dp_d3d_maxu(_X, _Y);
7357 }
7358 
7371 inline unsigned int umin(unsigned int _X, unsigned int _Y) __GPU_ONLY
7372 {
7373  return __dp_d3d_minu(_X, _Y);
7374 }
7375 
7391 inline float mad(float _X, float _Y, float _Z) __GPU_ONLY
7392 {
7393  return __dp_d3d_madf(_X, _Y, _Z);
7394 }
7395 
7411 inline double mad(double _X, double _Y, double _Z) __GPU_ONLY
7412 {
7413  return __dp_d3d_madd(_X, _Y, _Z);
7414 }
7415 
7431 inline int mad(int _X, int _Y, int _Z) __GPU_ONLY
7432 {
7433  return __dp_d3d_madi(_X, _Y, _Z);
7434 }
7435 
7451 inline unsigned int mad(unsigned int _X, unsigned int _Y, unsigned int _Z) __GPU_ONLY
7452 {
7453  return __dp_d3d_madu(_X, _Y, _Z);
7454 }
7455 
7465 inline float noise(float _X) __GPU_ONLY
7466 {
7467  return __dp_d3d_noisef(_X);
7468 }
7469 
7479 inline float radians(float _X) __GPU_ONLY
7480 {
7481  return __dp_d3d_radiansf(_X);
7482 }
7483 
7493 inline float rcp(float _X) __GPU_ONLY
7494 {
7495  return __dp_d3d_rcpf(_X);
7496 }
7497 
7507 inline unsigned int reversebits(unsigned int _X) __GPU_ONLY
7508 {
7509  return __dp_d3d_reversebitsu(_X);
7510 }
7511 
7521 inline float saturate(float _X) __GPU_ONLY
7522 {
7523  return __dp_d3d_saturatef(_X);
7524 }
7525 
7535 inline int sign(int _X) __GPU_ONLY
7536 {
7537  return __dp_d3d_signi(_X);
7538 }
7539 
7555 inline float smoothstep(float _Min, float _Max, float _X) __GPU_ONLY
7556 {
7557  return __dp_d3d_smoothstepf(_Min, _Max, _X);
7558 }
7559 
7572 inline float step(float _Y, float _X) __GPU_ONLY
7573 {
7574  return __dp_d3d_stepf(_Y, _X);
7575 }
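// [Editorial usage sketch -- not part of amp.h] These wrappers are
// restrict(amp)-only, so they are called from inside kernels; av stands for a
// captured array_view<float, 1> (illustrative):
//
//   parallel_for_each(av.extent, [=](index<1> i) restrict(amp) {
//       av[i] = direct3d::mad(av[i], 2.0f, 1.0f);      // fused a * b + c
//       av[i] = direct3d::clamp(av[i], 0.0f, 10.0f);
//   });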
7576 
7577 } // namespace Concurrency::direct3d
7578 
7579 } // namespace Concurrency
7580 
7581 #include <xxamp_inl.h>
7582 
7583 namespace concurrency = Concurrency;
7584 
7585 #pragma pack(pop)
7586 // End of file
int __dp_d3d_interlocked_min_int(_Inout_ int *, int) __GPU_ONLY
array(int _E0, int _E1, int _E2) __CPU_ONLY
Construct an array from three integer extents.
Definition: amp.h:3939
tiled_extent(const tiled_extent &_Other) __GPU
Copy constructor. Constructs a new tiled_extent from the supplied argument "_Other".
Definition: amp.h:1296
_Array_view_base(_In_ void *_Data, const Concurrency::extent< _Rank > &_Array_extent) __GPU_ONLY
Definition: amp.h:1821
void synchronize() const __CPU_ONLY
Synchronizes any modifications made to "this" array_view to its source data.
Definition: amp.h:3751
friend class accelerator
Definition: amprt.h:1444
static _Projection_result_type< _T, _R >::_Result_type _Project0(const array_view< _T, _R > *_Arr_view, int _I) __GPU
Definition: xxamp_inl.h:42
tiled_extent truncate() const __GPU
Returns a new tiled_extent with extents adjusted down to be evenly divisible by the tile dimensions...
Definition: amp.h:1499
array_view(const array< _Value_type, _Rank > &_Src) __GPU
Construct an array_view which is bound to the data contained in the _Src array. The extent of the arr...
Definition: amp.h:3067
_Buffer_descriptor _M_buffer_descriptor
Definition: amp.h:5752
accelerator_view get_source_accelerator_view() const
Returns the accelerator_view where the data source of the array_view is located. If the array_view do...
Definition: amp.h:2968
int __dp_d3d_firstbitlowi(int) __GPU_ONLY
array_view section(const Concurrency::index< _Rank > &_Idx) const __GPU
Produces a subsection of the source array_view with origin specified by an index, with an extent of (...
Definition: amp.h:3562
int atomic_fetch_or(_Inout_ int *_Dest, int _Value) __GPU_ONLY
Performs an atomic bitwise or operation of _Value to the memory location pointed to by _Dest ...
Definition: amp.h:6945
void refresh() const __CPU_ONLY
Informs the array_view that its bound memory has been modified outside the array_view interface...
Definition: amp.h:2836
array(int _E0, int _E1, int _E2, Concurrency::accelerator_view _Av, access_type _Cpu_access_type=access_type_auto) __CPU_ONLY
Construct an array from three integer extents, bound to a specific accelerator_view.
Definition: amp.h:4039
_CPP_AMP_VERIFY_RANK(_Rank, index)
array_view section(int _I0, int _E0) const __GPU
Produces a one-dimensional subsection of the source array_view with origin specified by the index com...
Definition: amp.h:2734
index< _Rank > & operator-=(int _Rhs) __GPU
Subtracts an integer value from each element of this index.
Definition: amp.h:243
reference operator[](size_type _Pos)
Definition: array:140
Concurrency::extent< _Rank > _M_array_multiplier
Definition: amp.h:1669
void _Initialize(Concurrency::accelerator_view _Av, Concurrency::accelerator_view _Associated_Av) __CPU_ONLY
Definition: amp.h:5593
#define NULL
Definition: vcruntime.h:236
array(int _E0, _InputIterator _Src_first, Concurrency::accelerator_view _Av, access_type _Cpu_access_type=access_type_auto) __CPU_ONLY
Construct an array initialized from an iterator into a container, bound to a specific accelerator_vie...
Definition: amp.h:4409
array_view< _Value_type, 3 > section(int _I0, int _I1, int _I2, int _E0, int _E1, int _E2) __GPU
Produces a three-dimensional subsection of the source array with origin specified by the index compon...
Definition: amp.h:5383
array_view(int _E0, _Container &_Src) __CPU_ONLY
Construct an array_view which is bound to the data contained in the _Src container.
Definition: amp.h:2373
array(array &&_Other) __CPU_ONLY
Move constructor.
Definition: amp.h:4849
details::_Buffer_descriptor _Buffer_descriptor
Definition: amp.h:1685
float __dp_d3d_radiansf(float) __GPU_ONLY
unsigned int __dp_d3d_interlocked_add(_Inout_ unsigned int *, unsigned int) __GPU_ONLY
index operator--(int) __GPU
Post-decrements each element of this index.
Definition: amp.h:337
const unsigned int * _Get_base_extent() const
Definition: amprt.h:1601
int atomic_exchange(_Inout_ int *_Dest, int _Value) __GPU_ONLY
Sets the value of location pointed to by _Dest to _Value as an atomic operation
Definition: amp.h:6716
std::enable_if< details::_Is_extent_or_index< _Tuple_type< _Rank > >::value, bool >::type operator==(const _Tuple_type< _Rank > &_Lhs, const _Tuple_type< _Rank > &_Rhs) __GPU
Definition: amp.h:822
_Tuple_type _Create_uninitialized_tuple() __GPU
Definition: xxamp.h:214
index< _Rank > & operator++() __GPU
Pre-increments each element of this index.
Definition: amp.h:300
array_view() __GPU
Definition: amp.h:2994
details::_Projection_result_type< _Value_type, _Rank >::_Result_type operator[](int _I) __GPU
Projects the most-significant dimension of this array. If the array rank is 1, this produces a single...
Definition: amp.h:5016
void all_memory_fence(const tile_barrier &_Barrier) __GPU_ONLY
Memory fences and tile barriers.
Definition: amp.h:7178
array_view(int _E0, int _E1, int _E2, const _Container &_Src) __CPU_ONLY
Construct an array_view which is bound to the data contained in the _Src container.
Definition: amp.h:3241
const index< rank > global
An index that represents the global index within an extent.
Definition: amp.h:1013
constexpr auto size(const _Container &_Cont) -> decltype(_Cont.size())
Definition: xutility:1478
tiled_index< _Dim0, _Dim1 > _map_index(const index< rank > &_Local, const index< rank > &_Tile, const index< rank > &_Global, tile_barrier &_Barrier) const __GPU
Definition: amp.h:1435
_AMPIMP _Event _Add_continuation(const std::function< _Event __cdecl()> &_Continuation_task)
Creates an event which is an ordered collection of this and a continuation task
_AMPIMP _Access_mode __cdecl _Get_recommended_buffer_host_access_mode(const accelerator_view &_Av)
const _Value_type * data() const __GPU
Returns a pointer to the raw data of this array.
Definition: amp.h:5509
array_view section(int _I0, int _I1, int _E0, int _E1) const __GPU
Produces a two-dimensional subsection of the source array_view with origin specified by the index com...
Definition: amp.h:2759
array_view(const array_view &_Other) __GPU
Copy constructor. Shallow copy.
Definition: amp.h:2283
float __dp_d3d_madf(float, float, float) __GPU_ONLY
~_Array_view_shape() __GPU
Definition: amp.h:1568
const unsigned int * _Get_view_offset() const
Definition: amprt.h:1606
_Event _Get_access_async(const _View_key _Key, accelerator_view _Av, _Access_mode _Mode, _Buffer_ptr &_Buf_ptr)
Definition: amprt.h:3389
array_view< _Value_type, _Rank > section(const Concurrency::index< _Rank > &_Section_origin, const Concurrency::extent< _Rank > &_Section_extent) __GPU
Produces a subsection of the source array at the given origin and extent.
Definition: amp.h:5184
details::_Buffer_descriptor _Buffer_descriptor
Definition: amp.h:3868
void _Register_copy(const _Array_view_base &_Other) __CPU_ONLY
Definition: amp.h:2026
void _Register_copy(const _Array_view_base &) __GPU_ONLY
Definition: amp.h:2192
~array_view() __GPU
Destroys this array_view and reclaims resources.
Definition: amp.h:2265
Definition: amprt.h:91
index< _Rank > & operator+=(int _Rhs) __GPU
Adds an integer value to each element of this index.
Definition: amp.h:228
Definition: xxamp.h:242
extent< _Rank > & operator+=(int _Rhs) __GPU
Adds an integer value to each element of this extent.
Definition: amp.h:670
Definition: xxamp.h:236
unsigned int __dp_d3d_interlocked_xor(_Inout_ unsigned int *, unsigned int) __GPU_ONLY
array_view(int _E0) __CPU_ONLY
Construct an array_view which is not bound to a data source.
Definition: amp.h:2339
index< _Rank > & operator/=(int _Rhs) __GPU
Divides each element of this index by an integer value.
Definition: amp.h:273
index< _Rank > operator++(int) __GPU
Post-increments each element of this index.
Definition: amp.h:312
tiled_extent & operator=(const tiled_extent &_Other) __GPU
copy-assignment operator
Definition: amp.h:1471
array(int _E0, _InputIterator _Src_first, _InputIterator _Src_last, Concurrency::accelerator_view _Av, access_type _Cpu_access_type=access_type_auto) __CPU_ONLY
Construct an array initialized from a pair of iterators into a container, bound to a specific acceler...
Definition: amp.h:4382
array_view(const _In_ _Value_type(&_Src)[_Size]) __GPU
Construct an array_view which is bound to the data contained in the _Src container; ...
Definition: amp.h:3199
_Array_view_base< _Rank, _New_element_size > _Reinterpret_as() const __GPU
Definition: amp.h:1922
int __dp_d3d_clampi(int, int, int) __GPU_ONLY
array_view< _Value_type2, _Rank > reinterpret_as() const __GPU
Produces a (possibly unsafe) reinterpretation of this array_view that is linear and with a different ...
Definition: amp.h:2804
unsigned int __dp_d3d_madu(unsigned int, unsigned int, unsigned int) __GPU_ONLY
_Value_type value_type
Definition: amp.h:2259
void _Register() __GPU_ONLY
Definition: amp.h:2190
array_view(const Concurrency::extent< _Rank > &_Extent) __CPU_ONLY
Construct an array_view which is not bound to a data source.
Definition: amp.h:2295
_eInitializeState
Definition: xxamp.h:208
_Array_view_base(const void *_Data, const Concurrency::extent< _Rank > &_Array_extent) __CPU_ONLY
Definition: amp.h:1827
extent< _Rank > operator-(const index< _Rank > &_Rhs) const __GPU
Element-wise subtraction of this extent with an index.
Definition: amp.h:594
static _Ret_ void * _Create_section_buffer_shape(const _Buffer_descriptor &_Descriptor, const Concurrency::index< _Rank > &_Section_origin, const Concurrency::extent< _Rank > &_Section_extent) __CPU_ONLY
Definition: amp.h:2119
const index< rank > tile
An index that represents the coordinates of the current tile of a tiled_extent.
Definition: amp.h:1023
void refresh() const __CPU_ONLY
Informs the array_view that its bound memory has been modified outside the array_view interface...
Definition: amp.h:3682
Definition: array:21
array_view< const _Value_type, _New_rank > view_as(const Concurrency::extent< _New_rank > &_View_extent) const __GPU
Produces an array_view of a different rank over this array_view's data.
Definition: amp.h:3664
void _Project0(int _I, _Array_view_base< _Rank-1, _Element_size > &_Projected_view) const __GPU
Definition: amp.h:1912
void _Refresh_data_ptr(_Access_mode, bool=true) __GPU_ONLY
Definition: amp.h:5742
array_view(const array_view &_Other, const Concurrency::index< _Rank > &_Section_origin, const Concurrency::extent< _Rank > &_Section_extent) __GPU
Definition: amp.h:3798
tiled_extent & operator=(const tiled_extent &_Other) __GPU
copy-assignment operator
Definition: amp.h:1389
float noise(float _X) __GPU_ONLY
Generates a random value using the Perlin noise algorithm
Definition: amp.h:7465
array_view< _Value_type, 1 > section(int _I0, int _E0) __GPU
Produces a one-dimensional subsection of the source array with origin specified by the index componen...
Definition: amp.h:5283
unsigned int __dp_d3d_interlocked_or(_Inout_ unsigned int *, unsigned int) __GPU_ONLY
#define __GPU
Definition: amprt.h:45
std::enable_if< details::_Is_extent_or_index< _Tuple_type< _Rank > >::value, _Tuple_type< _Rank > >::type operator*(const _Tuple_type< _Rank > &_Lhs, typename _Tuple_type< _Rank >::value_type _Rhs) __GPU
Definition: amp.h:890
_Array_view_base< _New_rank, _Element_size > _View_as(const Concurrency::extent< _New_rank > &_View_extent) const __GPU
Definition: amp.h:1932
Concurrency::extent< _Rank > _M_multiplier
Definition: amp.h:5755
Definition: xxamp.h:238
index< _Rank > & operator--() __GPU
Pre-decrements each element of this index.
Definition: amp.h:325
array_view< const _Value_type, _Rank > section(const Concurrency::extent< _Rank > &_Ext) const __GPU
Produces a subsection of the source array_view with origin of zero, with an extent of _Ext...
Definition: amp.h:5233
array(const array &_Other) __CPU_ONLY
Copy constructor. Deep copy.
Definition: amp.h:4839
tiled_extent() __GPU
Default constructor.
Definition: amp.h:1285
tiled_extent pad() const __GPU
Returns a new tiled_extent with extents adjusted up to be evenly divisible by the tile dimensions...
Definition: amp.h:1408
_In_ int _Val
Definition: vcruntime_string.h:62
int __dp_d3d_maxi(int, int) __GPU_ONLY
Class represents a virtual device abstraction on a C++ AMP data-parallel accelerator ...
Definition: amprt.h:1442
index< _Rank > & operator-=(const index< _Rank > &_Rhs) __GPU
Element-wise subtraction of this index with another index.
Definition: amp.h:213
_Array_view_shape(const _Array_view_shape &_Other) __GPU
Definition: amp.h:1576
_AMPIMP std::pair< accelerator_view, accelerator_view > __cdecl _Get_src_dest_accelerator_view(_In_opt_ const _Buffer_descriptor *_SrcBuffDescPtr, _In_opt_ const _Buffer_descriptor *_DestBuffDescPtr)
extent< _Rank > & operator++() __GPU
Pre-increments each element of this extent.
Definition: amp.h:742
bool _Local() const _NOEXCEPT
Definition: functional:419
static _AMPIMP _Ret_ IUnknown *__cdecl _Get_D3D_buffer(_In_ _Buffer *_Buffer_ptr)
void _Project0(int _I, array_view< const _Value_type, _Rank-1 > &_Projected_view) const __GPU
Definition: amp.h:3790
int firstbitlow(int _X) __GPU_ONLY
Gets the location of the first set bit in _X, starting from the lowest order bit and working upward ...
Definition: amp.h:7303
_Array_view_base(const _Buffer_descriptor &_Buffer_desc, int _Base_linear_offset, const Concurrency::extent< _Rank > &_Array_extent, const Concurrency::index< _Rank > &_View_offset, const Concurrency::extent< _Rank > &_View_extent) __GPU_ONLY
Definition: amp.h:1769
static _AMPIMP _Ret_ _View_shape *__cdecl _Create_view_shape(unsigned int _Rank, unsigned int _Linear_offset, const unsigned int *_Base_extent, const unsigned int *_View_offset, const unsigned int *_View_extent, const bool *_Projection_info=NULL)
array_view< _Value_type2, 1 > reinterpret_as() __GPU
Produces a (possibly unsafe) reinterpretation of this array that is linear and with a different eleme...
Definition: amp.h:5427
The Concurrency namespace provides classes and functions that provide access to the Concurrency Runti...
Definition: agents.h:43
Class represents a future corresponding to a C++ AMP asynchronous operation
Definition: amprt.h:1266
array_view< const _Value_type, 3 > section(int _I0, int _I1, int _I2, int _E0, int _E1, int _E2) const __GPU
Produces a three-dimensional subsection of the source array with origin specified by the index compon...
Definition: amp.h:5414
static void _Is_valid_extent(const _T< _Rank > &_Tuple) __CPU_ONLY
Definition: xxamp.h:1195
bool _Is_valid_access_mode(_Access_mode _Mode)
Definition: amprt.h:417
unsigned int size() const __GPU
Returns the total linear size of this extent (in units of elements).
Definition: amp.h:521
unsigned int __dp_d3d_maxu(unsigned int, unsigned int) __GPU_ONLY
float __dp_d3d_smoothstepf(float, float, float) __GPU_ONLY
void _Project0(int _I, array_view< _Value_type, _Rank-1 > &_Projected_view) const __GPU
Definition: amp.h:2988
extent< _Rank > & operator--() __GPU
Pre-decrements each element of this extent.
Definition: amp.h:767
array_view(const Concurrency::extent< _Rank > &_Extent, _Value_type *_Src) __GPU
Construct an array_view which is bound to the data pointed to by _Src.
Definition: amp.h:2327
unsigned int umax(unsigned int _X, unsigned int _Y) __GPU_ONLY
Determine the maximum numeric value of the arguments
Definition: amp.h:7354
concurrency::completion_future synchronize_to_async(const accelerator_view &_Accl_view) const __CPU_ONLY
Asynchronously synchronizes any modifications made to "this" array_view to the specified accelerator_...
Definition: amp.h:3697
A _Tiled_index_base is the base class of all three kinds of tiled_index to share the common code...
Definition: amp.h:1002
array< _Value_type, _Rank > make_array(const Concurrency::extent< _Rank > &_Extent, const Concurrency::accelerator_view &_Av, _In_ IUnknown *_D3D_buffer) __CPU_ONLY
Create an array from a D3D buffer interface pointer.
Definition: amp.h:6522
float __dp_d3d_clampf(float, float, float) __GPU_ONLY
array_view(int _E0, int _E1, int _E2) __CPU_ONLY
Construct an array_view which is not bound to a data source.
Definition: amp.h:2429
array_view section(int _I0, int _I1, int _E0, int _E1) const __GPU
Produces a two-dimensional subsection of the source array_view with origin specified by the index com...
Definition: amp.h:3605
static _Ret_ void * _Create_section_buffer_shape(const _Buffer_descriptor &, const Concurrency::index< _Rank > &, const Concurrency::extent< _Rank > &) __GPU_ONLY
Definition: amp.h:2209
array(const Concurrency::extent< _Rank > &_Extent, _InputIterator _Src_first, Concurrency::accelerator_view _Av, access_type _Cpu_access_type=access_type_auto) __CPU_ONLY
Construct an array initialized from an iterator into a container, bound to a specific accelerator_vie...
Definition: amp.h:4351
tiled_extent(const Concurrency::extent< rank > &_Other) __GPU
Constructs a new tiled_extent from the supplied extent.
Definition: amp.h:1459
double __dp_d3d_madd(double, double, double) __GPU_ONLY
const bool * _Get_projection_info() const
Definition: amprt.h:1615
void __dp_d3d_tile_static_memory_fence_with_tile_barrier() __GPU_ONLY
_Array_flatten_helper< _Rank, typename Concurrency::extent< _Rank >::value_type, typename Concurrency::index< _Rank >::value_type > _Flatten_helper
Definition: amp.h:3869
array(int _E0) __CPU_ONLY
Construct array with the extent _E0
Definition: amp.h:3904
_Buffer_descriptor _M_buffer_descriptor
Definition: amp.h:2003
float rcp(float _X) __GPU_ONLY
Calculates a fast, approximate reciprocal of the argument
Definition: amp.h:7493
_Ret_ _View_shape * _Create_buffer_view_shape() const __CPU_ONLY
Definition: amp.h:1942
_Ret_ _View_shape * _Create_buffer_view_shape() const
Definition: amp.h:5690
integral_constant< bool, false > false_type
Definition: xtr1common:41
array_view(array< _Value_type, _Rank > &_Src) __GPU
Construct an array_view which is bound to the data contained in the _Src array. The extent of the arr...
Definition: amp.h:2274
_Array_view_base(const _Array_view_base &_Other, const Concurrency::index< _Rank > &_Section_origin, const Concurrency::extent< _Rank > &_Section_extent) __GPU
Definition: amp.h:1727
array_view(const array_view< _Value_type, _Rank > &_Src) __GPU
Copy constructor. Shallow copy.
Definition: amp.h:3076
Definition: xxamp.h:240
_AMPIMP void _Register_view(_In_ _View_key _Key, accelerator_view _Cpu_av, _View_shape_ptr _Shape, _In_opt_ const _View_key _Source_view_key=nullptr)
array(int _E0, accelerator_view _Av, Concurrency::accelerator_view _Associated_Av) __CPU_ONLY
Construct a staging array between two associated accelerator_view.
Definition: amp.h:4076
_Tiled_index_base & operator=(const _Tiled_index_base &) __GPU
array(const array_view< const _Value_type, _Rank > &_Src, accelerator_view _Av, access_type _Cpu_access_type=access_type_auto) __CPU_ONLY
Construct an array initialized from an array_view, bound to a specific accelerator_view.
Definition: amp.h:4810
A tiled_index is a set of indices of 1 to 3 dimensions which have been subdivided into 1-...
Definition: amp.h:1096
_AMPIMP bool __cdecl _Is_D3D_accelerator_view(const accelerator_view &_Av)
_AMPIMP void _Get()
Wait until the _Event completes and throw any exceptions that occur.
array(const Concurrency::extent< _Rank > &_Extent, _InputIterator _Src_first, _InputIterator _Src_last, Concurrency::accelerator_view _Av, access_type _Cpu_access_type=access_type_auto) __CPU_ONLY
Construct an array initialized from a pair of iterators into a container, bound to a specific acceler...
Definition: amp.h:4325
unsigned int
Definition: vccorlib.h:2468
extent(const int _Array[_Rank]) __GPU
Constructs an extent with the coordinate values provided the array of int component values...
Definition: amp.h:476
_AMPIMP _Ret_ _Amp_runtime_trace *__cdecl _Get_amp_trace()
int atomic_fetch_dec(_Inout_ int *_Dest) __GPU_ONLY
Performs an atomic decrement to the memory location pointed to by _Dest
Definition: amp.h:6673
concurrency::completion_future synchronize_async(access_type _Access_type=access_type_read) const __CPU_ONLY
Asynchronously synchronizes any modifications made to "this" array_view to its source data...
Definition: amp.h:2885
array(const Concurrency::extent< _Rank > &_Extent) __CPU_ONLY
Construct an array from extents
Definition: amp.h:3892
_Array_view_base(const _Buffer_descriptor &_Buffer_desc, const Concurrency::extent< _Rank > &_Array_extent) __GPU
Definition: amp.h:1736
tiled_index(const tiled_index &_Other) __GPU
Copy Constructor.
Definition: amp.h:1131
Definition: amprt.h:93
unsigned int reversebits(unsigned int _X) __GPU_ONLY
Reverses the order of the bits in _X
Definition: amp.h:7507
void wait_with_all_memory_fence() const __GPU_ONLY
Blocks execution of all threads in a tile until all all threads in the tile have reached this call...
Definition: amp.h:974
#define UINT_MAX
Definition: limits.h:36
extent() __GPU
Default constructor. The value at each dimension is initialized to zero.
Definition: amp.h:404
const unsigned int * _Get_view_extent() const
Definition: amprt.h:1610
static _AMPIMP const wchar_t cpu_accelerator[]
String constant for cpu accelerator
Definition: amprt.h:1035
extent< _Rank > & operator%=(int _Rhs) __GPU
Modulus an integer value from each element of this extent.
Definition: amp.h:730
_Array_view_shape(int _Base_linear_offset, const Concurrency::extent< _Rank > &_Array_extent) __GPU
Definition: amp.h:1599
array_view & operator=(const array_view< _Value_type, _Rank > &_Other) __GPU
Copy Assignment operator. Shallow copy.
Definition: amp.h:3381
void _Initialize(Concurrency::accelerator_view _Av, access_type _Cpu_access_type) __CPU_ONLY
Definition: amp.h:5572
static void _Is_valid_section(const _T2< _Rank > &_Base_extent, const _T1< _Rank > &_Section_origin, const _T2< _Rank > &_Section_extent) __CPU_ONLY
Definition: xxamp.h:1106
int atomic_fetch_max(_Inout_ int *_Dest, int _Value) __GPU_ONLY
Atomically computes the maximum of _Value and the value of the memory location pointed to by _Dest...
Definition: amp.h:6836
void _Initialize(size_t _Src_data_size, bool _Discard_data=false) __CPU_ONLY
Definition: amp.h:3014
_Array_view_base< _Rank, sizeof(_Value_type)/sizeof(int)> _Base
Definition: amp.h:3036
_Iter_diff_t< _InIt > distance(_InIt _First, _InIt _Last)
Definition: xutility:1124
The tile_barrier class is a capability class that is only creatable by the system, and passed to a tiled parallel_for_each lambda as part of the tiled_index parameter. It provides wait methods whose purpose is to synchronize execution of threads running within the thread group (tile).
Definition: amp.h:948
array(int _E0, int _E1, _InputIterator _Src_first, Concurrency::accelerator_view _Av, Concurrency::accelerator_view _Associated_Av) __CPU_ONLY
Construct a staging array between two associated accelerator_views, initialized from an iterator into a container.
Definition: amp.h:4706
_AMPIMP _Event _Add_event(_Event _Ev)
Creates an event which is an ordered collection of this and _Ev
#define AS_UINT(v)
Definition: amp.h:6547
index< _Rank > & operator*=(int _Rhs) __GPU
Multiplies each element of this index by an integer value.
Definition: amp.h:258
_Ret_ _Value_type * data() __GPU
Returns a pointer to the raw data of this array.
Definition: amp.h:5500
index(int _I0, int _I1) __GPU
Constructor for index<2>
Definition: amp.h:110
void __dp_d3d_tile_static_memory_fence() __GPU_ONLY
extent< _Rank > & operator/=(int _Rhs) __GPU
Divides each element of this extent by an integer value.
Definition: amp.h:715
void _Initialize(Concurrency::accelerator_view _Av, Concurrency::accelerator_view _Associated_Av, _InputIterator _Src_first, _InputIterator _Src_last) __CPU_ONLY
Definition: amp.h:5628
array(int _E0, _InputIterator _Src_first, _InputIterator _Src_last) __CPU_ONLY
Construct an array initialized from a pair of iterators into a container.
Definition: amp.h:4179
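For illustration (sizes and values assumed), such a constructor copies the host range into the array at construction time; the extent-based overload works the same way:

    std::vector<float> src(100, 1.0f);
    array<float, 1> a(100, src.begin(), src.end());            // device array initialized from the vector
    array<float, 2> b(extent<2>(10, 10), src.begin(), src.end());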
int i[4]
Definition: dvec.h:68
std::enable_if< details::_Is_extent_or_index< _Tuple_type< _Rank > >::value, _Tuple_type< _Rank > >::type operator-(const _Tuple_type< _Rank > &_Lhs, const _Tuple_type< _Rank > &_Rhs) __GPU
Definition: amp.h:845
array_view(const Concurrency::extent< _Rank > &_Extent, _In_ _Value_type *_Src) __GPU
Construct an array_view which is bound to the data pointed to by _Src.
Definition: amp.h:3169
array_view< _Value_type, _Rank > section(const index< _Rank > &_Idx) __GPU
Produces a subsection of the source array with origin specified by an index, with an extent of (this->extent - _Idx).
Definition: amp.h:5248
array(int _E0, int _E1, Concurrency::accelerator_view _Av, access_type _Cpu_access_type=access_type_auto) __CPU_ONLY
Construct an array from two integer extents, bound to a specific accelerator_view.
Definition: amp.h:4010
_Array_view_base() __GPU
Definition: amp.h:1695
index() __GPU
Default constructor, initializes all elements with 0.
Definition: amp.h:73
concurrency::completion_future synchronize_to_async(const accelerator_view &_Accl_view, access_type _Access_type=access_type_read) const __CPU_ONLY
Asynchronously synchronizes any modifications made to "this" array_view to the specified accelerator_...
Definition: amp.h:2861
array_view(const Concurrency::extent< _Rank > &_Extent, _Container &_Src) __CPU_ONLY
Construct an array_view which is bound to the data contained in the _Src container.
Definition: amp.h:2310
void copy_to(const array_view< _Value_type, _Rank > &_Dest) const __CPU_ONLY
Copies elements from this array_view to the destination array_view.
Definition: amp.h:3398
tiled_extent & operator=(const tiled_extent &_Other) __GPU
copy-assignment operator
Definition: amp.h:1302
int sign(int _X) __GPU_ONLY
Returns the sign of the argument
Definition: amp.h:7535
void direct3d_printf(const char *,...) __GPU_ONLY
_Access_mode _M_curr_cpu_access_mode
Definition: amprt.h:450
_Array_view_base(const Concurrency::extent< _Rank > &_Array_extent) __CPU_ONLY
Definition: amp.h:1794
#define _In_
Definition: sal.h:305
Definition: xxamp.h:243
index< _Rank > & operator+=(const index< _Rank > &_Rhs) __GPU
Element-wise addition of this index with another index.
Definition: amp.h:198
void _Refresh_data_ptr(_Access_mode _Requested_mode, bool _Exception=true) __CPU_ONLY
Definition: amp.h:5708
index< _Rank > & operator%=(int _Rhs) __GPU
Computes the modulus of each element of this index by an integer value.
Definition: amp.h:288
int _Base_linear_offset() const __GPU
Definition: amp.h:1571
std::enable_if< details::_Is_extent_or_index< _Tuple_type< _Rank > >::value, _Tuple_type< _Rank > >::type operator+(const _Tuple_type< _Rank > &_Lhs, const _Tuple_type< _Rank > &_Rhs) __GPU
Definition: amp.h:836
unsigned int __dp_d3d_reversebitsu(unsigned int) __GPU_ONLY
array(const array_view< const _Value_type, _Rank > &_Src) __CPU_ONLY
Construct an array initialized from an array_view.
Definition: amp.h:4787
Concurrency::extent< _Rank > _M_view_extent
Definition: amp.h:1672
tiled_extent(const Concurrency::extent< rank > &_Other) __GPU
Constructs a new tiled_extent from the supplied extent.
Definition: amp.h:1290
void _Initialize() __GPU
Definition: amp.h:3805
int __dp_d3d_mini(int, int) __GPU_ONLY
float __dp_d3d_rcpf(float) __GPU_ONLY
#define _In_opt_
Definition: sal.h:306
static _Ret_ void * _Create_projection_buffer_shape(const _Buffer_descriptor &, int, int) __GPU_ONLY
Definition: amp.h:2204
unsigned int _Initialize() __CPU_ONLY
Definition: amp.h:5558
array_view< const _Value_type, _New_rank > view_as(const Concurrency::extent< _New_rank > &_View_extent) const __GPU
Produces an array_view of a different rank over this array's data.
Definition: amp.h:5474
tiled_extent(const tiled_extent &_Other) __GPU
Copy constructor. Constructs a new tiled_extent from the supplied argument "_Other".
Definition: amp.h:1383
void synchronize(access_type _Access_type=access_type_read) const __CPU_ONLY
Synchronizes any modifications made to "this" array_view to its source data.
Definition: amp.h:2934
tiled_extent< _Dim0 > tile() const __GPU
Produces a tiled_extent object with the tile extents given by _Dim0.
Definition: amp.h:537
bool _Has_cpu_access() const __CPU_ONLY
Definition: amp.h:5703
#define __CPU_ONLY
Definition: amprt.h:47
void _Unregister(bool _Throw_exception=true) __CPU_ONLY
Definition: amp.h:2056
void synchronize_to(const accelerator_view &_Accl_view, access_type _Access_type=access_type_read) const __CPU_ONLY
Synchronizes any modifications made to "this" array_view to the specified accelerator_view.
Definition: amp.h:2914
void _Initialize_multiplier() __GPU
Definition: amp.h:1660
void _Register() __CPU_ONLY
Definition: amp.h:5634
_Ret_ _Ubiquitous_buffer * _Get_buffer() const __CPU_ONLY
Definition: amp.h:5664
tiled_extent(const tiled_extent &_Other) __GPU
Copy constructor. Constructs a new tiled_extent from the supplied argument "_Other".
Definition: amp.h:1465
array(int _E0, _InputIterator _Src_first) __CPU_ONLY
Construct an array initialized from an iterator.
Definition: amp.h:4196
int value_type
Definition: amp.h:68
__declspec(deprecated("Concurrency::EnableTracing is a deprecated function.")) _CONCRTIMP HRESULT __cdecl EnableTracing()
Enables tracing in the Concurrency Runtime. This function is deprecated because ETW tracing is now on by default.
array_view< _Value_type, _Rank > section(const Concurrency::extent< _Rank > &_Ext) __GPU
Produces a subsection of the source array_view with origin of zero, with an extent of _Ext...
Definition: amp.h:5218
tiled_index< _Dim0, _Dim1, _Dim2 > _map_index(const index< rank > &_Local, const index< rank > &_Tile, const index< rank > &_Global, tile_barrier &_Barrier) const __GPU
Definition: amp.h:1351
Exception thrown due to a C++ AMP runtime_exception. This is the base type for all C++ AMP exception types.
Definition: amprt_exceptions.h:29
array_view section(int _I0, int _I1, int _I2, int _E0, int _E1, int _E2) const __GPU
Produces a three-dimensional subsection of the source array_view with origin specified by the index components.
Definition: amp.h:2790
_CPP_AMP_VERIFY_RANK(_Rank, extent)
Concurrency::extent< _Rank > _M_extent
Definition: amp.h:5749
extent< _Rank > operator+(const index< _Rank > &_Rhs) const __GPU
Element-wise addition of this extent with an index.
Definition: amp.h:578
static void _Is_valid_projection(int _I, const _T1< _Rank > &_Base_extent) __CPU_ONLY
Definition: xxamp.h:1131
array(const Concurrency::extent< _Rank > &_Extent, Concurrency::accelerator_view _Av, access_type _Cpu_access_type=access_type_auto) __CPU_ONLY
Construct an array from extents, bound to a specific accelerator_view.
Definition: amp.h:3962
_Event _Get_access_async(_Access_mode _Mode, _Buffer_ptr &_Buf_ptr, bool _Zero_copy_cpu_access=false) const __CPU_ONLY
Definition: amp.h:5669
struct Concurrency::details::_Buffer_descriptor _Buffer_descriptor
extent< _Rank > & operator+=(const extent< _Rank > &_Rhs) __GPU
Element-wise addition of this extent with another extent.
Definition: amp.h:610
float saturate(float _X) __GPU_ONLY
Clamps _X within the range of 0 to 1
Definition: amp.h:7521
_AMPIMP accelerator __cdecl _Select_default_accelerator()
void parallel_for_each(const extent< _Rank > &_Compute_domain, const _Kernel_type &_Kernel)
Invokes a parallel computation of a kernel function over a compute domain on an accelerator_view. The accelerator_view is determined from the arrays and/or array_views captured by the kernel function, or if no accelerator_view can be derived, the default is chosen.
Definition: amp.h:7020
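A minimal element-wise kernel, sketched with assumed sample data, shows the usual pattern: wrap host containers in array_views, launch over the compute domain, then synchronize the result back.

    std::vector<int> a(8, 1), b(8, 2), c(8);
    array_view<const int, 1> av(8, a), bv(8, b);
    array_view<int, 1> cv(8, c);
    cv.discard_data();                                // hint: old contents of c need not be copied in
    parallel_for_each(cv.extent, [=](index<1> i) restrict(amp) {
        cv[i] = av[i] + bv[i];
    });
    cv.synchronize();                                 // copy the results back into c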
unsigned int _Get_linear_offset() const
Definition: amprt.h:1596
_Ret_ void * _Access(_Access_mode _Requested_mode, const index< _Rank > &_Index) const __CPU_ONLY
Definition: amp.h:1882
array(int _E0, int _E1, int _E2, _InputIterator _Src_first, _InputIterator _Src_last) __CPU_ONLY
Construct an array initialized from a pair of iterators into a container.
Definition: amp.h:4269
_Array_view_base(const _Buffer_descriptor &_Buffer_desc, int _Base_linear_offset, const Concurrency::extent< _Rank > &_Array_extent) __GPU
Definition: amp.h:1745
_Array_flatten_helper< _Rank, typename Concurrency::extent< _Rank >::value_type, typename Concurrency::index< _Rank >::value_type > _Flatten_helper
Definition: amp.h:1555
_Ret_ IUnknown * get_buffer(const array< _Value_type, _Rank > &_Array) __CPU_ONLY
Get the D3D buffer interface underlying an array.
Definition: amp.h:6494
tiled_extent() __GPU
Default constructor.
Definition: amp.h:1372
static void func(_RES_EXT &_ResArrayExtent, const _SRC_EXT &_SrcArrayExtent, _RES_EXT &_ResArrayMultiplier, const _SRC_EXT &_SrcArrayMultiplier, _RES_IDX &_ResViewOffset, const _SRC_IDX &_SrcViewOffset, _RES_EXT &_ResViewExtent, const _SRC_EXT &_SrcViewExtent) __GPU
Definition: xxamp.h:768
array_view< const _Value_type, 1 > section(int _I0, int _E0) const __GPU
Produces a one-dimensional subsection of the source array with origin specified by the index components.
Definition: amp.h:5302
void synchronize_to(const accelerator_view &_Accl_view) const __CPU_ONLY
Synchronizes any modifications made to "this" array_view to the specified accelerator_view.
Definition: amp.h:3737
_AMPIMP _Buffer_ptr _Get_master_buffer() const
extent< _Rank > & operator+=(const index< _Rank > &_Rhs) __GPU
Element-wise addition of this extent with an index.
Definition: amp.h:640
const _Value_type * data() const __GPU
Returns a pointer to the raw data of this array_view.
Definition: amp.h:3672
array_view< const _Value_type, _Rank > section(const index< _Rank > &_Idx) const __GPU
Produces a subsection of the source array with origin specified by an index, with an extent of (this->extent - _Idx).
Definition: amp.h:5264
tiled_index(const tiled_index &_Other) __GPU
Copy Constructor.
Definition: amp.h:1246
int atomic_fetch_xor(_Inout_ int *_Dest, int _Value) __GPU_ONLY
Performs an atomic bitwise xor operation of _Value to the memory location pointed to by _Dest ...
Definition: amp.h:6981
tiled_extent(const Concurrency::extent< rank > &_Other) __GPU
Constructs a new tiled_extent from the supplied extent.
Definition: amp.h:1377
array_view(int _E0, int _E1, int _E2, _In_ _Value_type *_Src) __GPU
Construct an array_view which is bound to the data pointed to by _Src.
Definition: amp.h:2525
array_view section(const Concurrency::extent< _Rank > &_Ext) const __GPU
Produces a subsection of the source array_view with origin of zero, with an extent of _Ext...
Definition: amp.h:2716
_Tiled_index_base(const _Tiled_index_base &_Other) __GPU
Copy Constructor.
Definition: amp.h:1067
array(int _E0, int _E1, int _E2, _InputIterator _Src_first, _InputIterator _Src_last, Concurrency::accelerator_view _Av, Concurrency::accelerator_view _Associated_Av) __CPU_ONLY
Construct a staging array between two associated accelerator_views, initialized from a pair of iterators.
Definition: amp.h:4741
void copy_to(const array_view< _Value_type, _Rank > &_Dest) const __CPU_ONLY
Copies elements from this array to the destination array_view.
Definition: amp.h:4922
_Ret_ _Ubiquitous_buffer * _Get_buffer(const _Array_type &_Array) __CPU_ONLY
Definition: xxamp.h:1069
unsigned int umin(unsigned int _X, unsigned int _Y) __GPU_ONLY
Determine the minimum numeric value of the arguments
Definition: amp.h:7371
array(const Concurrency::extent< _Rank > &_Extent, _InputIterator _Src_first, _InputIterator _Src_last, Concurrency::accelerator_view _Av, Concurrency::accelerator_view _Associated_Av) __CPU_ONLY
Construct a staging array between two associated accelerator_views, initialized from a pair of iterators.
Definition: amp.h:4576
_AMPIMP void _Register_view_copy(_In_ _View_key _New_view_key, _In_ _View_key _Existing_view_key)
_Tiled_index_base(const index< rank > &_Global, const index< rank > &_Local, const index< rank > &_Tile, const index< rank > &_Tile_origin, const tile_barrier &_Barrier) __GPU
A constructor that initializes data members using the given values.
Definition: amp.h:1053
unsigned int countbits(unsigned int _X) __GPU_ONLY
Counts the number of set bits in _X
Definition: amp.h:7275
void copy_to(array< _Value_type, _Rank > &_Dest) const __CPU_ONLY
Copies elements from this array_view to the destination array.
Definition: amp.h:2544
array(const Concurrency::extent< _Rank > &_Extent, _InputIterator _Src_first, _InputIterator _Src_last) __CPU_ONLY
Construct an array initialized from a pair of iterators into a container.
Definition: amp.h:4142
_Array_view_base(const _Buffer_descriptor &_Buffer_desc, int _Base_linear_offset, const Concurrency::extent< _Rank > &_Array_extent, const Concurrency::index< _Rank > &_View_offset, const Concurrency::extent< _Rank > &_View_extent) __CPU_ONLY
Definition: amp.h:1754
unsigned int mad(unsigned int _X, unsigned int _Y, unsigned int _Z) __GPU_ONLY
Performs an arithmetic multiply/add operation on three arguments: _X * _Y + _Z
Definition: amp.h:7451
tiled_extent< _Dim0, _Dim1, _Dim2 > tile() const __GPU
Produces a tiled_extent object with the tile extents given by _Dim0, _Dim1, _Dim2.
Definition: amp.h:559
~array_view() __GPU
Destroys this array_view and reclaims resources.
Definition: amp.h:3058
int __dp_d3d_absi(int) __GPU_ONLY
#define false
Definition: stdbool.h:16
array_view< const _Value_type2, _Rank > reinterpret_as() const __GPU
Produces a (possibly unsafe) reinterpretation of this array_view that is linear and with a different element type.
Definition: amp.h:3650
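A sketch under assumed data: the element types must line up in size, so a view of floats can, for example, be reinterpreted as unsigned int bit patterns over the same storage.

    std::vector<float> f(4, 1.0f);
    array_view<float, 1> fv(4, f);
    // same 16 bytes, now viewed as unsigned ints
    array_view<unsigned int, 1> uv = fv.reinterpret_as<unsigned int>();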
void direct3d_abort() __GPU_ONLY
void __dp_d3d_all_memory_fence() __GPU_ONLY
extent(int _I) __GPU
Constructor for extent<1>.
Definition: amp.h:426
unsigned int __dp_d3d_interlocked_and(_Inout_ unsigned int *, unsigned int) __GPU_ONLY
array(int _E0, int _E1, int _E2, _InputIterator _Src_first, _InputIterator _Src_last, Concurrency::accelerator_view _Av, access_type _Cpu_access_type=access_type_auto) __CPU_ONLY
Construct an array initialized from a pair of iterators into a container, bound to a specific accelerator_view.
Definition: amp.h:4514
array_view(_In_ _Value_type(&_Src)[_Size]) __GPU
Construct an array_view which is bound to the array _Src.
Definition: amp.h:2482
array_view(const Concurrency::extent< _Rank > &_Extent, _Container &_Src) __CPU_ONLY
Construct an array_view which is bound to the data contained in the _Src container.
Definition: amp.h:3136
void copy_to(array< _Value_type, _Rank > &_Dest) const __CPU_ONLY
Copies elements from this array to the destination array.
Definition: amp.h:4914
_AMPIMP void _Unregister_view(_In_ _View_key _Key)
void __dp_d3d_all_memory_fence_with_tile_barrier() __GPU_ONLY
array_view(int _E0, int _E1, const _Value_type *_Src) __GPU
Construct an array_view which is bound to the data pointed to by _Src.
Definition: amp.h:3279
const tile_barrier barrier
An object which represents a barrier within the current tile of threads.
Definition: amp.h:1033
_Ret_ _View_key _Get_view_key()
Definition: amprt.h:537
const index< rank > tile_origin
An index that represents the global coordinates of the origin of the current tile within a tiled_extent.
Definition: amp.h:1028
array_view section(const Concurrency::index< _Rank > &_Section_origin, const Concurrency::extent< _Rank > &_Section_extent) const __GPU
Produces a subsection of the source array_view at the given origin and extent.
Definition: amp.h:3532
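For example (shapes assumed), a section is a shallow sub-view into the same underlying data, so writes through it update the source:

    std::vector<int> m(16, 0);
    array_view<int, 2> av(4, 4, m);
    // 2 x 2 window whose top-left corner is at (1, 1)
    array_view<int, 2> sub = av.section(index<2>(1, 1), extent<2>(2, 2));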
array_view section(const Concurrency::extent< _Rank > &_Ext) const __GPU
Produces a subsection of the source array_view with origin of zero, with an extent of _Ext...
Definition: amp.h:3547
Concurrency::extent< _Rank > _M_array_extent
Definition: amp.h:1668
accelerator_view get_source_accelerator_view() const
Returns the accelerator_view where the data source of the array_view is located. If the array_view does not have a data source, this API throws a runtime_exception.
Definition: amp.h:3770
The extent type represents an N-dimensional vector of int which specifies the bounds of an N-dimensional space.
Definition: amp.h:383
void _Register(_In_opt_ const _View_key _Source_view_key=nullptr) __CPU_ONLY
Definition: amp.h:2007
~_Array_view_base() __GPU
Definition: amp.h:1687
_Array_view_base< _Rank, sizeof(_Value_type)/sizeof(int)> _Base
Definition: amp.h:2238
An array is a multi-dimensional data aggregate on an accelerator_view.
Definition: amp.h:3865
_Array_flatten_helper< _Rank, typename Concurrency::extent< _Rank >::value_type, typename Concurrency::index< _Rank >::value_type > _Flatten_helper
Definition: amp.h:1678
void direct3d_errorf(const char *,...) __GPU_ONLY
void discard_data() const __CPU_ONLY
Discards the current data underlying this view. This is an optimization hint to the runtime, used to avoid copying the current contents of the view to its data source.
Definition: amp.h:2959
#define AS_INT(v)
Definition: amp.h:6548
extent(int _I0, int _I1, int _I2) __GPU
Constructor for extent<3>
Definition: amp.h:460
int abs(int _X) __GPU_ONLY
Returns the absolute value of the argument
Definition: amp.h:7221
index(const int _Array[_Rank]) __GPU
Constructs an index with the coordinate values provided by the array of int component values.
Definition: amp.h:145
void _Unregister(bool=true) __GPU_ONLY
Definition: amp.h:2200
array_view(const _Container &_Src, typename std::enable_if< details::_Is_container< _Container >::type::value, void ** >::type=0) __CPU_ONLY
Construct an array_view which is bound to the data contained in the _Src container; ...
Definition: amp.h:3116
int __dp_d3d_madi(int, int, int) __GPU_ONLY
_AMPIMP ULONG _Launch_async_copy_event_helper(const _Buffer_descriptor &_Src, const _Buffer_descriptor &_Dest, ULONGLONG _Num_bytes_for_copy)
void _Register_copy(const array &_Other) __CPU_ONLY
Definition: amp.h:5651
int value_type
Definition: amp.h:398
unsigned int __dp_d3d_interlocked_min_uint(_Inout_ unsigned int *, unsigned int) __GPU_ONLY
index(const index< _Rank > &_Other) __GPU
Copy Constructor.
Definition: amp.h:84
array(int _E0, int _E1, int _E2, _InputIterator _Src_first) __CPU_ONLY
Construct an array initialized from an iterator.
Definition: amp.h:4292
void * _M_data_ptr
Definition: amprt.h:438
array(const Concurrency::extent< _Rank > &_Extent, Concurrency::accelerator_view _Av, Concurrency::accelerator_view _Associated_Av) __CPU_ONLY
Construct a staging array between two associated accelerator_views.
Definition: amp.h:4058
_Array_view_shape(int _Base_linear_offset, const Concurrency::extent< _Rank > &_Array_extent, const Concurrency::index< _Rank > &_Section_origin, const Concurrency::extent< _Rank > &_Section_extent) __GPU
Definition: amp.h:1609
unsigned int __dp_d3d_interlocked_exchange(_Inout_ unsigned int *, unsigned int) __GPU_ONLY
Definition: amprt.h:94
_Ret_ _View_shape * _Get_buffer_view_shape(const _Buffer_descriptor &_Descriptor)
Definition: amprt.h:3395
array_view & operator=(const array_view &_Other) __GPU
Copy Assignment operator. Shallow copy.
Definition: amp.h:3372
int imin(int _X, int _Y) __GPU_ONLY
Determine the minimum numeric value of the arguments
Definition: amp.h:7337
array(int _E0, int _E1, int _E2, Concurrency::accelerator_view _Av, Concurrency::accelerator_view _Associated_Av) __CPU_ONLY
Construct a staging array between two associated accelerator_views.
Definition: amp.h:4123
_Access_mode
Definition: amprt.h:88
array(int _E0, int _E1, _InputIterator _Src_first, _InputIterator _Src_last) __CPU_ONLY
Construct an array initialized from a pair of iterators into a container.
Definition: amp.h:4222
tiled_extent() __GPU
Default constructor.
Definition: amp.h:1454
array(int _E0, _InputIterator _Src_first, Concurrency::accelerator_view _Av, Concurrency::accelerator_view _Associated_Av)
Construct a staging array between two associated accelerator_views, initialized from an iterator into a container.
Definition: amp.h:4648
const _Buffer_descriptor & _Get_buffer_descriptor(const _Array_type &_Array) __GPU
Definition: xxamp.h:1063
array_view(const array_view &_Other, const Concurrency::index< _Rank > &_Section_origin, const Concurrency::extent< _Rank > &_Section_extent) __GPU
Definition: amp.h:2996
const index< rank > local
An index that represents the relative index within the current tile of a tiled_extent.
Definition: amp.h:1018
array(int _E0, int _E1, _InputIterator _Src_first, _InputIterator _Src_last, Concurrency::accelerator_view _Av, Concurrency::accelerator_view _Associated_Av) __CPU_ONLY
Construct a staging array between two associated accelerator_views, initialized from a pair of iterators.
Definition: amp.h:4680
constexpr auto data(_Container &_Cont) -> decltype(_Cont.data())
Definition: xutility:1513
Definition: xxamp.h:710
float radians(float _X) __GPU_ONLY
Converts _X from degrees to radians
Definition: amp.h:7479
_AMPIMP ULONG _Launch_array_view_synchronize_event_helper(const _Buffer_descriptor &_Buff_desc)
extent< _Rank > operator++(int) __GPU
Post-increments each element of this extent.
Definition: amp.h:754
_AMPIMP ULONG _Start_copy_event_helper(const _Buffer_descriptor &_Src, const _Buffer_descriptor &_Dest, ULONGLONG _Num_bytes_for_copy)
float smoothstep(float _Min, float _Max, float _X) __GPU_ONLY
Returns a smooth Hermite interpolation between 0 and 1, if _X is in the range [_Min, _Max].
Definition: amp.h:7555
tiled_extent pad() const __GPU
Returns a new tiled_extent with extents adjusted up to be evenly divisible by the tile dimensions...
Definition: amp.h:1490
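To illustrate with assumed numbers: pad() rounds the extent up and truncate() rounds it down to a tile-size multiple, which is how a non-divisible domain is usually made legal for a tiled dispatch.

    extent<1> e(70);
    tiled_extent<32> te   = e.tile<32>();
    tiled_extent<32> up   = te.pad();       // extent becomes 96 (next multiple of 32)
    tiled_extent<32> down = te.truncate();  // extent becomes 64 (previous multiple of 32)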
_Array_view_base(_In_ void *_Data, const Concurrency::extent< _Rank > &_Array_extent) __CPU_ONLY
Definition: amp.h:1805
tiled_index(const index< rank > &_Global, const index< rank > &_Local, const index< rank > &_Tile, const index< rank > &_Tile_origin, const tile_barrier &_Barrier) __GPU
A constructor that initializes data members using the given values.
Definition: amp.h:1117
int clamp(int _X, int _Min, int _Max) __GPU_ONLY
Clamps _X to the specified _Min and _Max range
Definition: amp.h:7261
array_view(int _E0, _In_ _Value_type *_Src) __GPU
Construct an array_view which is bound to the data pointed to by _Src.
Definition: amp.h:2469
tiled_extent< _Dim0, _Dim1 > tile() const __GPU
Produces a tiled_extent object with the tile extents given by _Dim0, _Dim1
Definition: amp.h:548
_Array_view_shape & operator=(const _Array_view_shape &_Other) __GPU
Definition: amp.h:1623
_Ret_ _Value_type * data() const __GPU
Returns a pointer to the raw data of this array_view.
Definition: amp.h:2826
extent< _Rank > & operator-=(int _Rhs) __GPU
Subtracts an integer value from each element of this extent.
Definition: amp.h:685
int operator[](unsigned int _Index) const __GPU
Index operator.
Definition: amp.h:499
_Array_view_base(const _Buffer_descriptor &_Buffer_desc, const Concurrency::extent< _Rank > &_Array_extent, const Concurrency::index< _Rank > &_Section_origin, const Concurrency::extent< _Rank > &_Section_extent) __GPU
Definition: amp.h:1784
#define _CPP_AMP_VERIFY_MUTABLE_ITERATOR(_Type_name)
Definition: xxamp.h:27
void copy(const array< _Value_type, _Rank > &_Src, array< _Value_type, _Rank > &_Dest)
Copies the contents of the source array into the destination array.
Definition: amp.h:6008
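A short sketch (sizes assumed) of the synchronous copy overloads, moving data host-to-device and device-to-device:

    std::vector<int> host(8, 7);
    array<int, 1> src(8), dst(8);
    copy(host.begin(), host.end(), src);   // host container -> device array
    copy(src, dst);                        // device array -> device array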
Definition: xxamp.h:228
int _M_total_linear_offset
Definition: amp.h:1671
array_view(int _E0, const _Value_type *_Src) __GPU
Construct an array_view which is bound to the data pointed to by _Src.
Definition: amp.h:3259
array_view(int _E0, const _Container &_Src) __CPU_ONLY
Construct an array_view which is bound to the data contained in the _Src container.
Definition: amp.h:3184
float __dp_d3d_saturatef(float) __GPU_ONLY
Definition: amprt.h:109
~array() __CPU_ONLY noexcept(false)
Destroys this array and reclaims resources.
Definition: amp.h:5525
A tiled_extent is an extent of 1 to 3 dimensions which also subdivides the extent space into 1-, 2-, or 3-dimensional tiles.
Definition: amp.h:1274
int _M_base[_Rank]
Definition: amp.h:359
Definition: xxamp.h:244
int atomic_fetch_and(_Inout_ int *_Dest, int _Value) __GPU_ONLY
Performs an atomic bitwise and operation of _Value to the memory location pointed to by _Dest ...
Definition: amp.h:6908
void advance(_InIt &_Where, _Diff _Off)
Definition: xutility:1089
array_view< const _Value_type, _Rank > section(const Concurrency::index< _Rank > &_Section_origin, const Concurrency::extent< _Rank > &_Section_extent) const __GPU
Produces a subsection of the source array at the given origin and extent.
Definition: amp.h:5202
array_view(int _E0, int _E1, const _Container &_Src) __CPU_ONLY
Construct an array_view which is bound to the data contained in the _Src container.
Definition: amp.h:3218
extent(int _I0, int _I1) __GPU
Constructor for extent<2>
Definition: amp.h:441
array(int _E0, int _E1, _InputIterator _Src_first, Concurrency::accelerator_view _Av, access_type _Cpu_access_type=access_type_auto) __CPU_ONLY
Construct an array initialized from an iterator into a container, bound to a specific accelerator_view.
Definition: amp.h:4475
_AMPIMP ULONG _Start_array_view_synchronize_event_helper(const _Buffer_descriptor &_Buff_desc)
array_view(int _E0, int _E1, int _E2, const _Value_type *_Src) __GPU
Construct an array_view which is bound to the data pointed to by _Src.
Definition: amp.h:3302
array_view< const _Value_type2, 1 > reinterpret_as() const __GPU
Produces a (possibly unsafe) reinterpretation of this array that is linear and with a different element type.
Definition: amp.h:5439
int _Calculate_reinterpreted_size(int _Old_size) __GPU_ONLY
Definition: amp.h:1527
array_view(_Buffer_descriptor &_Src_buffer, const Concurrency::extent< _Rank > &_Extent) __GPU
Definition: amp.h:3002
void _Unregister() __CPU_ONLY
Definition: amp.h:5656
array(int _E0, int _E1, int _E2, _InputIterator _Src_first, Concurrency::accelerator_view _Av, access_type _Cpu_access_type=access_type_auto) __CPU_ONLY
Construct an array initialized from an iterator into a container, bound to a specific accelerator_view.
Definition: amp.h:4547
array_view section(int _I0, int _E0) const __GPU
Produces a one-dimensional subsection of the source array_view with origin specified by the index components.
Definition: amp.h:3580
Definition: amprt.h:105
Definition: amprt.h:90
std::enable_if< details::_Is_extent_or_index< _Tuple_type< _Rank > >::value, bool >::type operator!=(const _Tuple_type< _Rank > &_Lhs, const _Tuple_type< _Rank > &_Rhs) __GPU
Definition: amp.h:829
int atomic_fetch_sub(_Inout_ int *_Dest, int _Value) __GPU_ONLY
Performs an atomic subtraction of _Value from the memory location pointed to by _Dest ...
Definition: amp.h:6599
array(const Concurrency::extent< _Rank > &_Extent, _InputIterator _Src_first, Concurrency::accelerator_view _Av, Concurrency::accelerator_view _Associated_Av) __CPU_ONLY
Construct a staging array between two associated accelerator_views, initialized from an iterator into a container.
Definition: amp.h:4598
details::_Projection_result_type< _Value_type, _Rank >::_Const_result_type operator()(int _I) const __GPU
Projects the most-significant dimension of this array. If the array rank is 1, this produces a single element; otherwise it produces an array_view with one fewer dimension.
Definition: amp.h:5167
_Event _Copy_async_impl(const array_view< _Value_type, _Rank > &_Src, OutputIterator _DestIter)
Definition: amp.h:5933
void copy_to(const array_view< _Value_type, _Rank > &_Dest) const __CPU_ONLY
Copies elements from this array_view to the destination array_view.
Definition: amp.h:2552
int __dp_d3d_firstbithighi(int) __GPU_ONLY
details::_Projection_result_type< _Value_type, _Rank >::_Result_type operator()(int _I) __GPU
Projects the most-significant dimension of this array. If the array rank is 1, this produces a single element; otherwise it produces an array_view with one fewer dimension.
Definition: amp.h:5152
_Ret_ void * _Access(const index< _Rank > &_Index) const __GPU
Definition: amp.h:1876
#define AS_UINT_PTR(p)
Definition: amp.h:6546
Definition: xxamp.h:237
Definition: xxamp.h:233
bool atomic_compare_exchange(_Inout_ int *_Dest, _Inout_ int *_Expected_value, int _Value) __GPU_ONLY
Atomically compares the value pointed to by _Dest for equality with that pointed to by _Expected_value, and if they are equal, replaces it with _Value.
Definition: amp.h:6775
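As a hedged sketch of the usual compare-and-swap retry loop: the library already provides atomic_fetch_max, so this hypothetical helper (atomic_max_via_cas is not part of the header) merely illustrates the pattern.

    // callable only from a restrict(amp) context
    void atomic_max_via_cas(int* dest, int value) restrict(amp) {
        int observed = *dest;
        while (observed < value) {
            // on failure, observed is refreshed with the latest value at dest
            if (atomic_compare_exchange(dest, &observed, value))
                break;   // our value was stored
        }
    }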
array_view(int _E0, int _E1, _In_ _Value_type *_Src) __GPU
Construct an array_view which is bound to the data pointed to by _Src.
Definition: amp.h:3339
_Ret_ _View_shape * _Create_reinterpreted_shape(const _View_shape *_Source_shape, size_t _Curr_elem_size, size_t _New_elem_size)
Definition: amprt.h:1885
extent(const extent< _Rank > &_Other) __GPU
Copy constructor. Constructs a new extent from the supplied argument _Other.
Definition: amp.h:415
unsigned int __dp_d3d_interlocked_compare_exchange(_Inout_ unsigned int *, unsigned int, unsigned int) __GPU_ONLY
int atomic_fetch_inc(_Inout_ int *_Dest) __GPU_ONLY
Performs an atomic increment to the memory location pointed to by _Dest
Definition: amp.h:6643
void global_memory_fence(const tile_barrier &_Barrier) __GPU_ONLY
Ensures that global memory accesses are visible to other threads in the thread tile, and are executed according to program order
Definition: amp.h:7189
_Array_view_base(const _Buffer_descriptor &_Buffer_desc, const _Array_view_shape< _Rank, _Element_size > &_Shape) __GPU
Definition: amp.h:1697
void copy_to(array< _Value_type, _Rank > &_Dest) const __CPU_ONLY
Copies elements from this array_view to the destination array.
Definition: amp.h:3390
array_view section(const Concurrency::index< _Rank > &_Section_origin, const Concurrency::extent< _Rank > &_Section_extent) const __GPU
Produces a subsection of the source array_view at the given origin and extent.
Definition: amp.h:2686
array(int _E0, int _E1) __CPU_ONLY
Construct an array from two integer extents.
Definition: amp.h:3920
_Array_view_base _Section(const Concurrency::index< _Rank > &_Section_origin, const Concurrency::extent< _Rank > &_Section_extent) const __GPU
Definition: amp.h:1897
void _Initialize(Concurrency::accelerator_view _Av, _InputIterator _Src_first, _InputIterator _Src_last, access_type _Cpu_access_type) __CPU_ONLY
Definition: amp.h:5586
array(int _E0, int _E1, Concurrency::accelerator_view _Av, Concurrency::accelerator_view _Associated_Av) __CPU_ONLY
Construct a staging array between two associated accelerator_views.
Definition: amp.h:4098
void _Parallel_for_each(_In_ _Host_Scheduling_info *_Sch_info, extent< _Rank > _Compute_domain, const _Kernel_type &_F)
static _Projection_result_type< _T, _R >::_Result_type _Project0(_In_ array< _T, _R > *_Array, int _I) __GPU
Definition: xxamp_inl.h:73
array(int _E0, _InputIterator _Src_first, _InputIterator _Src_last, Concurrency::accelerator_view _Av, Concurrency::accelerator_view _Associated_Av) __CPU_ONLY
Construct a staging array between two associated accelerator_views, initialized from a pair of iterators.
Definition: amp.h:4625
_Ret_ void * _Access(_Access_mode, const index< _Rank > &_Index) const __GPU_ONLY
Definition: amp.h:1892
#define AS_FLOAT(v)
Definition: amp.h:6549
array_view(int _E0, _In_ _Value_type *_Src) __GPU
Construct an array_view which is bound to the data pointed to by _Src.
Definition: amp.h:3319
int _M_base[_Rank]
Definition: amp.h:806
_AMPIMP _Event __cdecl _Copy_impl(_In_ _Buffer *_Src, size_t _Src_offset, _Out_ _Buffer *_Dst, size_t _Dest_offset, size_t _Num_elems, size_t _Preferred_copy_chunk_num_elems=0)
integral_constant< bool, true > true_type
Definition: xtr1common:40
index< _Rank > & operator=(const index< _Rank > &_Other) __GPU
copy-assignment operator
Definition: amp.h:153
Definition: type_traits:931
extent< _Rank > & operator=(const extent< _Rank > &_Other) __GPU
copy-assignment operator
Definition: amp.h:484
index(int _I) __GPU
Constructor for index<1>
Definition: amp.h:95
Define an N-dimensional index point; which may also be viewed as a vector based at the origin in N-sp...
Definition: amp.h:53
array_view(int _E0, int _E1, int _E2, _In_ _Value_type *_Src) __GPU
Construct an array_view which is bound to the data pointed to by _Src.
Definition: amp.h:3362
Definition: xxamp.h:241
#define _Inout_
Definition: sal.h:375
void _Register(_In_ void *_Shape) __CPU_ONLY
Definition: amp.h:2031
_Array_view_base(const _Array_view_base &_Other) __GPU
Definition: amp.h:1706
exception_ptr current_exception() _NOEXCEPT
Definition: exception:359
array(const Concurrency::extent< _Rank > &_Extent, _InputIterator _Src_first) __CPU_ONLY
Construct an array initialized from an iterator.
Definition: amp.h:4158
tiled_index(const index< rank > &_Global, const index< rank > &_Local, const index< rank > &_Tile, const index< rank > &_Tile_origin, const tile_barrier &_Barrier) __GPU
A constructor that initializes data members using the given values.
Definition: amp.h:1232
void _Register(_In_ void *) __GPU_ONLY
Definition: amp.h:2196
array & operator=(const array_view< const _Value_type, _Rank > &_Src) __CPU_ONLY
Assignment operator from an array_view
Definition: amp.h:4905
static _AMPIMP accelerator_view __cdecl get_auto_selection_view()
Returns the auto selection accelerator_view, which when specified as the parallel_for_each target results in the runtime automatically selecting the target accelerator_view for executing the kernel.
concurrency::completion_future synchronize_async() const __CPU_ONLY
Asynchronously synchronizes any modifications made to "this" array_view to its source data...
Definition: amp.h:3715
tiled_extent truncate() const __GPU
Returns a new tiled_extent with extents adjusted down to be evenly divisible by the tile dimensions...
Definition: amp.h:1333
array(int _E0, int _E1, _InputIterator _Src_first, _InputIterator _Src_last, Concurrency::accelerator_view _Av, access_type _Cpu_access_type=access_type_auto) __CPU_ONLY
Construct an array initialized from a pair of iterators into a container, bound to a specific accelerator_view.
Definition: amp.h:4445
_Ret_ _Ubiquitous_buffer * _Get_buffer_ptr() const __CPU_ONLY
Definition: amprt.h:503
int operator[](unsigned _Index) const __GPU
Index operator.
Definition: amp.h:168
static _Projection_result_type< _T, _R >::_Const_result_type _Project0(const array_view< const _T, _R > *_Arr_view, int _I) __GPU
Definition: xxamp_inl.h:33
Definition: amprt.h:318
void _Initialize(size_t _Src_data_size) __CPU_ONLY
Definition: amp.h:3811
void __dp_d3d_device_memory_fence_with_tile_barrier() __GPU_ONLY
_Access_mode _Get_synchronize_access_mode(access_type cpu_access_type)
Definition: amprt.h:1927
extent< _Rank > & operator-=(const extent< _Rank > &_Rhs) __GPU
Element-wise subtraction of this extent with another extent.
Definition: amp.h:625
_Array_view_base(const void *_Data, const Concurrency::extent< _Rank > &_Array_extent) __GPU_ONLY
Definition: amp.h:1843
extent< _Rank > & operator-=(const index< _Rank > &_Rhs) __GPU
Element-wise subtraction of this extent with an index.
Definition: amp.h:655
void wait_with_global_memory_fence() const __GPU_ONLY
Blocks execution of all threads in a tile until all threads in the tile have reached this call...
Definition: amp.h:983
Definition: type_traits:950
_Value_type value_type
Definition: amp.h:3884
Concurrency::index< _Rank > _M_view_offset
Definition: amp.h:1670
Class represents an accelerator abstraction for C++ AMP data-parallel devices.
Definition: amprt.h:1013
std::enable_if< details::_Is_extent_or_index< _Tuple_type< _Rank > >::value, _Tuple_type< _Rank > >::type operator%(const _Tuple_type< _Rank > &_Lhs, typename _Tuple_type< _Rank >::value_type _Rhs) __GPU
Definition: amp.h:926
Definition: amprt.h:106
Definition: xxamp.h:235
unsigned int __dp_d3d_interlocked_max_uint(_Inout_ unsigned int *, unsigned int) __GPU_ONLY
const _Value_type value_type
Definition: amp.h:3053
void __dp_d3d_device_memory_fence() __GPU_ONLY
_Array_view_base & operator=(const _Array_view_base &_Other) __GPU
Definition: amp.h:1856
Definition: amprt.h:92
tiled_index< _Dim0 > _map_index(const index< rank > &_Local, const index< rank > &_Tile, const index< rank > &_Global, tile_barrier &_Barrier) const __GPU
Definition: amp.h:1515
#define INT_MAX
Definition: limits.h:35
An array_view is an N-dimensional view over data held in another container (such as array<T,N>).
Definition: amp.h:2236
array_view(int _E0, int _E1) __CPU_ONLY
Construct an array_view which is not bound to a data source.
Definition: amp.h:2390
void wait_with_tile_static_memory_fence() const __GPU_ONLY
Blocks execution of all threads in a tile until all threads in the tile have reached this call...
Definition: amp.h:992
array(int _E0, int _E1, _InputIterator _Src_first) __CPU_ONLY
Construct an array initialized from an iterator.
Definition: amp.h:4242
array_view(_Container &_Src, typename std::enable_if< details::_Is_container< _Container >::type::value, void ** >::type=0) __CPU_ONLY
Construct an array_view which is bound to the data contained in the _Src container.
Definition: amp.h:2353
array_view< _Value_type, 2 > section(int _I0, int _I1, int _E0, int _E1) __GPU
Produces a two-dimensional subsection of the source array with origin specified by the index components.
Definition: amp.h:5327
#define __GPU_ONLY
Definition: amprt.h:46
_Array_view_base _Section(const index< _Rank > &_Idx) const __GPU
Definition: amp.h:1907
void _Project0(int _I, _Array_view_shape< _Rank-1, _Element_size > &_Projected_shape) const __GPU
Definition: amp.h:1633
Definition: xxamp.h:234
array_view< _Value_type, _New_rank > view_as(const Concurrency::extent< _New_rank > &_View_extent) const __GPU
Produces an array_view of a different rank over this array_view's data.
Definition: amp.h:2818
int imax(int _X, int _Y) __GPU_ONLY
Determine the maximum numeric value of the arguments
Definition: amp.h:7320
bool _Is_cpu_accelerator(const accelerator &_Accl)
Definition: amprt.h:3401
array_view(int _E0, int _E1, _In_ _Value_type *_Src) __GPU
Construct an array_view which is bound to the data pointed to by _Src.
Definition: amp.h:2502
int __dp_d3d_signi(int) __GPU_ONLY
void wait() const __GPU_ONLY
Blocks execution of all threads in a tile until all threads in the tile have reached this call...
Definition: amp.h:965
array_view(int _E0, int _E1, int _E2, _Container &_Src) __CPU_ONLY
Construct an array_view which is bound to the data contained in the _Src container.
Definition: amp.h:2451
unsigned int __dp_d3d_countbitsu(unsigned int) __GPU_ONLY
array_view(const Concurrency::extent< _Rank > &_Extent, const _Container &_Src) __CPU_ONLY
Construct an array_view which is bound to the data contained in the _Src container.
Definition: amp.h:3099
tiled_index(const tiled_index &_Other) __GPU
Copy Constructor.
Definition: amp.h:1189
Definition: amprt.h:1581
array_view & operator=(const array_view &_Other) __GPU
Copy Assignment operator. Shallow copy.
Definition: amp.h:2535
_In_ int _Value
Definition: setjmp.h:173
int atomic_fetch_add(_Inout_ int *_Dest, int _Value) __GPU_ONLY
Performs an atomic addition of _Value to the memory location pointed to by _Dest
Definition: amp.h:6563
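A common use is a data-parallel histogram, sketched here with an assumed bucket count and input values in [0, 16):

    std::vector<int> data(1024, 3);               // assume values in [0, 16)
    std::vector<int> hist(16, 0);
    array_view<const int, 1> dv(1024, data);
    array_view<int, 1> hv(16, hist);
    parallel_for_each(dv.extent, [=](index<1> i) restrict(amp) {
        atomic_fetch_add(&hv[dv[i]], 1);          // concurrent increments are race-free
    });
    hv.synchronize();                             // hist[3] == 1024 afterwards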
_Array_view_shape() __GPU
Definition: amp.h:1652
array_view section(int _I0, int _I1, int _I2, int _E0, int _E1, int _E2) const __GPU
Produces a three-dimensional subsection of the source array_view with origin specified by the index components.
Definition: amp.h:3636
array_view section(const Concurrency::index< _Rank > &_Idx) const __GPU
Produces a subsection of the source array_view with origin specified by an index, with an extent of (this->extent - _Idx).
Definition: amp.h:2701
extent< _Rank > operator--(int) __GPU
Post-decrements each element of this extent.
Definition: amp.h:779
index< _Rank > _map_index(const index< _Rank > &_Index) const __GPU
Definition: amp.h:789
tile_barrier(const tile_barrier &_Other) __GPU
Copy Constructor. The tile_barrier class does not have a public default constructor or assignment operator.
Definition: amp.h:959
_Array_view_shape(const _Array_view_shape &_Other, const Concurrency::index< _Rank > &_Section_origin, const Concurrency::extent< _Rank > &_Section_extent) __GPU
Definition: amp.h:1587
void _Initialize() __GPU
Definition: amp.h:3008
_Value_type & get_ref(const index< _Rank > &_Index) const __GPU
Get a reference to the element indexed by _Index. Unlike the other indexing operators for accessing the array_view on the CPU, this method does not implicitly synchronize this array_view's contents to the CPU.
Definition: amp.h:2585
float __dp_d3d_noisef(float) __GPU_ONLY
array_view< const _Value_type, 2 > section(int _I0, int _I1, int _E0, int _E1) const __GPU
Produces a two-dimensional subsection of the source array with origin specified by the index components.
Definition: amp.h:5352
_CPP_AMP_VERIFY_RANK(_Rank, tiled_index)
details::_Projection_result_type< _Value_type, _Rank >::_Const_result_type operator[](int _I) const __GPU
Projects the most-significant dimension of this array. If the array rank is 1, this produces a single element; otherwise it produces an array_view with one fewer dimension.
Definition: amp.h:5031
_Size
Definition: vcruntime_string.h:36
static _Ret_ void * _Create_projection_buffer_shape(const _Buffer_descriptor &_Descriptor, unsigned int _Dim, int _Dim_offset) __CPU_ONLY
Definition: amp.h:2074
unsigned int __dp_d3d_minu(unsigned int, unsigned int) __GPU_ONLY
_AMPIMP void _Write_end_event(ULONG _Span_id)
unsigned int _Get_rank() const
Definition: amprt.h:1591
tiled_extent pad() const __GPU
Returns a new tiled_extent with extents adjusted up to be evenly divisible by the tile dimensions...
Definition: amp.h:1321
#define _Ret_
Definition: sal.h:996
concurrency::completion_future copy_async(const array< _Value_type, _Rank > &_Src, array< _Value_type, _Rank > &_Dest)
Asynchronously copies the contents of the source array into the destination array.
Definition: amp.h:5988
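Sketch (sizes assumed): the returned completion_future lets the host overlap work with the transfer and harvest any exception at the end.

    array<float, 1> src(1024), dst(1024);
    completion_future f = copy_async(src, dst);
    // ... do unrelated host work while the copy is in flight ...
    f.get();   // blocks until done; rethrows any exception from the copy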
extent< _Rank > & operator*=(int _Rhs) __GPU
Multiplies each element of this extent by an integer value.
Definition: amp.h:700
concurrency::completion_future _Start_async_op_wait_event_helper(ULONG _Async_op_id, _Event _Ev)
Definition: amprt.h:3753
int __dp_d3d_interlocked_max_int(_Inout_ int *, int) __GPU_ONLY
int firstbithigh(int _X) __GPU_ONLY
Gets the location of the first set bit in _X, starting from the highest-order bit and working downward.
Definition: amp.h:7289
std::enable_if< details::_Is_extent_or_index< _Tuple_type< _Rank > >::value, _Tuple_type< _Rank > >::type operator/(const _Tuple_type< _Rank > &_Lhs, typename _Tuple_type< _Rank >::value_type _Rhs) __GPU
Definition: amp.h:908
float __dp_d3d_stepf(float, float) __GPU_ONLY
access_type
Enumeration type used to denote the various types of access to data.
Definition: amprt.h:103
_Array_view_base(const _Array_view_base &_Other, const Concurrency::extent< _Rank > &_Array_extent) __GPU
Definition: amp.h:1718
bool contains(const index< rank > &_Index) const __GPU
Tests whether the index "_Index" is properly contained within this extent.
Definition: amp.h:529
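For instance, containment means every coordinate lies in [0, extent[i]):

    extent<2> e(4, 8);
    bool in  = e.contains(index<2>(3, 7));   // true: 3 < 4 and 7 < 8
    bool out = e.contains(index<2>(4, 0));   // false: 4 is not < 4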
array(const array_view< const _Value_type, _Rank > &_Src, accelerator_view _Av, accelerator_view _Associated_Av) __CPU_ONLY
Construct a staging array between two associated accelerator_views, initialized from an array_view...
Definition: amp.h:4829
tiled_extent truncate() const __GPU
Returns a new tiled_extent with extents adjusted down to be evenly divisible by the tile dimensions...
Definition: amp.h:1418
tiled_index(const index< rank > &_Global, const index< rank > &_Local, const index< rank > &_Tile, const index< rank > &_Tile_origin, const tile_barrier &_Barrier) __GPU
A constructor that initializes data members using the given values.
Definition: amp.h:1175
array(int _E0, Concurrency::accelerator_view _Av, access_type _Cpu_access_type=access_type_auto) __CPU_ONLY
Construct array with the extent _E0, bound to a specific accelerator_view.
Definition: amp.h:3984
float step(float _Y, float _X) __GPU_ONLY
Compares two values, returning 0 or 1 based on which value is greater
Definition: amp.h:7572
array_view< _Value_type, _New_rank > view_as(const Concurrency::extent< _New_rank > &_View_extent) __GPU
Produces an array_view of a different rank over this array's data.
Definition: amp.h:5460
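A quick sketch (shapes assumed): the element count must match, so a 12-element array can be viewed as 3 x 4 without copying.

    array<int, 1> a(12);
    array_view<int, 2> av = a.view_as(extent<2>(3, 4));   // same data, rank-2 view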
static _Projection_result_type< _T, _R >::_Const_result_type _Project0(const array< _T, _R > *_Array, int _I) __GPU
Definition: xxamp_inl.h:65
index(int _I0, int _I1, int _I2) __GPU
Constructor for index<3>
Definition: amp.h:129
int atomic_fetch_min(_Inout_ int *_Dest, int _Value) __GPU_ONLY
Atomically computes the minimum of _Value and the value of the memory location pointed to by _Dest...
Definition: amp.h:6873
array(int _E0, int _E1, int _E2, _InputIterator _Src_first, Concurrency::accelerator_view _Av, Concurrency::accelerator_view _Associated_Av) __CPU_ONLY
Construct a staging array between two associated accelerator_views, initialized from an iterator into a container.
Definition: amp.h:4770
array_view(const array_view< const _Value_type, _Rank > &_Src) __GPU
Copy constructor. Shallow copy.
Definition: amp.h:3085
array_view(int _E0, int _E1, _Container &_Src) __CPU_ONLY
Construct an array_view which is bound to the data contained in the _Src container.
Definition: amp.h:2409
void tile_static_memory_fence(const tile_barrier &_Barrier) __GPU_ONLY
Ensures that tile_static memory accesses are visible to other threads in the thread tile...
Definition: amp.h:7200
const _Value_type & get_ref(const index< _Rank > &_Index) const __GPU
Get a reference to the element indexed by _Index. Unlike the other indexing operators for accessing the array_view on the CPU, this method does not implicitly synchronize this array_view's contents to the CPU.
Definition: amp.h:3431
array_view(const Concurrency::extent< _Rank > &_Extent, const _Value_type *_Src) __GPU
Construct an array_view which is bound to the data pointed to by _Src.
Definition: amp.h:3153