Home | History | Annotate | Download | only in include

Lines Matching refs:__local

7628 float __ovld fract(float x, __local float *iptr);
7629 float2 __ovld fract(float2 x, __local float2 *iptr);
7630 float3 __ovld fract(float3 x, __local float3 *iptr);
7631 float4 __ovld fract(float4 x, __local float4 *iptr);
7632 float8 __ovld fract(float8 x, __local float8 *iptr);
7633 float16 __ovld fract(float16 x, __local float16 *iptr);
7647 double __ovld fract(double x, __local double *iptr);
7648 double2 __ovld fract(double2 x, __local double2 *iptr);
7649 double3 __ovld fract(double3 x, __local double3 *iptr);
7650 double4 __ovld fract(double4 x, __local double4 *iptr);
7651 double8 __ovld fract(double8 x, __local double8 *iptr);
7652 double16 __ovld fract(double16 x, __local double16 *iptr);
7667 half __ovld fract(half x, __local half *iptr);
7668 half2 __ovld fract(half2 x, __local half2 *iptr);
7669 half3 __ovld fract(half3 x, __local half3 *iptr);
7670 half4 __ovld fract(half4 x, __local half4 *iptr);
7671 half8 __ovld fract(half8 x, __local half8 *iptr);
7672 half16 __ovld fract(half16 x, __local half16 *iptr);
7718 float __ovld frexp(float x, __local int *exp);
7719 float2 __ovld frexp(float2 x, __local int2 *exp);
7720 float3 __ovld frexp(float3 x, __local int3 *exp);
7721 float4 __ovld frexp(float4 x, __local int4 *exp);
7722 float8 __ovld frexp(float8 x, __local int8 *exp);
7723 float16 __ovld frexp(float16 x, __local int16 *exp);
7737 double __ovld frexp(double x, __local int *exp);
7738 double2 __ovld frexp(double2 x, __local int2 *exp);
7739 double3 __ovld frexp(double3 x, __local int3 *exp);
7740 double4 __ovld frexp(double4 x, __local int4 *exp);
7741 double8 __ovld frexp(double8 x, __local int8 *exp);
7742 double16 __ovld frexp(double16 x, __local int16 *exp);
7757 half __ovld frexp(half x, __local int *exp);
7758 half2 __ovld frexp(half2 x, __local int2 *exp);
7759 half3 __ovld frexp(half3 x, __local int3 *exp);
7760 half4 __ovld frexp(half4 x, __local int4 *exp);
7761 half8 __ovld frexp(half8 x, __local int8 *exp);
7762 half16 __ovld frexp(half16 x, __local int16 *exp);
7925 float __ovld lgamma_r(float x, __local int *signp);
7926 float2 __ovld lgamma_r(float2 x, __local int2 *signp);
7927 float3 __ovld lgamma_r(float3 x, __local int3 *signp);
7928 float4 __ovld lgamma_r(float4 x, __local int4 *signp);
7929 float8 __ovld lgamma_r(float8 x, __local int8 *signp);
7930 float16 __ovld lgamma_r(float16 x, __local int16 *signp);
7944 double __ovld lgamma_r(double x, __local int *signp);
7945 double2 __ovld lgamma_r(double2 x, __local int2 *signp);
7946 double3 __ovld lgamma_r(double3 x, __local int3 *signp);
7947 double4 __ovld lgamma_r(double4 x, __local int4 *signp);
7948 double8 __ovld lgamma_r(double8 x, __local int8 *signp);
7949 double16 __ovld lgamma_r(double16 x, __local int16 *signp);
7964 half __ovld lgamma_r(half x, __local int *signp);
7965 half2 __ovld lgamma_r(half2 x, __local int2 *signp);
7966 half3 __ovld lgamma_r(half3 x, __local int3 *signp);
7967 half4 __ovld lgamma_r(half4 x, __local int4 *signp);
7968 half8 __ovld lgamma_r(half8 x, __local int8 *signp);
7969 half16 __ovld lgamma_r(half16 x, __local int16 *signp);
8231 float __ovld modf(float x, __local float *iptr);
8232 float2 __ovld modf(float2 x, __local float2 *iptr);
8233 float3 __ovld modf(float3 x, __local float3 *iptr);
8234 float4 __ovld modf(float4 x, __local float4 *iptr);
8235 float8 __ovld modf(float8 x, __local float8 *iptr);
8236 float16 __ovld modf(float16 x, __local float16 *iptr);
8250 double __ovld modf(double x, __local double *iptr);
8251 double2 __ovld modf(double2 x, __local double2 *iptr);
8252 double3 __ovld modf(double3 x, __local double3 *iptr);
8253 double4 __ovld modf(double4 x, __local double4 *iptr);
8254 double8 __ovld modf(double8 x, __local double8 *iptr);
8255 __local double16 *iptr);
8270 half __ovld modf(half x, __local half *iptr);
8271 half2 __ovld modf(half2 x, __local half2 *iptr);
8272 half3 __ovld modf(half3 x, __local half3 *iptr);
8273 half4 __ovld modf(half4 x, __local half4 *iptr);
8274 half8 __ovld modf(half8 x, __local half8 *iptr);
8275 half16 __ovld modf(half16 x, __local half16 *iptr);
8492 float __ovld remquo(float x, float y, __local int *quo);
8493 float2 __ovld remquo(float2 x, float2 y, __local int2 *quo);
8494 float3 __ovld remquo(float3 x, float3 y, __local int3 *quo);
8495 float4 __ovld remquo(float4 x, float4 y, __local int4 *quo);
8496 float8 __ovld remquo(float8 x, float8 y, __local int8 *quo);
8497 float16 __ovld remquo(float16 x, float16 y, __local int16 *quo);
8511 double __ovld remquo(double x, double y, __local int *quo);
8512 double2 __ovld remquo(double2 x, double2 y, __local int2 *quo);
8513 double3 __ovld remquo(double3 x, double3 y, __local int3 *quo);
8514 double4 __ovld remquo(double4 x, double4 y, __local int4 *quo);
8515 double8 __ovld remquo(double8 x, double8 y, __local int8 *quo);
8516 double16 __ovld remquo(double16 x, double16 y, __local int16 *quo);
8531 half __ovld remquo(half x, half y, __local int *quo);
8532 half2 __ovld remquo(half2 x, half2 y, __local int2 *quo);
8533 half3 __ovld remquo(half3 x, half3 y, __local int3 *quo);
8534 half4 __ovld remquo(half4 x, half4 y, __local int4 *quo);
8535 half8 __ovld remquo(half8 x, half8 y, __local int8 *quo);
8536 half16 __ovld remquo(half16 x, half16 y, __local int16 *quo);
8715 float __ovld sincos(float x, __local float *cosval);
8716 float2 __ovld sincos(float2 x, __local float2 *cosval);
8717 float3 __ovld sincos(float3 x, __local float3 *cosval);
8718 float4 __ovld sincos(float4 x, __local float4 *cosval);
8719 float8 __ovld sincos(float8 x, __local float8 *cosval);
8720 float16 __ovld sincos(float16 x, __local float16 *cosval);
8734 double __ovld sincos(double x, __local double *cosval);
8735 double2 __ovld sincos(double2 x, __local double2 *cosval);
8736 double3 __ovld sincos(double3 x, __local double3 *cosval);
8737 double4 __ovld sincos(double4 x, __local double4 *cosval);
8738 double8 __ovld sincos(double8 x, __local double8 *cosval);
8739 double16 __ovld sincos(double16 x, __local double16 *cosval);
8754 half __ovld sincos(half x, __local half *cosval);
8755 half2 __ovld sincos(half2 x, __local half2 *cosval);
8756 half3 __ovld sincos(half3 x, __local half3 *cosval);
8757 half4 __ovld sincos(half4 x, __local half4 *cosval);
8758 half8 __ovld sincos(half8 x, __local half8 *cosval);
8759 half16 __ovld sincos(half16 x, __local half16 *cosval);
11721 char2 __ovld vload2(size_t offset, const __local char *p);
11722 uchar2 __ovld vload2(size_t offset, const __local uchar *p);
11723 short2 __ovld vload2(size_t offset, const __local short *p);
11724 ushort2 __ovld vload2(size_t offset, const __local ushort *p);
11725 int2 __ovld vload2(size_t offset, const __local int *p);
11726 uint2 __ovld vload2(size_t offset, const __local uint *p);
11727 long2 __ovld vload2(size_t offset, const __local long *p);
11728 ulong2 __ovld vload2(size_t offset, const __local ulong *p);
11729 float2 __ovld vload2(size_t offset, const __local float *p);
11730 char3 __ovld vload3(size_t offset, const __local char *p);
11731 uchar3 __ovld vload3(size_t offset, const __local uchar *p);
11732 short3 __ovld vload3(size_t offset, const __local short *p);
11733 ushort3 __ovld vload3(size_t offset, const __local ushort *p);
11734 int3 __ovld vload3(size_t offset, const __local int *p);
11735 uint3 __ovld vload3(size_t offset, const __local uint *p);
11736 long3 __ovld vload3(size_t offset, const __local long *p);
11737 ulong3 __ovld vload3(size_t offset, const __local ulong *p);
11738 float3 __ovld vload3(size_t offset, const __local float *p);
11739 char4 __ovld vload4(size_t offset, const __local char *p);
11740 uchar4 __ovld vload4(size_t offset, const __local uchar *p);
11741 short4 __ovld vload4(size_t offset, const __local short *p);
11742 ushort4 __ovld vload4(size_t offset, const __local ushort *p);
11743 int4 __ovld vload4(size_t offset, const __local int *p);
11744 uint4 __ovld vload4(size_t offset, const __local uint *p);
11745 long4 __ovld vload4(size_t offset, const __local long *p);
11746 ulong4 __ovld vload4(size_t offset, const __local ulong *p);
11747 float4 __ovld vload4(size_t offset, const __local float *p);
11748 char8 __ovld vload8(size_t offset, const __local char *p);
11749 uchar8 __ovld vload8(size_t offset, const __local uchar *p);
11750 short8 __ovld vload8(size_t offset, const __local short *p);
11751 ushort8 __ovld vload8(size_t offset, const __local ushort *p);
11752 int8 __ovld vload8(size_t offset, const __local int *p);
11753 uint8 __ovld vload8(size_t offset, const __local uint *p);
11754 long8 __ovld vload8(size_t offset, const __local long *p);
11755 ulong8 __ovld vload8(size_t offset, const __local ulong *p);
11756 float8 __ovld vload8(size_t offset, const __local float *p);
11757 char16 __ovld vload16(size_t offset, const __local char *p);
11758 uchar16 __ovld vload16(size_t offset, const __local uchar *p);
11759 short16 __ovld vload16(size_t offset, const __local short *p);
11760 ushort16 __ovld vload16(size_t offset, const __local ushort *p);
11761 __local int *p);
11762 uint16 __ovld vload16(size_t offset, const __local uint *p);
11763 long16 __ovld vload16(size_t offset, const __local long *p);
11764 ulong16 __ovld vload16(size_t offset, const __local ulong *p);
11765 float16 __ovld vload16(size_t offset, const __local float *p);
11818 double2 __ovld vload2(size_t offset, const __local double *p);
11819 double3 __ovld vload3(size_t offset, const __local double *p);
11820 double4 __ovld vload4(size_t offset, const __local double *p);
11821 double8 __ovld vload8(size_t offset, const __local double *p);
11822 double16 __ovld vload16(size_t offset, const __local double *p);
11837 half __ovld vload(size_t offset, const __local half *p);
11838 half2 __ovld vload2(size_t offset, const __local half *p);
11839 half3 __ovld vload3(size_t offset, const __local half *p);
11840 half4 __ovld vload4(size_t offset, const __local half *p);
11841 half8 __ovld vload8(size_t offset, const __local half *p);
11842 half16 __ovld vload16(size_t offset, const __local half *p);
11959 void __ovld vstore2(char2 data, size_t offset, __local char *p);
11960 void __ovld vstore2(uchar2 data, size_t offset, __local uchar *p);
11961 void __ovld vstore2(short2 data, size_t offset, __local short *p);
11962 void __ovld vstore2(ushort2 data, size_t offset, __local ushort *p);
11963 void __ovld vstore2(int2 data, size_t offset, __local int *p);
11964 void __ovld vstore2(uint2 data, size_t offset, __local uint *p);
11965 void __ovld vstore2(long2 data, size_t offset, __local long *p);
11966 void __ovld vstore2(ulong2 data, size_t offset, __local ulong *p);
11967 void __ovld vstore2(float2 data, size_t offset, __local float *p);
11968 void __ovld vstore3(char3 data, size_t offset, __local char *p);
11969 void __ovld vstore3(uchar3 data, size_t offset, __local uchar *p);
11970 void __ovld vstore3(short3 data, size_t offset, __local short *p);
11971 void __ovld vstore3(ushort3 data, size_t offset, __local ushort *p);
11972 void __ovld vstore3(int3 data, size_t offset, __local int *p);
11973 void __ovld vstore3(uint3 data, size_t offset, __local uint *p);
11974 void __ovld vstore3(long3 data, size_t offset, __local long *p);
11975 void __ovld vstore3(ulong3 data, size_t offset, __local ulong *p);
11976 void __ovld vstore3(float3 data, size_t offset, __local float *p);
11977 void __ovld vstore4(char4 data, size_t offset, __local char *p);
11978 void __ovld vstore4(uchar4 data, size_t offset, __local uchar *p);
11979 void __ovld vstore4(short4 data, size_t offset, __local short *p);
11980 void __ovld vstore4(ushort4 data, size_t offset, __local ushort *p);
11981 void __ovld vstore4(int4 data, size_t offset, __local int *p);
11982 void __ovld vstore4(uint4 data, size_t offset, __local uint *p);
11983 void __ovld vstore4(long4 data, size_t offset, __local long *p);
11984 void __ovld vstore4(ulong4 data, size_t offset, __local ulong *p);
11985 void __ovld vstore4(float4 data, size_t offset, __local float *p);
11986 void __ovld vstore8(char8 data, size_t offset, __local char *p);
11987 void __ovld vstore8(uchar8 data, size_t offset, __local uchar *p);
11988 void __ovld vstore8(short8 data, size_t offset, __local short *p);
11989 void __ovld vstore8(ushort8 data, size_t offset, __local ushort *p);
11990 void __ovld vstore8(int8 data, size_t offset, __local int *p);
11991 void __ovld vstore8(uint8 data, size_t offset, __local uint *p);
11992 void __ovld vstore8(long8 data, size_t offset, __local long *p);
11993 void __ovld vstore8(ulong8 data, size_t offset, __local ulong *p);
11994 void __ovld vstore8(float8 data, size_t offset, __local float *p);
11995 void __ovld vstore16(char16 data, size_t offset, __local char *p);
11996 void __ovld vstore16(uchar16 data, size_t offset, __local uchar *p);
11997 void __ovld vstore16(short16 data, size_t offset, __local short *p);
11998 void __ovld vstore16(ushort16 data, size_t offset, __local ushort *p);
11999 void __ovld vstore16(int16 data, size_t offset, __local int *p);
12000 void __ovld vstore16(uint16 data, size_t offset, __local uint *p);
12001 void __ovld vstore16(long16 data, size_t offset, __local long *p);
12002 void __ovld vstore16(ulong16 data, size_t offset, __local ulong *p);
12003 void __ovld vstore16(float16 data, size_t offset, __local float *p);
12055 void __ovld vstore2(double2 data, size_t offset, __local double *p);
12056 void __ovld vstore3(double3 data, size_t offset, __local double *p);
12057 void __ovld vstore4(double4 data, size_t offset, __local double *p);
12058 void __ovld vstore8(double8 data, size_t offset, __local double *p);
12059 void __ovld vstore16(double16 data, size_t offset, __local double *p);
12073 void __ovld vstore(half data, size_t offset, __local half *p);
12074 void __ovld vstore2(half2 data, size_t offset, __local half *p);
12075 void __ovld vstore3(half3 data, size_t offset, __local half *p);
12076 void __ovld vstore4(half4 data, size_t offset, __local half *p);
12077 void __ovld vstore8(half8 data, size_t offset, __local half *p);
12078 void __ovld vstore16(half16 data, size_t offset, __local half *p);
12101 float __ovld vload_half(size_t offset, const __local half *p);
12130 float2 __ovld vload_half2(size_t offset, const __local half *p);
12131 float3 __ovld vload_half3(size_t offset, const __local half *p);
12132 float4 __ovld vload_half4(size_t offset, const __local half *p);
12133 float8 __ovld vload_half8(size_t offset, const __local half *p);
12134 float16 __ovld vload_half16(size_t offset, const __local half *p);
12172 void __ovld vstore_half(float data, size_t offset, __local half *p);
12173 void __ovld vstore_half_rte(float data, size_t offset, __local half *p);
12174 void __ovld vstore_half_rtz(float data, size_t offset, __local half *p);
12175 void __ovld vstore_half_rtp(float data, size_t offset, __local half *p);
12176 void __ovld vstore_half_rtn(float data, size_t offset, __local half *p);
12188 void __ovld vstore_half(double data, size_t offset, __local half *p);
12189 void __ovld vstore_half_rte(double data, size_t offset, __local half *p);
12190 void __ovld vstore_half_rtz(double data, size_t offset, __local half *p);
12191 void __ovld vstore_half_rtp(double data, size_t offset, __local half *p);
12192 void __ovld vstore_half_rtn(double data, size_t offset, __local half *p);
12291 void __ovld vstore_half2(float2 data, size_t offset, __local half *p);
12292 void __ovld vstore_half3(float3 data, size_t offset, __local half *p);
12293 void __ovld vstore_half4(float4 data, size_t offset, __local half *p);
12294 void __ovld vstore_half8(float8 data, size_t offset, __local half *p);
12295 void __ovld vstore_half16(float16 data, size_t offset, __local half *p);
12296 void __ovld vstore_half2_rte(float2 data, size_t offset, __local half *p);
12297 void __ovld vstore_half3_rte(float3 data, size_t offset, __local half *p);
12298 void __ovld vstore_half4_rte(float4 data, size_t offset, __local half *p);
12299 void __ovld vstore_half8_rte(float8 data, size_t offset, __local half *p);
12300 void __ovld vstore_half16_rte(float16 data, size_t offset, __local half *p);
12301 __local half *p);
12302 void __ovld vstore_half3_rtz(float3 data, size_t offset, __local half *p);
12303 void __ovld vstore_half4_rtz(float4 data, size_t offset, __local half *p);
12304 void __ovld vstore_half8_rtz(float8 data, size_t offset, __local half *p);
12305 void __ovld vstore_half16_rtz(float16 data, size_t offset, __local half *p);
12306 void __ovld vstore_half2_rtp(float2 data, size_t offset, __local half *p);
12307 void __ovld vstore_half3_rtp(float3 data, size_t offset, __local half *p);
12308 void __ovld vstore_half4_rtp(float4 data, size_t offset, __local half *p);
12309 void __ovld vstore_half8_rtp(float8 data, size_t offset, __local half *p);
12310 void __ovld vstore_half16_rtp(float16 data, size_t offset, __local half *p);
12311 void __ovld vstore_half2_rtn(float2 data, size_t offset, __local half *p);
12312 void __ovld vstore_half3_rtn(float3 data, size_t offset, __local half *p);
12313 void __ovld vstore_half4_rtn(float4 data, size_t offset, __local half *p);
12314 void __ovld vstore_half8_rtn(float8 data, size_t offset, __local half *p);
12315 void __ovld vstore_half16_rtn(float16 data, size_t offset, __local half *p);
12367 void __ovld vstore_half2(double2 data, size_t offset, __local half *p);
12368 void __ovld vstore_half3(double3 data, size_t offset, __local half *p);
12369 void __ovld vstore_half4(double4 data, size_t offset, __local half *p);
12370 void __ovld vstore_half8(double8 data, size_t offset, __local half *p);
12371 void __ovld vstore_half16(double16 data, size_t offset, __local half *p);
12372 void __ovld vstore_half2_rte(double2 data, size_t offset, __local half *p);
12373 void __ovld vstore_half3_rte(double3 data, size_t offset, __local half *p);
12374 void __ovld vstore_half4_rte(double4 data, size_t offset, __local half *p);
12375 void __ovld vstore_half8_rte(double8 data, size_t offset, __local half *p);
12376 void __ovld vstore_half16_rte(double16 data, size_t offset, __local half *p);
12377 void __ovld vstore_half2_rtz(double2 data, size_t offset, __local half *p);
12378 void __ovld vstore_half3_rtz(double3 data, size_t offset, __local half *p);
12379 void __ovld vstore_half4_rtz(double4 data, size_t offset, __local half *p);
12380 void __ovld vstore_half8_rtz(double8 data, size_t offset, __local half *p);
12381 void __ovld vstore_half16_rtz(double16 data, size_t offset, __local half *p);
12382 void __ovld vstore_half2_rtp(double2 data, size_t offset, __local half *p);
12383 void __ovld vstore_half3_rtp(double3 data, size_t offset, __local half *p);
12384 void __ovld vstore_half4_rtp(double4 data, size_t offset, __local half *p);
12385 void __ovld vstore_half8_rtp(double8 data, size_t offset, __local half *p);
12386 void __ovld vstore_half16_rtp(double16 data, size_t offset, __local half *p);
12387 void __ovld vstore_half2_rtn(double2 data, size_t offset, __local half *p);
12388 void __ovld vstore_half3_rtn(double3 data, size_t offset, __local half *p);
12389 void __ovld vstore_half4_rtn(double4 data, size_t offset, __local half *p);
12390 void __ovld vstore_half8_rtn(double8 data, size_t offset, __local half *p);
12391 void __ovld vstore_half16_rtn(double16 data, size_t offset, __local half *p);
12453 float __ovld vloada_half(size_t offset, const __local half *p);
12454 float2 __ovld vloada_half2(size_t offset, const __local half *p);
12455 float3 __ovld vloada_half3(size_t offset, const __local half *p);
12456 float4 __ovld vloada_half4(size_t offset, const __local half *p);
12457 float8 __ovld vloada_half8(size_t offset, const __local half *p);
12458 float16 __ovld vloada_half16(size_t offset, const __local half *p);
12592 void __ovld vstorea_half(float data, size_t offset, __local half *p);
12593 void __ovld vstorea_half2(float2 data, size_t offset, __local half *p);
12594 void __ovld vstorea_half3(float3 data, size_t offset, __local half *p);
12595 void __ovld vstorea_half4(float4 data, size_t offset, __local half *p);
12596 void __ovld vstorea_half8(float8 data, size_t offset, __local half *p);
12597 void __ovld vstorea_half16(float16 data, size_t offset, __local half *p);
12599 void __ovld vstorea_half_rte(float data, size_t offset, __local half *p);
12600 void __ovld vstorea_half2_rte(float2 data, size_t offset, __local half *p);
12601 void __ovld vstorea_half3_rte(float3 data, size_t offset, __local half *p);
12602 void __ovld vstorea_half4_rte(float4 data, size_t offset, __local half *p);
12603 void __ovld vstorea_half8_rte(float8 data, size_t offset, __local half *p);
12604 void __ovld vstorea_half16_rte(float16 data, size_t offset, __local half *p);
12606 void __ovld vstorea_half_rtz(float data, size_t offset, __local half *p);
12607 void __ovld vstorea_half2_rtz(float2 data, size_t offset, __local half *p);
12608 void __ovld vstorea_half3_rtz(float3 data, size_t offset, __local half *p);
12609 void __ovld vstorea_half4_rtz(float4 data, size_t offset, __local half *p);
12610 void __ovld vstorea_half8_rtz(float8 data, size_t offset, __local half *p);
12611 void __ovld vstorea_half16_rtz(float16 data, size_t offset, __local half *p);
12613 void __ovld vstorea_half_rtp(float data, size_t offset, __local half *p);
12614 void __ovld vstorea_half2_rtp(float2 data, size_t offset, __local half *p);
12615 void __ovld vstorea_half3_rtp(float3 data, size_t offset, __local half *p);
12616 void __ovld vstorea_half4_rtp(float4 data, size_t offset, __local half *p);
12617 void __ovld vstorea_half8_rtp(float8 data, size_t offset, __local half *p);
12618 void __ovld vstorea_half16_rtp(float16 data, size_t offset, __local half *p);
12620 void __ovld vstorea_half_rtn(float data, size_t offset, __local half *p);
12621 void __ovld vstorea_half2_rtn(float2 data, size_t offset, __local half *p);
12622 void __ovld vstorea_half3_rtn(float3 data, size_t offset, __local half *p);
12623 void __ovld vstorea_half4_rtn(float4 data, size_t offset, __local half *p);
12624 void __ovld vstorea_half8_rtn(float8 data, size_t offset, __local half *p);
12625 void __ovld vstorea_half16_rtn(float16 data, size_t offset, __local half *p);
12698 void __ovld vstorea_half(double data, size_t offset, __local half *p);
12699 void __ovld vstorea_half2(double2 data, size_t offset, __local half *p);
12700 void __ovld vstorea_half3(double3 data, size_t offset, __local half *p);
12701 void __ovld vstorea_half4(double4 data, size_t offset, __local half *p);
12702 void __ovld vstorea_half8(double8 data, size_t offset, __local half *p);
12703 void __ovld vstorea_half16(double16 data, size_t offset, __local half *p);
12705 void __ovld vstorea_half_rte(double data, size_t offset, __local half *p);
12706 void __ovld vstorea_half2_rte(double2 data, size_t offset, __local half *p);
12707 void __ovld vstorea_half3_rte(double3 data, size_t offset, __local half *p);
12708 void __ovld vstorea_half4_rte(double4 data, size_t offset, __local half *p);
12709 void __ovld vstorea_half8_rte(double8 data, size_t offset, __local half *p);
12710 void __ovld vstorea_half16_rte(double16 data, size_t offset, __local half *p);
12712 void __ovld vstorea_half_rtz(double data, size_t offset, __local half *p);
12713 void __ovld vstorea_half2_rtz(double2 data, size_t offset, __local half *p);
12714 void __ovld vstorea_half3_rtz(double3 data, size_t offset, __local half *p);
12715 void __ovld vstorea_half4_rtz(double4 data, size_t offset, __local half *p);
12716 void __ovld vstorea_half8_rtz(double8 data, size_t offset, __local half *p);
12717 void __ovld vstorea_half16_rtz(double16 data, size_t offset, __local half *p);
12719 void __ovld vstorea_half_rtp(double data, size_t offset, __local half *p);
12720 void __ovld vstorea_half2_rtp(double2 data, size_t offset, __local half *p);
12721 void __ovld vstorea_half3_rtp(double3 data, size_t offset, __local half *p);
12722 void __ovld vstorea_half4_rtp(double4 data, size_t offset, __local half *p);
12723 void __ovld vstorea_half8_rtp(double8 data, size_t offset, __local half *p);
12724 void __ovld vstorea_half16_rtp(double16 data, size_t offset, __local half *p);
12726 void __ovld vstorea_half_rtn(double data, size_t offset, __local half *p);
12727 void __ovld vstorea_half2_rtn(double2 data, size_t offset, __local half *p);
12728 void __ovld vstorea_half3_rtn(double3 data, size_t offset, __local half *p);
12729 void __ovld vstorea_half4_rtn(double4 data, size_t offset, __local half *p);
12730 void __ovld vstorea_half8_rtn(double8 data, size_t offset, __local half *p);
12731 void __ovld vstorea_half16_rtn(double16 data, size_t offset, __local half *p);
12905 * const __local gentype *src,
12929 event_t __ovld async_work_group_copy(__local char *dst, const __global char *src, size_t num_elements, event_t event);
12930 event_t __ovld async_work_group_copy(__local uchar *dst, const __global uchar *src, size_t num_elements, event_t event);
12931 event_t __ovld async_work_group_copy(__local short *dst, const __global short *src, size_t num_elements, event_t event);
12932 event_t __ovld async_work_group_copy(__local ushort *dst, const __global ushort *src, size_t num_elements, event_t event);
12933 event_t __ovld async_work_group_copy(__local int *dst, const __global int *src, size_t num_elements, event_t event);
12934 event_t __ovld async_work_group_copy(__local uint *dst, const __global uint *src, size_t num_elements, event_t event);
12935 event_t __ovld async_work_group_copy(__local long *dst, const __global long *src, size_t num_elements, event_t event);
12936 event_t __ovld async_work_group_copy(__local ulong *dst, const __global ulong *src, size_t num_elements, event_t event);
12937 event_t __ovld async_work_group_copy(__local float *dst, const __global float *src, size_t num_elements, event_t event);
12938 event_t __ovld async_work_group_copy(__local char2 *dst, const __global char2 *src, size_t num_elements, event_t event);
12939 event_t __ovld async_work_group_copy(__local uchar2 *dst, const __global uchar2 *src, size_t num_elements, event_t event);
12940 event_t __ovld async_work_group_copy(__local short2 *dst, const __global short2 *src, size_t num_elements, event_t event);
12941 event_t __ovld async_work_group_copy(__local ushort2 *dst, const __global ushort2 *src, size_t num_elements, event_t event);
12942 event_t __ovld async_work_group_copy(__local int2 *dst, const __global int2 *src, size_t num_elements, event_t event);
12943 event_t __ovld async_work_group_copy(__local uint2 *dst, const __global uint2 *src, size_t num_elements, event_t event);
12944 event_t __ovld async_work_group_copy(__local long2 *dst, const __global long2 *src, size_t num_elements, event_t event);
12945 event_t __ovld async_work_group_copy(__local ulong2 *dst, const __global ulong2 *src, size_t num_elements, event_t event);
12946 event_t __ovld async_work_group_copy(__local float2 *dst, const __global float2 *src, size_t num_elements, event_t event);
12947 event_t __ovld async_work_group_copy(__local char3 *dst, const __global char3 *src, size_t num_elements, event_t event);
12948 event_t __ovld async_work_group_copy(__local uchar3 *dst, const __global uchar3 *src, size_t num_elements, event_t event);
12949 event_t __ovld async_work_group_copy(__local short3 *dst, const __global short3 *src, size_t num_elements, event_t event);
12950 event_t __ovld async_work_group_copy(__local ushort3 *dst, const __global ushort3 *src, size_t num_elements, event_t event);
12951 event_t __ovld async_work_group_copy(__local int3 *dst, const __global int3 *src, size_t num_elements, event_t event);
12952 event_t __ovld async_work_group_copy(__local uint3 *dst, const __global uint3 *src, size_t num_elements, event_t event);
12953 event_t __ovld async_work_group_copy(__local long3 *dst, const __global long3 *src, size_t num_elements, event_t event);
12954 event_t __ovld async_work_group_copy(__local ulong3 *dst, const __global ulong3 *src, size_t num_elements, event_t event);
12955 event_t __ovld async_work_group_copy(__local float3 *dst, const __global float3 *src, size_t num_elements, event_t event);
12956 event_t __ovld async_work_group_copy(__local char4 *dst, const __global char4 *src, size_t num_elements, event_t event);
12957 event_t __ovld async_work_group_copy(__local uchar4 *dst, const __global uchar4 *src, size_t num_elements, event_t event);
12958 event_t __ovld async_work_group_copy(__local short4 *dst, const __global short4 *src, size_t num_elements, event_t event);
12959 event_t __ovld async_work_group_copy(__local ushort4 *dst, const __global ushort4 *src, size_t num_elements, event_t event);
12960 event_t __ovld async_work_group_copy(__local int4 *dst, const __global int4 *src, size_t num_elements, event_t event);
12961 event_t __ovld async_work_group_copy(__local uint4 *dst, const __global uint4 *src, size_t num_elements, event_t event);
12962 event_t __ovld async_work_group_copy(__local long4 *dst, const __global long4 *src, size_t num_elements, event_t event);
12963 event_t __ovld async_work_group_copy(__local ulong4 *dst, const __global ulong4 *src, size_t num_elements, event_t event);
12964 event_t __ovld async_work_group_copy(__local float4 *dst, const __global float4 *src, size_t num_elements, event_t event);
12965 event_t __ovld async_work_group_copy(__local char8 *dst, const __global char8 *src, size_t num_elements, event_t event);
12966 event_t __ovld async_work_group_copy(__local uchar8 *dst, const __global uchar8 *src, size_t num_elements, event_t event);
12967 event_t __ovld async_work_group_copy(__local short8 *dst, const __global short8 *src, size_t num_elements, event_t event);
12968 event_t __ovld async_work_group_copy(__local ushort8 *dst, const __global ushort8 *src, size_t num_elements, event_t event);
12969 event_t __ovld async_work_group_copy(__local int8 *dst, const __global int8 *src, size_t num_elements, event_t event);
12970 event_t __ovld async_work_group_copy(__local uint8 *dst, const __global uint8 *src, size_t num_elements, event_t event);
12971 event_t __ovld async_work_group_copy(__local long8 *dst, const __global long8 *src, size_t num_elements, event_t event);
12972 event_t __ovld async_work_group_copy(__local ulong8 *dst, const __global ulong8 *src, size_t num_elements, event_t event);
12973 event_t __ovld async_work_group_copy(__local float8 *dst, const __global float8 *src, size_t num_elements, event_t event);
12974 event_t __ovld async_work_group_copy(__local char16 *dst, const __global char16 *src, size_t num_elements, event_t event);
12975 event_t __ovld async_work_group_copy(__local uchar16 *dst, const __global uchar16 *src, size_t num_elements, event_t event);
12976 event_t __ovld async_work_group_copy(__local short16 *dst, const __global short16 *src, size_t num_elements, event_t event);
12977 event_t __ovld async_work_group_copy(__local ushort16 *dst, const __global ushort16 *src, size_t num_elements, event_t event);
12978 event_t __ovld async_work_group_copy(__local int16 *dst, const __global int16 *src, size_t num_elements, event_t event);
12979 event_t __ovld async_work_group_copy(__local uint16 *dst, const __global uint16 *src, size_t num_elements, event_t event);
12980 event_t __ovld async_work_group_copy(__local long16 *dst, const __global long16 *src, size_t num_elements, event_t event);
12981 event_t __ovld async_work_group_copy(__local ulong16 *dst, const __global ulong16 *src, size_t num_elements, event_t event);
12982 event_t __ovld async_work_group_copy(__local float16 *dst, const __global float16 *src, size_t num_elements, event_t event);
12983 event_t __ovld async_work_group_copy(__global char *dst, const __local char *src, size_t num_elements, event_t event);
12984 event_t __ovld async_work_group_copy(__global uchar *dst, const __local uchar *src, size_t num_elements, event_t event);
12985 event_t __ovld async_work_group_copy(__global short *dst, const __local short *src, size_t num_elements, event_t event);
12986 event_t __ovld async_work_group_copy(__global ushort *dst, const __local ushort *src, size_t num_elements, event_t event);
12987 event_t __ovld async_work_group_copy(__global int *dst, const __local int *src, size_t num_elements, event_t event);
12988 event_t __ovld async_work_group_copy(__global uint *dst, const __local uint *src, size_t num_elements, event_t event);
12989 event_t __ovld async_work_group_copy(__global long *dst, const __local long *src, size_t num_elements, event_t event);
12990 event_t __ovld async_work_group_copy(__global ulong *dst, const __local ulong *src, size_t num_elements, event_t event);
12991 event_t __ovld async_work_group_copy(__global float *dst, const __local float *src, size_t num_elements, event_t event);
12992 event_t __ovld async_work_group_copy(__global char2 *dst, const __local char2 *src, size_t num_elements, event_t event);
12993 event_t __ovld async_work_group_copy(__global uchar2 *dst, const __local uchar2 *src, size_t num_elements, event_t event);
12994 event_t __ovld async_work_group_copy(__global short2 *dst, const __local short2 *src, size_t num_elements, event_t event);
12995 event_t __ovld async_work_group_copy(__global ushort2 *dst, const __local ushort2 *src, size_t num_elements, event_t event);
12996 event_t __ovld async_work_group_copy(__global int2 *dst, const __local int2 *src, size_t num_elements, event_t event);
12997 event_t __ovld async_work_group_copy(__global uint2 *dst, const __local uint2 *src, size_t num_elements, event_t event);
12998 event_t __ovld async_work_group_copy(__global long2 *dst, const __local long2 *src, size_t num_elements, event_t event);
12999 event_t __ovld async_work_group_copy(__global ulong2 *dst, const __local ulong2 *src, size_t num_elements, event_t event);
13000 event_t __ovld async_work_group_copy(__global float2 *dst, const __local float2 *src, size_t num_elements, event_t event);
13001 event_t __ovld async_work_group_copy(__global char3 *dst, const __local char3 *src, size_t num_elements, event_t event);
13002 event_t __ovld async_work_group_copy(__global uchar3 *dst, const __local uchar3 *src, size_t num_elements, event_t event);
13003 event_t __ovld async_work_group_copy(__global short3 *dst, const __local short3 *src, size_t num_elements, event_t event);
13004 event_t __ovld async_work_group_copy(__global ushort3 *dst, const __local ushort3 *src, size_t num_elements, event_t event);
13005 event_t __ovld async_work_group_copy(__global int3 *dst, const __local int3 *src, size_t num_elements, event_t event);
13006 event_t __ovld async_work_group_copy(__global uint3 *dst, const __local uint3 *src, size_t num_elements, event_t event);
13007 event_t __ovld async_work_group_copy(__global long3 *dst, const __local long3 *src, size_t num_elements, event_t event);
13008 event_t __ovld async_work_group_copy(__global ulong3 *dst, const __local ulong3 *src, size_t num_elements, event_t event);
13009 event_t __ovld async_work_group_copy(__global float3 *dst, const __local float3 *src, size_t num_elements, event_t event);
13010 event_t __ovld async_work_group_copy(__global char4 *dst, const __local char4 *src, size_t num_elements, event_t event);
13011 event_t __ovld async_work_group_copy(__global uchar4 *dst, const __local uchar4 *src, size_t num_elements, event_t event);
13012 event_t __ovld async_work_group_copy(__global short4 *dst, const __local short4 *src, size_t num_elements, event_t event);
13013 event_t __ovld async_work_group_copy(__global ushort4 *dst, const __local ushort4 *src, size_t num_elements, event_t event);
13014 event_t __ovld async_work_group_copy(__global int4 *dst, const __local int4 *src, size_t num_elements, event_t event);
13015 event_t __ovld async_work_group_copy(__global uint4 *dst, const __local uint4 *src, size_t num_elements, event_t event);
13016 event_t __ovld async_work_group_copy(__global long4 *dst, const __local long4 *src, size_t num_elements, event_t event);
13017 event_t __ovld async_work_group_copy(__global ulong4 *dst, const __local ulong4 *src, size_t num_elements, event_t event);
13018 event_t __ovld async_work_group_copy(__global float4 *dst, const __local float4 *src, size_t num_elements, event_t event);
13019 event_t __ovld async_work_group_copy(__global char8 *dst, const __local char8 *src, size_t num_elements, event_t event);
13020 event_t __ovld async_work_group_copy(__global uchar8 *dst, const __local uchar8 *src, size_t num_elements, event_t event);
13021 event_t __ovld async_work_group_copy(__global short8 *dst, const __local short8 *src, size_t num_elements, event_t event);
13022 event_t __ovld async_work_group_copy(__global ushort8 *dst, const __local ushort8 *src, size_t num_elements, event_t event);
13023 event_t __ovld async_work_group_copy(__global int8 *dst, const __local int8 *src, size_t num_elements, event_t event);
13024 event_t __ovld async_work_group_copy(__global uint8 *dst, const __local uint8 *src, size_t num_elements, event_t event);
13025 event_t __ovld async_work_group_copy(__global long8 *dst, const __local long8 *src, size_t num_elements, event_t event);
13026 event_t __ovld async_work_group_copy(__global ulong8 *dst, const __local ulong8 *src, size_t num_elements, event_t event);
13027 event_t __ovld async_work_group_copy(__global float8 *dst, const __local float8 *src, size_t num_elements, event_t event);
13028 event_t __ovld async_work_group_copy(__global char16 *dst, const __local char16 *src, size_t num_elements, event_t event);
13029 event_t __ovld async_work_group_copy(__global uchar16 *dst, const __local uchar16 *src, size_t num_elements, event_t event);
13030 event_t __ovld async_work_group_copy(__global short16 *dst, const __local short16 *src, size_t num_elements, event_t event);
13031 event_t __ovld async_work_group_copy(__global ushort16 *dst, const __local ushort16 *src, size_t num_elements, event_t event);
13032 event_t __ovld async_work_group_copy(__global int16 *dst, const __local int16 *src, size_t num_elements, event_t event);
13033 event_t __ovld async_work_group_copy(__global uint16 *dst, const __local uint16 *src, size_t num_elements, event_t event);
13034 event_t __ovld async_work_group_copy(__global long16 *dst, const __local long16 *src, size_t num_elements, event_t event);
13035 event_t __ovld async_work_group_copy(__global ulong16 *dst, const __local ulong16 *src, size_t num_elements, event_t event);
13036 event_t __ovld async_work_group_copy(__global float16 *dst, const __local float16 *src, size_t num_elements, event_t event);
13038 event_t __ovld async_work_group_copy(__local double *dst, const __global double *src, size_t num_elements, event_t event);
13039 event_t __ovld async_work_group_copy(__local double2 *dst, const __global double2 *src, size_t num_elements, event_t event);
13040 event_t __ovld async_work_group_copy(__local double3 *dst, const __global double3 *src, size_t num_elements, event_t event);
13041 event_t __ovld async_work_group_copy(__local double4 *dst, const __global double4 *src, size_t num_elements, event_t event);
13042 event_t __ovld async_work_group_copy(__local double8 *dst, const __global double8 *src, size_t num_elements, event_t event);
13043 event_t __ovld async_work_group_copy(__local double16 *dst, const __global double16 *src, size_t num_elements, event_t event);
13044 event_t __ovld async_work_group_copy(__global double *dst, const __local double *src, size_t num_elements, event_t event);
13045 event_t __ovld async_work_group_copy(__global double2 *dst, const __local double2 *src, size_t num_elements, event_t event);
13046 event_t __ovld async_work_group_copy(__global double3 *dst, const __local double3 *src, size_t num_elements, event_t event);
13047 event_t __ovld async_work_group_copy(__global double4 *dst, const __local double4 *src, size_t num_elements, event_t event);
13048 event_t __ovld async_work_group_copy(__global double8 *dst, const __local double8 *src, size_t num_elements, event_t event);
13049 event_t __ovld async_work_group_copy(__global double16 *dst, const __local double16 *src, size_t num_elements, event_t event);
13052 event_t __ovld async_work_group_copy(__local half *dst, const __global half *src, size_t num_elements, event_t event);
13053 event_t __ovld async_work_group_copy(__local half2 *dst, const __global half2 *src, size_t num_elements, event_t event);
13054 event_t __ovld async_work_group_copy(__local half3 *dst, const __global half3 *src, size_t num_elements, event_t event);
13055 event_t __ovld async_work_group_copy(__local half4 *dst, const __global half4 *src, size_t num_elements, event_t event);
13056 event_t __ovld async_work_group_copy(__local half8 *dst, const __global half8 *src, size_t num_elements, event_t event);
13057 event_t __ovld async_work_group_copy(__local half16 *dst, const __global half16 *src, size_t num_elements, event_t event);
13058 event_t __ovld async_work_group_copy(__global half *dst, const __local half *src, size_t num_elements, event_t event);
13059 event_t __ovld async_work_group_copy(__global half2 *dst, const __local half2 *src, size_t num_elements, event_t event);
13060 event_t __ovld async_work_group_copy(__global half3 *dst, const __local half3 *src, size_t num_elements, event_t event);
13061 event_t __ovld async_work_group_copy(__global half4 *dst, const __local half4 *src, size_t num_elements, event_t event);
13062 event_t __ovld async_work_group_copy(__global half8 *dst, const __local half8 *src, size_t num_elements, event_t event);
13063 event_t __ovld async_work_group_copy(__global half16 *dst, const __local half16 *src, size_t num_elements, event_t event);
13092 event_t __ovld async_work_group_strided_copy(__local char *dst, const __global char *src, size_t num_elements, size_t src_stride, event_t event);
13093 event_t __ovld async_work_group_strided_copy(__local uchar *dst, const __global uchar *src, size_t num_elements, size_t src_stride, event_t event);
13094 event_t __ovld async_work_group_strided_copy(__local short *dst, const __global short *src, size_t num_elements, size_t src_stride, event_t event);
13095 event_t __ovld async_work_group_strided_copy(__local ushort *dst, const __global ushort *src, size_t num_elements, size_t src_stride, event_t event);
13096 event_t __ovld async_work_group_strided_copy(__local int *dst, const __global int *src, size_t num_elements, size_t src_stride, event_t event);
13097 event_t __ovld async_work_group_strided_copy(__local uint *dst, const __global uint *src, size_t num_elements, size_t src_stride, event_t event);
13098 event_t __ovld async_work_group_strided_copy(__local long *dst, const __global long *src, size_t num_elements, size_t src_stride, event_t event);
13099 event_t __ovld async_work_group_strided_copy(__local ulong *dst, const __global ulong *src, size_t num_elements, size_t src_stride, event_t event);
13100 event_t __ovld async_work_group_strided_copy(__local float *dst, const __global float *src, size_t num_elements, size_t src_stride, event_t event);
13101 event_t __ovld async_work_group_strided_copy(__local char2 *dst, const __global char2 *src, size_t num_elements, size_t src_stride, event_t event);
13102 event_t __ovld async_work_group_strided_copy(__local uchar2 *dst, const __global uchar2 *src, size_t num_elements, size_t src_stride, event_t event);
13103 event_t __ovld async_work_group_strided_copy(__local short2 *dst, const __global short2 *src, size_t num_elements, size_t src_stride, event_t event);
13104 event_t __ovld async_work_group_strided_copy(__local ushort2 *dst, const __global ushort2 *src, size_t num_elements, size_t src_stride, event_t event);
13105 event_t __ovld async_work_group_strided_copy(__local int2 *dst, const __global int2 *src, size_t num_elements, size_t src_stride, event_t event);
13106 event_t __ovld async_work_group_strided_copy(__local uint2 *dst, const __global uint2 *src, size_t num_elements, size_t src_stride, event_t event);
13107 event_t __ovld async_work_group_strided_copy(__local long2 *dst, const __global long2 *src, size_t num_elements, size_t src_stride, event_t event);
13108 event_t __ovld async_work_group_strided_copy(__local ulong2 *dst, const __global ulong2 *src, size_t num_elements, size_t src_stride, event_t event);
13109 event_t __ovld async_work_group_strided_copy(__local float2 *dst, const __global float2 *src, size_t num_elements, size_t src_stride, event_t event);
13110 event_t __ovld async_work_group_strided_copy(__local char3 *dst, const __global char3 *src, size_t num_elements, size_t src_stride, event_t event);
13111 event_t __ovld async_work_group_strided_copy(__local uchar3 *dst, const __global uchar3 *src, size_t num_elements, size_t src_stride, event_t event);
13112 event_t __ovld async_work_group_strided_copy(__local short3 *dst, const __global short3 *src, size_t num_elements, size_t src_stride, event_t event);
13113 event_t __ovld async_work_group_strided_copy(__local ushort3 *dst, const __global ushort3 *src, size_t num_elements, size_t src_stride, event_t event);
13114 event_t __ovld async_work_group_strided_copy(__local int3 *dst, const __global int3 *src, size_t num_elements, size_t src_stride, event_t event);
13115 event_t __ovld async_work_group_strided_copy(__local uint3 *dst, const __global uint3 *src, size_t num_elements, size_t src_stride, event_t event);
13116 event_t __ovld async_work_group_strided_copy(__local long3 *dst, const __global long3 *src, size_t num_elements, size_t src_stride, event_t event);
13117 event_t __ovld async_work_group_strided_copy(__local ulong3 *dst, const __global ulong3 *src, size_t num_elements, size_t src_stride, event_t event);
13118 event_t __ovld async_work_group_strided_copy(__local float3 *dst, const __global float3 *src, size_t num_elements, size_t src_stride, event_t event);
13119 event_t __ovld async_work_group_strided_copy(__local char4 *dst, const __global char4 *src, size_t num_elements, size_t src_stride, event_t event);
13120 event_t __ovld async_work_group_strided_copy(__local uchar4 *dst, const __global uchar4 *src, size_t num_elements, size_t src_stride, event_t event);
13121 event_t __ovld async_work_group_strided_copy(__local short4 *dst, const __global short4 *src, size_t num_elements, size_t src_stride, event_t event);
13122 event_t __ovld async_work_group_strided_copy(__local ushort4 *dst, const __global ushort4 *src, size_t num_elements, size_t src_stride, event_t event);
13123 event_t __ovld async_work_group_strided_copy(__local int4 *dst, const __global int4 *src, size_t num_elements, size_t src_stride, event_t event);
13124 event_t __ovld async_work_group_strided_copy(__local uint4 *dst, const __global uint4 *src, size_t num_elements, size_t src_stride, event_t event);
13125 event_t __ovld async_work_group_strided_copy(__local long4 *dst, const __global long4 *src, size_t num_elements, size_t src_stride, event_t event);
13126 event_t __ovld async_work_group_strided_copy(__local ulong4 *dst, const __global ulong4 *src, size_t num_elements, size_t src_stride, event_t event);
13127 event_t __ovld async_work_group_strided_copy(__local float4 *dst, const __global float4 *src, size_t num_elements, size_t src_stride, event_t event);
13128 event_t __ovld async_work_group_strided_copy(__local char8 *dst, const __global char8 *src, size_t num_elements, size_t src_stride, event_t event);
13129 event_t __ovld async_work_group_strided_copy(__local uchar8 *dst, const __global uchar8 *src, size_t num_elements, size_t src_stride, event_t event);
13130 event_t __ovld async_work_group_strided_copy(__local short8 *dst, const __global short8 *src, size_t num_elements, size_t src_stride, event_t event);
13131 event_t __ovld async_work_group_strided_copy(__local ushort8 *dst, const __global ushort8 *src, size_t num_elements, size_t src_stride, event_t event);
13132 event_t __ovld async_work_group_strided_copy(__local int8 *dst, const __global int8 *src, size_t num_elements, size_t src_stride, event_t event);
13133 event_t __ovld async_work_group_strided_copy(__local uint8 *dst, const __global uint8 *src, size_t num_elements, size_t src_stride, event_t event);
13134 event_t __ovld async_work_group_strided_copy(__local long8 *dst, const __global long8 *src, size_t num_elements, size_t src_stride, event_t event);
13135 event_t __ovld async_work_group_strided_copy(__local ulong8 *dst, const __global ulong8 *src, size_t num_elements, size_t src_stride, event_t event);
13136 event_t __ovld async_work_group_strided_copy(__local float8 *dst, const __global float8 *src, size_t num_elements, size_t src_stride, event_t event);
13137 event_t __ovld async_work_group_strided_copy(__local char16 *dst, const __global char16 *src, size_t num_elements, size_t src_stride, event_t event);
13138 event_t __ovld async_work_group_strided_copy(__local uchar16 *dst, const __global uchar16 *src, size_t num_elements, size_t src_stride, event_t event);
13139 event_t __ovld async_work_group_strided_copy(__local short16 *dst, const __global short16 *src, size_t num_elements, size_t src_stride, event_t event);
13140 event_t __ovld async_work_group_strided_copy(__local ushort16 *dst, const __global ushort16 *src, size_t num_elements, size_t src_stride, event_t event);
13141 event_t __ovld async_work_group_strided_copy(__local int16 *dst, const __global int16 *src, size_t num_elements, size_t src_stride, event_t event);
13142 event_t __ovld async_work_group_strided_copy(__local uint16 *dst, const __global uint16 *src, size_t num_elements, size_t src_stride, event_t event);
13143 event_t __ovld async_work_group_strided_copy(__local long16 *dst, const __global long16 *src, size_t num_elements, size_t src_stride, event_t event);
13144 event_t __ovld async_work_group_strided_copy(__local ulong16 *dst, const __global ulong16 *src, size_t num_elements, size_t src_stride, event_t event);
13145 event_t __ovld async_work_group_strided_copy(__local float16 *dst, const __global float16 *src, size_t num_elements, size_t src_stride, event_t event);
13146 event_t __ovld async_work_group_strided_copy(__global char *dst, const __local char *src, size_t num_elements, size_t dst_stride, event_t event);
13147 event_t __ovld async_work_group_strided_copy(__global uchar *dst, const __local uchar *src, size_t num_elements, size_t dst_stride, event_t event);
13148 event_t __ovld async_work_group_strided_copy(__global short *dst, const __local short *src, size_t num_elements, size_t dst_stride, event_t event);
13149 event_t __ovld async_work_group_strided_copy(__global ushort *dst, const __local ushort *src, size_t num_elements, size_t dst_stride, event_t event);
13150 event_t __ovld async_work_group_strided_copy(__global int *dst, const __local int *src, size_t num_elements, size_t dst_stride, event_t event);
13151 event_t __ovld async_work_group_strided_copy(__global uint *dst, const __local uint *src, size_t num_elements, size_t dst_stride, event_t event);
13152 event_t __ovld async_work_group_strided_copy(__global long *dst, const __local long *src, size_t num_elements, size_t dst_stride, event_t event);
13153 event_t __ovld async_work_group_strided_copy(__global ulong *dst, const __local ulong *src, size_t num_elements, size_t dst_stride, event_t event);
13154 event_t __ovld async_work_group_strided_copy(__global float *dst, const __local float *src, size_t num_elements, size_t dst_stride, event_t event);
13155 event_t __ovld async_work_group_strided_copy(__global char2 *dst, const __local char2 *src, size_t num_elements, size_t dst_stride, event_t event);
13156 event_t __ovld async_work_group_strided_copy(__global uchar2 *dst, const __local uchar2 *src, size_t num_elements, size_t dst_stride, event_t event);
13157 event_t __ovld async_work_group_strided_copy(__global short2 *dst, const __local short2 *src, size_t num_elements, size_t dst_stride, event_t event);
13158 event_t __ovld async_work_group_strided_copy(__global ushort2 *dst, const __local ushort2 *src, size_t num_elements, size_t dst_stride, event_t event);
13159 event_t __ovld async_work_group_strided_copy(__global int2 *dst, const __local int2 *src, size_t num_elements, size_t dst_stride, event_t event);
13160 event_t __ovld async_work_group_strided_copy(__global uint2 *dst, const __local uint2 *src, size_t num_elements, size_t dst_stride, event_t event);
13161 event_t __ovld async_work_group_strided_copy(__global long2 *dst, const __local long2 *src, size_t num_elements, size_t dst_stride, event_t event);
13162 event_t __ovld async_work_group_strided_copy(__global ulong2 *dst, const __local ulong2 *src, size_t num_elements, size_t dst_stride, event_t event);
13163 event_t __ovld async_work_group_strided_copy(__global float2 *dst, const __local float2 *src, size_t num_elements, size_t dst_stride, event_t event);
13164 event_t __ovld async_work_group_strided_copy(__global char3 *dst, const __local char3 *src, size_t num_elements, size_t dst_stride, event_t event);
13165 event_t __ovld async_work_group_strided_copy(__global uchar3 *dst, const __local uchar3 *src, size_t num_elements, size_t dst_stride, event_t event);
13166 event_t __ovld async_work_group_strided_copy(__global short3 *dst, const __local short3 *src, size_t num_elements, size_t dst_stride, event_t event);
13167 event_t __ovld async_work_group_strided_copy(__global ushort3 *dst, const __local ushort3 *src, size_t num_elements, size_t dst_stride, event_t event);
13168 event_t __ovld async_work_group_strided_copy(__global int3 *dst, const __local int3 *src, size_t num_elements, size_t dst_stride, event_t event);
13169 event_t __ovld async_work_group_strided_copy(__global uint3 *dst, const __local uint3 *src, size_t num_elements, size_t dst_stride, event_t event);
13170 event_t __ovld async_work_group_strided_copy(__global long3 *dst, const __local long3 *src, size_t num_elements, size_t dst_stride, event_t event);
13171 event_t __ovld async_work_group_strided_copy(__global ulong3 *dst, const __local ulong3 *src, size_t num_elements, size_t dst_stride, event_t event);
13172 event_t __ovld async_work_group_strided_copy(__global float3 *dst, const __local float3 *src, size_t num_elements, size_t dst_stride, event_t event);
13173 event_t __ovld async_work_group_strided_copy(__global char4 *dst, const __local char4 *src, size_t num_elements, size_t dst_stride, event_t event);
13174 event_t __ovld async_work_group_strided_copy(__global uchar4 *dst, const __local uchar4 *src, size_t num_elements, size_t dst_stride, event_t event);
13175 event_t __ovld async_work_group_strided_copy(__global short4 *dst, const __local short4 *src, size_t num_elements, size_t dst_stride, event_t event);
13176 event_t __ovld async_work_group_strided_copy(__global ushort4 *dst, const __local ushort4 *src, size_t num_elements, size_t dst_stride, event_t event);
13177 event_t __ovld async_work_group_strided_copy(__global int4 *dst, const __local int4 *src, size_t num_elements, size_t dst_stride, event_t event);
13178 event_t __ovld async_work_group_strided_copy(__global uint4 *dst, const __local uint4 *src, size_t num_elements, size_t dst_stride, event_t event);
13179 event_t __ovld async_work_group_strided_copy(__global long4 *dst, const __local long4 *src, size_t num_elements, size_t dst_stride, event_t event);
13180 event_t __ovld async_work_group_strided_copy(__global ulong4 *dst, const __local ulong4 *src, size_t num_elements, size_t dst_stride, event_t event);
13181 event_t __ovld async_work_group_strided_copy(__global float4 *dst, const __local float4 *src, size_t num_elements, size_t dst_stride, event_t event);
13182 event_t __ovld async_work_group_strided_copy(__global char8 *dst, const __local char8 *src, size_t num_elements, size_t dst_stride, event_t event);
13183 event_t __ovld async_work_group_strided_copy(__global uchar8 *dst, const __local uchar8 *src, size_t num_elements, size_t dst_stride, event_t event);
13184 event_t __ovld async_work_group_strided_copy(__global short8 *dst, const __local short8 *src, size_t num_elements, size_t dst_stride, event_t event);
13185 event_t __ovld async_work_group_strided_copy(__global ushort8 *dst, const __local ushort8 *src, size_t num_elements, size_t dst_stride, event_t event);
13186 event_t __ovld async_work_group_strided_copy(__global int8 *dst, const __local int8 *src, size_t num_elements, size_t dst_stride, event_t event);
13187 event_t __ovld async_work_group_strided_copy(__global uint8 *dst, const __local uint8 *src, size_t num_elements, size_t dst_stride, event_t event);
13188 event_t __ovld async_work_group_strided_copy(__global long8 *dst, const __local long8 *src, size_t num_elements, size_t dst_stride, event_t event);
13189 event_t __ovld async_work_group_strided_copy(__global ulong8 *dst, const __local ulong8 *src, size_t num_elements, size_t dst_stride, event_t event);
13190 event_t __ovld async_work_group_strided_copy(__global float8 *dst, const __local float8 *src, size_t num_elements, size_t dst_stride, event_t event);
13191 event_t __ovld async_work_group_strided_copy(__global char16 *dst, const __local char16 *src, size_t num_elements, size_t dst_stride, event_t event);
13192 event_t __ovld async_work_group_strided_copy(__global uchar16 *dst, const __local uchar16 *src, size_t num_elements, size_t dst_stride, event_t event);
13193 event_t __ovld async_work_group_strided_copy(__global short16 *dst, const __local short16 *src, size_t num_elements, size_t dst_stride, event_t event);
13194 event_t __ovld async_work_group_strided_copy(__global ushort16 *dst, const __local ushort16 *src, size_t num_elements, size_t dst_stride, event_t event);
13195 event_t __ovld async_work_group_strided_copy(__global int16 *dst, const __local int16 *src, size_t num_elements, size_t dst_stride, event_t event);
13196 event_t __ovld async_work_group_strided_copy(__global uint16 *dst, const __local uint16 *src, size_t num_elements, size_t dst_stride, event_t event);
13197 event_t __ovld async_work_group_strided_copy(__global long16 *dst, const __local long16 *src, size_t num_elements, size_t dst_stride, event_t event);
13198 event_t __ovld async_work_group_strided_copy(__global ulong16 *dst, const __local ulong16 *src, size_t num_elements, size_t dst_stride, event_t event);
13199 event_t __ovld async_work_group_strided_copy(__global float16 *dst, const __local float16 *src, size_t num_elements, size_t dst_stride, event_t event);
13201 event_t __ovld async_work_group_strided_copy(__local double *dst, const __global double *src, size_t num_elements, size_t src_stride, event_t event);
13202 event_t __ovld async_work_group_strided_copy(__local double2 *dst, const __global double2 *src, size_t num_elements, size_t src_stride, event_t event);
13203 event_t __ovld async_work_group_strided_copy(__local double3 *dst, const __global double3 *src, size_t num_elements, size_t src_stride, event_t event);
13204 event_t __ovld async_work_group_strided_copy(__local double4 *dst, const __global double4 *src, size_t num_elements, size_t src_stride, event_t event);
13205 event_t __ovld async_work_group_strided_copy(__local double8 *dst, const __global double8 *src, size_t num_elements, size_t src_stride, event_t event);
13206 event_t __ovld async_work_group_strided_copy(__local double16 *dst, const __global double16 *src, size_t num_elements, size_t src_stride, event_t event);
13207 event_t __ovld async_work_group_strided_copy(__global double *dst, const __local double *src, size_t num_elements, size_t dst_stride, event_t event);
13208 event_t __ovld async_work_group_strided_copy(__global double2 *dst, const __local double2 *src, size_t num_elements, size_t dst_stride, event_t event);
13209 event_t __ovld async_work_group_strided_copy(__global double3 *dst, const __local double3 *src, size_t num_elements, size_t dst_stride, event_t event);
13210 event_t __ovld async_work_group_strided_copy(__global double4 *dst, const __local double4 *src, size_t num_elements, size_t dst_stride, event_t event);
13211 event_t __ovld async_work_group_strided_copy(__global double8 *dst, const __local double8 *src, size_t num_elements, size_t dst_stride, event_t event);
13212 event_t __ovld async_work_group_strided_copy(__global double16 *dst, const __local double16 *src, size_t num_elements, size_t dst_stride, event_t event);
13215 event_t __ovld async_work_group_strided_copy(__local half *dst, const __global half *src, size_t num_elements, size_t src_stride, event_t event);
13216 event_t __ovld async_work_group_strided_copy(__local half2 *dst, const __global half2 *src, size_t num_elements, size_t src_stride, event_t event);
13217 event_t __ovld async_work_group_strided_copy(__local half3 *dst, const __global half3 *src, size_t num_elements, size_t src_stride, event_t event);
13218 event_t __ovld async_work_group_strided_copy(__local half4 *dst, const __global half4 *src, size_t num_elements, size_t src_stride, event_t event);
13219 event_t __ovld async_work_group_strided_copy(__local half8 *dst, const __global half8 *src, size_t num_elements, size_t src_stride, event_t event);
13220 event_t __ovld async_work_group_strided_copy(__local half16 *dst, const __global half16 *src, size_t num_elements, size_t src_stride, event_t event);
13221 event_t __ovld async_work_group_strided_copy(__global half *dst, const __local half *src, size_t num_elements, size_t dst_stride, event_t event);
13222 event_t __ovld async_work_group_strided_copy(__global half2 *dst, const __local half2 *src, size_t num_elements, size_t dst_stride, event_t event);
13223 event_t __ovld async_work_group_strided_copy(__global half3 *dst, const __local half3 *src, size_t num_elements, size_t dst_stride, event_t event);
13224 event_t __ovld async_work_group_strided_copy(__global half4 *dst, const __local half4 *src, size_t num_elements, size_t dst_stride, event_t event);
13225 event_t __ovld async_work_group_strided_copy(__global half8 *dst, const __local half8 *src, size_t num_elements, size_t dst_stride, event_t event);
13226 event_t __ovld async_work_group_strided_copy(__global half16 *dst, const __local half16 *src, size_t num_elements, size_t dst_stride, event_t event);
13334 int __ovld atomic_add(volatile __local int *p, int val);
13335 unsigned int __ovld atomic_add(volatile __local unsigned int *p, unsigned int val);
13342 int __ovld atom_add(volatile __local int *p, int val);
13343 unsigned int __ovld atom_add(volatile __local unsigned int *p, unsigned int val);
13349 long __ovld atom_add(volatile __local long *p, long val);
13350 unsigned long __ovld atom_add(volatile __local unsigned long *p, unsigned long val);
13360 int __ovld atomic_sub(volatile __local int *p, int val);
13361 unsigned int __ovld atomic_sub(volatile __local unsigned int *p, unsigned int val);
13368 int __ovld atom_sub(volatile __local int *p, int val);
13369 unsigned int __ovld atom_sub(volatile __local unsigned int *p, unsigned int val);
13375 long __ovld atom_sub(volatile __local long *p, long val);
13376 unsigned long __ovld atom_sub(volatile __local unsigned long *p, unsigned long val);
13386 int __ovld atomic_xchg(volatile __local int *p, int val);
13387 unsigned int __ovld atomic_xchg(volatile __local unsigned int *p, unsigned int val);
13389 float __ovld atomic_xchg(volatile __local float *p, float val);
13396 int __ovld atom_xchg(volatile __local int *p, int val);
13397 unsigned int __ovld atom_xchg(volatile __local unsigned int *p, unsigned int val);
13402 long __ovld atom_xchg(volatile __local long *p, long val);
13404 unsigned long __ovld atom_xchg(volatile __local unsigned long *p, unsigned long val);
13415 int __ovld atomic_inc(volatile __local int *p);
13416 unsigned int __ovld atomic_inc(volatile __local unsigned int *p);
13423 int __ovld atom_inc(volatile __local int *p);
13424 unsigned int __ovld atom_inc(volatile __local unsigned int *p);
13430 long __ovld atom_inc(volatile __local long *p);
13431 unsigned long __ovld atom_inc(volatile __local unsigned long *p);
13442 int __ovld atomic_dec(volatile __local int *p);
13443 unsigned int __ovld atomic_dec(volatile __local unsigned int *p);
13450 int __ovld atom_dec(volatile __local int *p);
13451 unsigned int __ovld atom_dec(volatile __local unsigned int *p);
13457 long __ovld atom_dec(volatile __local long *p);
13458 unsigned long __ovld atom_dec(volatile __local unsigned long *p);
13470 int __ovld atomic_cmpxchg(volatile __local int *p, int cmp, int val);
13471 unsigned int __ovld atomic_cmpxchg(volatile __local unsigned int *p, unsigned int cmp, unsigned int val);
13478 int __ovld atom_cmpxchg(volatile __local int *p, int cmp, int val);
13479 unsigned int __ovld atom_cmpxchg(volatile __local unsigned int *p, unsigned int cmp, unsigned int val);
13485 long __ovld atom_cmpxchg(volatile __local long *p, long cmp, long val);
13486 unsigned long __ovld atom_cmpxchg(volatile __local unsigned long *p, unsigned long cmp, unsigned long val);
13498 int __ovld atomic_min(volatile __local int *p, int val);
13499 unsigned int __ovld atomic_min(volatile __local unsigned int *p, unsigned int val);
13506 int __ovld atom_min(volatile __local int *p, int val);
13507 unsigned int __ovld atom_min(volatile __local unsigned int *p, unsigned int val);
13513 long __ovld atom_min(volatile __local long *p, long val);
13514 unsigned long __ovld atom_min(volatile __local unsigned long *p, unsigned long val);
13526 int __ovld atomic_max(volatile __local int *p, int val);
13527 unsigned int __ovld atomic_max(volatile __local unsigned int *p, unsigned int val);
13534 int __ovld atom_max(volatile __local int *p, int val);
13535 unsigned int __ovld atom_max(volatile __local unsigned int *p, unsigned int val);
13541 long __ovld atom_max(volatile __local long *p, long val);
13542 unsigned long __ovld atom_max(volatile __local unsigned long *p, unsigned long val);
13553 int __ovld atomic_and(volatile __local int *p, int val);
13554 unsigned int __ovld atomic_and(volatile __local unsigned int *p, unsigned int val);
13561 int __ovld atom_and(volatile __local int *p, int val);
13562 unsigned int __ovld atom_and(volatile __local unsigned int *p, unsigned int val);
13568 long __ovld atom_and(volatile __local long *p, long val);
13569 unsigned long __ovld atom_and(volatile __local unsigned long *p, unsigned long val);
13580 int __ovld atomic_or(volatile __local int *p, int val);
13581 unsigned int __ovld atomic_or(volatile __local unsigned int *p, unsigned int val);
13588 int __ovld atom_or(volatile __local int *p, int val);
13589 unsigned int __ovld atom_or(volatile __local unsigned int *p, unsigned int val);
13595 long __ovld atom_or(volatile __local long *p, long val);
13596 unsigned long __ovld atom_or(volatile __local unsigned long *p, unsigned long val);
13607 int __ovld atomic_xor(volatile __local int *p, int val);
13608 unsigned int __ovld atomic_xor(volatile __local unsigned int *p, unsigned int val);
13615 int __ovld atom_xor(volatile __local int *p, int val);
13616 unsigned int __ovld atom_xor(volatile __local unsigned int *p, unsigned int val);
13622 long __ovld atom_xor(volatile __local long *p, long val);
13623 unsigned long __ovld atom_xor(volatile __local unsigned long *p, unsigned long val);