blob: 069cded82fb1b3118bd714d3086bdb302a7c0df7 [file] [log] [blame]
/*
* Copyright (c) 2014 Advanced Micro Devices, Inc.
*
* Permission is hereby granted, free of charge, to any person obtaining a copy
* of this software and associated documentation files (the "Software"), to deal
* in the Software without restriction, including without limitation the rights
* to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
* copies of the Software, and to permit persons to whom the Software is
* furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
* AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
* OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
* THE SOFTWARE.
*/
/*
 * Scalar vload_half / vloada_half.
 *
 * Each helper fetches the 16-bit pattern stored at p + i and passes it to
 * __cvt_f16_to_f32 (defined elsewhere) to obtain the float result. Both
 * public names are weak aliases of the same static helper, one helper per
 * pointer address space.
 */
extern __attribute__((pure)) float __cvt_f16_to_f32(ushort);

/* Unqualified-pointer variant. */
__attribute__((always_inline)) static float
vldhp(size_t i, const half *p)
{
    const ushort *src = (const ushort *)(p + i);
    return __cvt_f16_to_f32(*src);
}
extern __attribute__((overloadable, weak, alias("vldhp"))) float vload_half(size_t, const half *);
extern __attribute__((overloadable, weak, alias("vldhp"))) float vloada_half(size_t, const half *);

/* __constant variant. */
__attribute__((always_inline)) static float
vldhc(size_t i, const __constant half *p)
{
    const __constant ushort *src = (const __constant ushort *)(p + i);
    return __cvt_f16_to_f32(*src);
}
extern __attribute__((overloadable, weak, alias("vldhc"))) float vload_half(size_t, const __constant half *);
extern __attribute__((overloadable, weak, alias("vldhc"))) float vloada_half(size_t, const __constant half *);

/* The __global and __local variants are compiled only before OpenCL C 2.0. */
#if __OPENCL_C_VERSION__ < 200
__attribute__((always_inline)) static float
vldhg(size_t i, const __global half *p)
{
    const __global ushort *src = (const __global ushort *)(p + i);
    return __cvt_f16_to_f32(*src);
}
extern __attribute__((overloadable, weak, alias("vldhg"))) float vload_half(size_t, const __global half *);
extern __attribute__((overloadable, weak, alias("vldhg"))) float vloada_half(size_t, const __global half *);

__attribute__((always_inline)) static float
vldhl(size_t i, const __local half *p)
{
    const __local ushort *src = (const __local ushort *)(p + i);
    return __cvt_f16_to_f32(*src);
}
extern __attribute__((overloadable, weak, alias("vldhl"))) float vload_half(size_t, const __local half *);
extern __attribute__((overloadable, weak, alias("vldhl"))) float vloada_half(size_t, const __local half *);
#endif /* __OPENCL_C_VERSION__ < 200 */
/*
 * vload_half2: gather a ushort2 of raw 16-bit patterns with vload2 and
 * convert it to float2 through __cvt_2f16_to_2f32 (defined elsewhere).
 * One overload per pointer address space.
 */
extern __attribute__((pure)) float2 __cvt_2f16_to_2f32(ushort2);

__attribute__((overloadable, always_inline, weak)) float2
vload_half2(size_t i, const half *p)
{
    ushort2 bits = vload2(i, (const ushort *)p);
    return __cvt_2f16_to_2f32(bits);
}

__attribute__((overloadable, always_inline, weak)) float2
vload_half2(size_t i, const __constant half *p)
{
    ushort2 bits = vload2(i, (const __constant ushort *)p);
    return __cvt_2f16_to_2f32(bits);
}

/* The __global and __local overloads are compiled only before OpenCL C 2.0. */
#if __OPENCL_C_VERSION__ < 200
__attribute__((overloadable, always_inline, weak)) float2
vload_half2(size_t i, const __global half *p)
{
    ushort2 bits = vload2(i, (const __global ushort *)p);
    return __cvt_2f16_to_2f32(bits);
}

__attribute__((overloadable, always_inline, weak)) float2
vload_half2(size_t i, const __local half *p)
{
    ushort2 bits = vload2(i, (const __local ushort *)p);
    return __cvt_2f16_to_2f32(bits);
}
#endif /* __OPENCL_C_VERSION__ < 200 */
/*
 * vload_half3: gather a ushort3 of raw 16-bit patterns with vload3 and
 * convert it to float3 through __cvt_3f16_to_3f32 (defined elsewhere).
 * One overload per pointer address space.
 */
extern __attribute__((pure)) float3 __cvt_3f16_to_3f32(ushort3);

__attribute__((overloadable, always_inline, weak)) float3
vload_half3(size_t i, const half *p)
{
    ushort3 bits = vload3(i, (const ushort *)p);
    return __cvt_3f16_to_3f32(bits);
}

__attribute__((overloadable, always_inline, weak)) float3
vload_half3(size_t i, const __constant half *p)
{
    ushort3 bits = vload3(i, (const __constant ushort *)p);
    return __cvt_3f16_to_3f32(bits);
}

/* The __global and __local overloads are compiled only before OpenCL C 2.0. */
#if __OPENCL_C_VERSION__ < 200
__attribute__((overloadable, always_inline, weak)) float3
vload_half3(size_t i, const __global half *p)
{
    ushort3 bits = vload3(i, (const __global ushort *)p);
    return __cvt_3f16_to_3f32(bits);
}

__attribute__((overloadable, always_inline, weak)) float3
vload_half3(size_t i, const __local half *p)
{
    ushort3 bits = vload3(i, (const __local ushort *)p);
    return __cvt_3f16_to_3f32(bits);
}
#endif /* __OPENCL_C_VERSION__ < 200 */
/*
 * vload_half4: gather a ushort4 of raw 16-bit patterns with vload4 and
 * convert it to float4 through __cvt_4f16_to_4f32 (defined elsewhere).
 * One overload per pointer address space.
 */
extern __attribute__((pure)) float4 __cvt_4f16_to_4f32(ushort4);

__attribute__((overloadable, always_inline, weak)) float4
vload_half4(size_t i, const half *p)
{
    ushort4 bits = vload4(i, (const ushort *)p);
    return __cvt_4f16_to_4f32(bits);
}

__attribute__((overloadable, always_inline, weak)) float4
vload_half4(size_t i, const __constant half *p)
{
    ushort4 bits = vload4(i, (const __constant ushort *)p);
    return __cvt_4f16_to_4f32(bits);
}

/* The __global and __local overloads are compiled only before OpenCL C 2.0. */
#if __OPENCL_C_VERSION__ < 200
__attribute__((overloadable, always_inline, weak)) float4
vload_half4(size_t i, const __global half *p)
{
    ushort4 bits = vload4(i, (const __global ushort *)p);
    return __cvt_4f16_to_4f32(bits);
}

__attribute__((overloadable, always_inline, weak)) float4
vload_half4(size_t i, const __local half *p)
{
    ushort4 bits = vload4(i, (const __local ushort *)p);
    return __cvt_4f16_to_4f32(bits);
}
#endif /* __OPENCL_C_VERSION__ < 200 */
/*
 * vload_half8: gather a ushort8 of raw 16-bit patterns with vload8 and
 * convert it to float8 through __cvt_8f16_to_8f32 (defined elsewhere).
 * One overload per pointer address space.
 */
extern __attribute__((pure)) float8 __cvt_8f16_to_8f32(ushort8);

__attribute__((overloadable, always_inline, weak)) float8
vload_half8(size_t i, const half *p)
{
    ushort8 bits = vload8(i, (const ushort *)p);
    return __cvt_8f16_to_8f32(bits);
}

__attribute__((overloadable, always_inline, weak)) float8
vload_half8(size_t i, const __constant half *p)
{
    ushort8 bits = vload8(i, (const __constant ushort *)p);
    return __cvt_8f16_to_8f32(bits);
}

/* The __global and __local overloads are compiled only before OpenCL C 2.0. */
#if __OPENCL_C_VERSION__ < 200
__attribute__((overloadable, always_inline, weak)) float8
vload_half8(size_t i, const __global half *p)
{
    ushort8 bits = vload8(i, (const __global ushort *)p);
    return __cvt_8f16_to_8f32(bits);
}

__attribute__((overloadable, always_inline, weak)) float8
vload_half8(size_t i, const __local half *p)
{
    ushort8 bits = vload8(i, (const __local ushort *)p);
    return __cvt_8f16_to_8f32(bits);
}
#endif /* __OPENCL_C_VERSION__ < 200 */
/*
 * vload_half16: gather a ushort16 of raw 16-bit patterns with vload16 and
 * convert it to float16 through __cvt_16f16_to_16f32 (defined elsewhere).
 * One overload per pointer address space.
 */
extern __attribute__((pure)) float16 __cvt_16f16_to_16f32(ushort16);

__attribute__((overloadable, always_inline, weak)) float16
vload_half16(size_t i, const half *p)
{
    ushort16 bits = vload16(i, (const ushort *)p);
    return __cvt_16f16_to_16f32(bits);
}

__attribute__((overloadable, always_inline, weak)) float16
vload_half16(size_t i, const __constant half *p)
{
    ushort16 bits = vload16(i, (const __constant ushort *)p);
    return __cvt_16f16_to_16f32(bits);
}

/* The __global and __local overloads are compiled only before OpenCL C 2.0. */
#if __OPENCL_C_VERSION__ < 200
__attribute__((overloadable, always_inline, weak)) float16
vload_half16(size_t i, const __global half *p)
{
    ushort16 bits = vload16(i, (const __global ushort *)p);
    return __cvt_16f16_to_16f32(bits);
}

__attribute__((overloadable, always_inline, weak)) float16
vload_half16(size_t i, const __local half *p)
{
    ushort16 bits = vload16(i, (const __local ushort *)p);
    return __cvt_16f16_to_16f32(bits);
}
#endif /* __OPENCL_C_VERSION__ < 200 */
/*
 * vloada_half2: read one ushort2 directly from p + i * 2 (a whole-vector
 * dereference rather than a vload2 call) and convert it to float2 through
 * __cvt_2f16_to_2f32 (defined elsewhere). One overload per address space.
 */
extern __attribute__((pure)) float2 __cvt_2f16_to_2f32(ushort2);

__attribute__((overloadable, always_inline, weak)) float2
vloada_half2(size_t i, const half *p)
{
    const ushort2 *src = (const ushort2 *)(p + i * 2);
    return __cvt_2f16_to_2f32(*src);
}

__attribute__((overloadable, always_inline, weak)) float2
vloada_half2(size_t i, const __constant half *p)
{
    const __constant ushort2 *src = (const __constant ushort2 *)(p + i * 2);
    return __cvt_2f16_to_2f32(*src);
}

/* The __global and __local overloads are compiled only before OpenCL C 2.0. */
#if __OPENCL_C_VERSION__ < 200
__attribute__((overloadable, always_inline, weak)) float2
vloada_half2(size_t i, const __global half *p)
{
    const __global ushort2 *src = (const __global ushort2 *)(p + i * 2);
    return __cvt_2f16_to_2f32(*src);
}

__attribute__((overloadable, always_inline, weak)) float2
vloada_half2(size_t i, const __local half *p)
{
    const __local ushort2 *src = (const __local ushort2 *)(p + i * 2);
    return __cvt_2f16_to_2f32(*src);
}
#endif /* __OPENCL_C_VERSION__ < 200 */
/*
 * vloada_half3: read a full ushort4 from p + i * 4 (the stride is four
 * elements, not three), keep its first three lanes and convert them to
 * float3 through __cvt_3f16_to_3f32 (defined elsewhere). The fourth lane
 * is loaded but ignored. One overload per address space.
 */
extern __attribute__((pure)) float3 __cvt_3f16_to_3f32(ushort3);

__attribute__((overloadable, always_inline, weak)) float3
vloada_half3(size_t i, const half *p)
{
    const ushort4 *src = (const ushort4 *)(p + i * 4);
    ushort4 packed = *src;
    return __cvt_3f16_to_3f32(packed.xyz);
}

__attribute__((overloadable, always_inline, weak)) float3
vloada_half3(size_t i, const __constant half *p)
{
    const __constant ushort4 *src = (const __constant ushort4 *)(p + i * 4);
    ushort4 packed = *src;
    return __cvt_3f16_to_3f32(packed.xyz);
}

/* The __global and __local overloads are compiled only before OpenCL C 2.0. */
#if __OPENCL_C_VERSION__ < 200
__attribute__((overloadable, always_inline, weak)) float3
vloada_half3(size_t i, const __global half *p)
{
    const __global ushort4 *src = (const __global ushort4 *)(p + i * 4);
    ushort4 packed = *src;
    return __cvt_3f16_to_3f32(packed.xyz);
}

__attribute__((overloadable, always_inline, weak)) float3
vloada_half3(size_t i, const __local half *p)
{
    const __local ushort4 *src = (const __local ushort4 *)(p + i * 4);
    ushort4 packed = *src;
    return __cvt_3f16_to_3f32(packed.xyz);
}
#endif /* __OPENCL_C_VERSION__ < 200 */
/*
 * vloada_half4: read one ushort4 directly from p + i * 4 and convert it to
 * float4 through __cvt_4f16_to_4f32 (defined elsewhere). One overload per
 * address space.
 */
extern __attribute__((pure)) float4 __cvt_4f16_to_4f32(ushort4);

__attribute__((overloadable, always_inline, weak)) float4
vloada_half4(size_t i, const half *p)
{
    const ushort4 *src = (const ushort4 *)(p + i * 4);
    return __cvt_4f16_to_4f32(*src);
}

__attribute__((overloadable, always_inline, weak)) float4
vloada_half4(size_t i, const __constant half *p)
{
    const __constant ushort4 *src = (const __constant ushort4 *)(p + i * 4);
    return __cvt_4f16_to_4f32(*src);
}

/* The __global and __local overloads are compiled only before OpenCL C 2.0. */
#if __OPENCL_C_VERSION__ < 200
__attribute__((overloadable, always_inline, weak)) float4
vloada_half4(size_t i, const __global half *p)
{
    const __global ushort4 *src = (const __global ushort4 *)(p + i * 4);
    return __cvt_4f16_to_4f32(*src);
}

__attribute__((overloadable, always_inline, weak)) float4
vloada_half4(size_t i, const __local half *p)
{
    const __local ushort4 *src = (const __local ushort4 *)(p + i * 4);
    return __cvt_4f16_to_4f32(*src);
}
#endif /* __OPENCL_C_VERSION__ < 200 */
/*
 * vloada_half8: read one ushort8 directly from p + i * 8 and convert it to
 * float8 through __cvt_8f16_to_8f32 (defined elsewhere). One overload per
 * address space.
 */
extern __attribute__((pure)) float8 __cvt_8f16_to_8f32(ushort8);

__attribute__((overloadable, always_inline, weak)) float8
vloada_half8(size_t i, const half *p)
{
    const ushort8 *src = (const ushort8 *)(p + i * 8);
    return __cvt_8f16_to_8f32(*src);
}

__attribute__((overloadable, always_inline, weak)) float8
vloada_half8(size_t i, const __constant half *p)
{
    const __constant ushort8 *src = (const __constant ushort8 *)(p + i * 8);
    return __cvt_8f16_to_8f32(*src);
}

/* The __global and __local overloads are compiled only before OpenCL C 2.0. */
#if __OPENCL_C_VERSION__ < 200
__attribute__((overloadable, always_inline, weak)) float8
vloada_half8(size_t i, const __global half *p)
{
    const __global ushort8 *src = (const __global ushort8 *)(p + i * 8);
    return __cvt_8f16_to_8f32(*src);
}

__attribute__((overloadable, always_inline, weak)) float8
vloada_half8(size_t i, const __local half *p)
{
    const __local ushort8 *src = (const __local ushort8 *)(p + i * 8);
    return __cvt_8f16_to_8f32(*src);
}
#endif /* __OPENCL_C_VERSION__ < 200 */
/*
 * vloada_half16: read one ushort16 directly from p + i * 16 and convert it
 * to float16 through __cvt_16f16_to_16f32 (defined elsewhere). One overload
 * per address space.
 */
extern __attribute__((pure)) float16 __cvt_16f16_to_16f32(ushort16);

__attribute__((overloadable, always_inline, weak)) float16
vloada_half16(size_t i, const half *p)
{
    const ushort16 *src = (const ushort16 *)(p + i * 16);
    return __cvt_16f16_to_16f32(*src);
}

__attribute__((overloadable, always_inline, weak)) float16
vloada_half16(size_t i, const __constant half *p)
{
    const __constant ushort16 *src = (const __constant ushort16 *)(p + i * 16);
    return __cvt_16f16_to_16f32(*src);
}

/* The __global and __local overloads are compiled only before OpenCL C 2.0. */
#if __OPENCL_C_VERSION__ < 200
__attribute__((overloadable, always_inline, weak)) float16
vloada_half16(size_t i, const __global half *p)
{
    const __global ushort16 *src = (const __global ushort16 *)(p + i * 16);
    return __cvt_16f16_to_16f32(*src);
}

__attribute__((overloadable, always_inline, weak)) float16
vloada_half16(size_t i, const __local half *p)
{
    const __local ushort16 *src = (const __local ushort16 *)(p + i * 16);
    return __cvt_16f16_to_16f32(*src);
}
#endif /* __OPENCL_C_VERSION__ < 200 */
/*
 * Scalar vstore_half / vstorea_half, float source.
 *
 * Each helper converts v with __cvt_f32_to_f16_cur (defined elsewhere;
 * presumably "current rounding mode" -- confirm against its definition)
 * and writes the resulting 16-bit pattern to p + i. Both public names are
 * weak aliases of the same static helper, one helper per address space.
 */
extern __attribute__((pure)) ushort __cvt_f32_to_f16_cur(float);

/* Unqualified-pointer variant. */
__attribute__((always_inline)) static void
vsthpf32c(float v, size_t i, half *p)
{
    ushort *dst = (ushort *)(p + i);
    *dst = __cvt_f32_to_f16_cur(v);
}
extern __attribute__((overloadable, weak, alias("vsthpf32c"))) void vstore_half(float, size_t, half *);
extern __attribute__((overloadable, weak, alias("vsthpf32c"))) void vstorea_half(float, size_t, half *);

/* The __global and __local variants are compiled only before OpenCL C 2.0. */
#if __OPENCL_C_VERSION__ < 200
__attribute__((always_inline)) static void
vsthgf32c(float v, size_t i, __global half *p)
{
    __global ushort *dst = (__global ushort *)(p + i);
    *dst = __cvt_f32_to_f16_cur(v);
}
extern __attribute__((overloadable, weak, alias("vsthgf32c"))) void vstore_half(float, size_t, __global half *);
extern __attribute__((overloadable, weak, alias("vsthgf32c"))) void vstorea_half(float, size_t, __global half *);

__attribute__((always_inline)) static void
vsthlf32c(float v, size_t i, __local half *p)
{
    __local ushort *dst = (__local ushort *)(p + i);
    *dst = __cvt_f32_to_f16_cur(v);
}
extern __attribute__((overloadable, weak, alias("vsthlf32c"))) void vstore_half(float, size_t, __local half *);
extern __attribute__((overloadable, weak, alias("vsthlf32c"))) void vstorea_half(float, size_t, __local half *);
#endif /* __OPENCL_C_VERSION__ < 200 */
/*
 * Scalar vstore_half_rte / vstorea_half_rte, float source.
 *
 * Each helper converts v with __cvt_f32_to_f16_rte (defined elsewhere; the
 * rounding it applies is whatever that routine implements) and writes the
 * resulting 16-bit pattern to p + i. Both public names are weak aliases of
 * the same static helper, one helper per address space.
 */
extern __attribute__((pure)) ushort __cvt_f32_to_f16_rte(float);

/* Unqualified-pointer variant. */
__attribute__((always_inline)) static void
vsthpf32e(float v, size_t i, half *p)
{
    ushort *dst = (ushort *)(p + i);
    *dst = __cvt_f32_to_f16_rte(v);
}
extern __attribute__((overloadable, weak, alias("vsthpf32e"))) void vstore_half_rte(float, size_t, half *);
extern __attribute__((overloadable, weak, alias("vsthpf32e"))) void vstorea_half_rte(float, size_t, half *);

/* The __global and __local variants are compiled only before OpenCL C 2.0. */
#if __OPENCL_C_VERSION__ < 200
__attribute__((always_inline)) static void
vsthgf32e(float v, size_t i, __global half *p)
{
    __global ushort *dst = (__global ushort *)(p + i);
    *dst = __cvt_f32_to_f16_rte(v);
}
extern __attribute__((overloadable, weak, alias("vsthgf32e"))) void vstore_half_rte(float, size_t, __global half *);
extern __attribute__((overloadable, weak, alias("vsthgf32e"))) void vstorea_half_rte(float, size_t, __global half *);

__attribute__((always_inline)) static void
vsthlf32e(float v, size_t i, __local half *p)
{
    __local ushort *dst = (__local ushort *)(p + i);
    *dst = __cvt_f32_to_f16_rte(v);
}
extern __attribute__((overloadable, weak, alias("vsthlf32e"))) void vstore_half_rte(float, size_t, __local half *);
extern __attribute__((overloadable, weak, alias("vsthlf32e"))) void vstorea_half_rte(float, size_t, __local half *);
#endif /* __OPENCL_C_VERSION__ < 200 */
/*
 * Scalar vstore_half_rtp / vstorea_half_rtp, float source.
 *
 * Each helper converts v with __cvt_f32_to_f16_rtp (defined elsewhere; the
 * rounding it applies is whatever that routine implements) and writes the
 * resulting 16-bit pattern to p + i. Both public names are weak aliases of
 * the same static helper, one helper per address space.
 */
extern __attribute__((pure)) ushort __cvt_f32_to_f16_rtp(float);

/* Unqualified-pointer variant. */
__attribute__((always_inline)) static void
vsthpf32p(float v, size_t i, half *p)
{
    ushort *dst = (ushort *)(p + i);
    *dst = __cvt_f32_to_f16_rtp(v);
}
extern __attribute__((overloadable, weak, alias("vsthpf32p"))) void vstore_half_rtp(float, size_t, half *);
extern __attribute__((overloadable, weak, alias("vsthpf32p"))) void vstorea_half_rtp(float, size_t, half *);

/* The __global and __local variants are compiled only before OpenCL C 2.0. */
#if __OPENCL_C_VERSION__ < 200
__attribute__((always_inline)) static void
vsthgf32p(float v, size_t i, __global half *p)
{
    __global ushort *dst = (__global ushort *)(p + i);
    *dst = __cvt_f32_to_f16_rtp(v);
}
extern __attribute__((overloadable, weak, alias("vsthgf32p"))) void vstore_half_rtp(float, size_t, __global half *);
extern __attribute__((overloadable, weak, alias("vsthgf32p"))) void vstorea_half_rtp(float, size_t, __global half *);

__attribute__((always_inline)) static void
vsthlf32p(float v, size_t i, __local half *p)
{
    __local ushort *dst = (__local ushort *)(p + i);
    *dst = __cvt_f32_to_f16_rtp(v);
}
extern __attribute__((overloadable, weak, alias("vsthlf32p"))) void vstore_half_rtp(float, size_t, __local half *);
extern __attribute__((overloadable, weak, alias("vsthlf32p"))) void vstorea_half_rtp(float, size_t, __local half *);
#endif /* __OPENCL_C_VERSION__ < 200 */
/*
 * Scalar vstore_half_rtn / vstorea_half_rtn, float source.
 *
 * Each helper converts v with __cvt_f32_to_f16_rtn (defined elsewhere; the
 * rounding it applies is whatever that routine implements) and writes the
 * resulting 16-bit pattern to p + i. Both public names are weak aliases of
 * the same static helper, one helper per address space.
 */
extern __attribute__((pure)) ushort __cvt_f32_to_f16_rtn(float);

/* Unqualified-pointer variant. */
__attribute__((always_inline)) static void
vsthpf32n(float v, size_t i, half *p)
{
    ushort *dst = (ushort *)(p + i);
    *dst = __cvt_f32_to_f16_rtn(v);
}
extern __attribute__((overloadable, weak, alias("vsthpf32n"))) void vstore_half_rtn(float, size_t, half *);
extern __attribute__((overloadable, weak, alias("vsthpf32n"))) void vstorea_half_rtn(float, size_t, half *);

/* The __global and __local variants are compiled only before OpenCL C 2.0. */
#if __OPENCL_C_VERSION__ < 200
__attribute__((always_inline)) static void
vsthgf32n(float v, size_t i, __global half *p)
{
    __global ushort *dst = (__global ushort *)(p + i);
    *dst = __cvt_f32_to_f16_rtn(v);
}
extern __attribute__((overloadable, weak, alias("vsthgf32n"))) void vstore_half_rtn(float, size_t, __global half *);
extern __attribute__((overloadable, weak, alias("vsthgf32n"))) void vstorea_half_rtn(float, size_t, __global half *);

__attribute__((always_inline)) static void
vsthlf32n(float v, size_t i, __local half *p)
{
    __local ushort *dst = (__local ushort *)(p + i);
    *dst = __cvt_f32_to_f16_rtn(v);
}
extern __attribute__((overloadable, weak, alias("vsthlf32n"))) void vstore_half_rtn(float, size_t, __local half *);
extern __attribute__((overloadable, weak, alias("vsthlf32n"))) void vstorea_half_rtn(float, size_t, __local half *);
#endif /* __OPENCL_C_VERSION__ < 200 */
/*
 * Scalar vstore_half_rtz / vstorea_half_rtz, float source.
 *
 * Each helper converts v with __cvt_f32_to_f16_rtz (defined elsewhere; the
 * rounding it applies is whatever that routine implements) and writes the
 * resulting 16-bit pattern to p + i. Both public names are weak aliases of
 * the same static helper, one helper per address space.
 */
extern __attribute__((pure)) ushort __cvt_f32_to_f16_rtz(float);

/* Unqualified-pointer variant. */
__attribute__((always_inline)) static void
vsthpf32z(float v, size_t i, half *p)
{
    ushort *dst = (ushort *)(p + i);
    *dst = __cvt_f32_to_f16_rtz(v);
}
extern __attribute__((overloadable, weak, alias("vsthpf32z"))) void vstore_half_rtz(float, size_t, half *);
extern __attribute__((overloadable, weak, alias("vsthpf32z"))) void vstorea_half_rtz(float, size_t, half *);

/* The __global and __local variants are compiled only before OpenCL C 2.0. */
#if __OPENCL_C_VERSION__ < 200
__attribute__((always_inline)) static void
vsthgf32z(float v, size_t i, __global half *p)
{
    __global ushort *dst = (__global ushort *)(p + i);
    *dst = __cvt_f32_to_f16_rtz(v);
}
extern __attribute__((overloadable, weak, alias("vsthgf32z"))) void vstore_half_rtz(float, size_t, __global half *);
extern __attribute__((overloadable, weak, alias("vsthgf32z"))) void vstorea_half_rtz(float, size_t, __global half *);

__attribute__((always_inline)) static void
vsthlf32z(float v, size_t i, __local half *p)
{
    __local ushort *dst = (__local ushort *)(p + i);
    *dst = __cvt_f32_to_f16_rtz(v);
}
extern __attribute__((overloadable, weak, alias("vsthlf32z"))) void vstore_half_rtz(float, size_t, __local half *);
extern __attribute__((overloadable, weak, alias("vsthlf32z"))) void vstorea_half_rtz(float, size_t, __local half *);
#endif /* __OPENCL_C_VERSION__ < 200 */
/*
 * Scalar vstore_half / vstorea_half, double source.
 *
 * Each helper converts v with __cvt_f64_to_f16_cur (defined elsewhere;
 * presumably "current rounding mode" -- confirm against its definition)
 * and writes the resulting 16-bit pattern to p + i. Both public names are
 * weak aliases of the same static helper, one helper per address space.
 */
extern __attribute__((pure)) ushort __cvt_f64_to_f16_cur(double);

/* Unqualified-pointer variant. */
__attribute__((always_inline)) static void
vsthpf64c(double v, size_t i, half *p)
{
    ushort *dst = (ushort *)(p + i);
    *dst = __cvt_f64_to_f16_cur(v);
}
extern __attribute__((overloadable, weak, alias("vsthpf64c"))) void vstore_half(double, size_t, half *);
extern __attribute__((overloadable, weak, alias("vsthpf64c"))) void vstorea_half(double, size_t, half *);

/* The __global and __local variants are compiled only before OpenCL C 2.0. */
#if __OPENCL_C_VERSION__ < 200
__attribute__((always_inline)) static void
vsthgf64c(double v, size_t i, __global half *p)
{
    __global ushort *dst = (__global ushort *)(p + i);
    *dst = __cvt_f64_to_f16_cur(v);
}
extern __attribute__((overloadable, weak, alias("vsthgf64c"))) void vstore_half(double, size_t, __global half *);
extern __attribute__((overloadable, weak, alias("vsthgf64c"))) void vstorea_half(double, size_t, __global half *);

__attribute__((always_inline)) static void
vsthlf64c(double v, size_t i, __local half *p)
{
    __local ushort *dst = (__local ushort *)(p + i);
    *dst = __cvt_f64_to_f16_cur(v);
}
extern __attribute__((overloadable, weak, alias("vsthlf64c"))) void vstore_half(double, size_t, __local half *);
extern __attribute__((overloadable, weak, alias("vsthlf64c"))) void vstorea_half(double, size_t, __local half *);
#endif /* __OPENCL_C_VERSION__ < 200 */
/*
 * Scalar vstore_half_rte / vstorea_half_rte, double source.
 *
 * Each helper converts v with __cvt_f64_to_f16_rte (defined elsewhere; the
 * rounding it applies is whatever that routine implements) and writes the
 * resulting 16-bit pattern to p + i. Both public names are weak aliases of
 * the same static helper, one helper per address space.
 */
extern __attribute__((pure)) ushort __cvt_f64_to_f16_rte(double);

/* Unqualified-pointer variant. */
__attribute__((always_inline)) static void
vsthpf64e(double v, size_t i, half *p)
{
    ushort *dst = (ushort *)(p + i);
    *dst = __cvt_f64_to_f16_rte(v);
}
extern __attribute__((overloadable, weak, alias("vsthpf64e"))) void vstore_half_rte(double, size_t, half *);
extern __attribute__((overloadable, weak, alias("vsthpf64e"))) void vstorea_half_rte(double, size_t, half *);

/* The __global and __local variants are compiled only before OpenCL C 2.0. */
#if __OPENCL_C_VERSION__ < 200
__attribute__((always_inline)) static void
vsthgf64e(double v, size_t i, __global half *p)
{
    __global ushort *dst = (__global ushort *)(p + i);
    *dst = __cvt_f64_to_f16_rte(v);
}
extern __attribute__((overloadable, weak, alias("vsthgf64e"))) void vstore_half_rte(double, size_t, __global half *);
extern __attribute__((overloadable, weak, alias("vsthgf64e"))) void vstorea_half_rte(double, size_t, __global half *);

__attribute__((always_inline)) static void
vsthlf64e(double v, size_t i, __local half *p)
{
    __local ushort *dst = (__local ushort *)(p + i);
    *dst = __cvt_f64_to_f16_rte(v);
}
extern __attribute__((overloadable, weak, alias("vsthlf64e"))) void vstore_half_rte(double, size_t, __local half *);
extern __attribute__((overloadable, weak, alias("vsthlf64e"))) void vstorea_half_rte(double, size_t, __local half *);
#endif /* __OPENCL_C_VERSION__ < 200 */
/*
 * Scalar vstore_half_rtp / vstorea_half_rtp, double source.
 *
 * Each helper converts v with __cvt_f64_to_f16_rtp (defined elsewhere; the
 * rounding it applies is whatever that routine implements) and writes the
 * resulting 16-bit pattern to p + i. Both public names are weak aliases of
 * the same static helper, one helper per address space.
 */
extern __attribute__((pure)) ushort __cvt_f64_to_f16_rtp(double);

/* Unqualified-pointer variant. */
__attribute__((always_inline)) static void
vsthpf64p(double v, size_t i, half *p)
{
    ushort *dst = (ushort *)(p + i);
    *dst = __cvt_f64_to_f16_rtp(v);
}
extern __attribute__((overloadable, weak, alias("vsthpf64p"))) void vstore_half_rtp(double, size_t, half *);
extern __attribute__((overloadable, weak, alias("vsthpf64p"))) void vstorea_half_rtp(double, size_t, half *);

/* The __global and __local variants are compiled only before OpenCL C 2.0. */
#if __OPENCL_C_VERSION__ < 200
__attribute__((always_inline)) static void
vsthgf64p(double v, size_t i, __global half *p)
{
    __global ushort *dst = (__global ushort *)(p + i);
    *dst = __cvt_f64_to_f16_rtp(v);
}
extern __attribute__((overloadable, weak, alias("vsthgf64p"))) void vstore_half_rtp(double, size_t, __global half *);
extern __attribute__((overloadable, weak, alias("vsthgf64p"))) void vstorea_half_rtp(double, size_t, __global half *);

__attribute__((always_inline)) static void
vsthlf64p(double v, size_t i, __local half *p)
{
    __local ushort *dst = (__local ushort *)(p + i);
    *dst = __cvt_f64_to_f16_rtp(v);
}
extern __attribute__((overloadable, weak, alias("vsthlf64p"))) void vstore_half_rtp(double, size_t, __local half *);
extern __attribute__((overloadable, weak, alias("vsthlf64p"))) void vstorea_half_rtp(double, size_t, __local half *);
#endif /* __OPENCL_C_VERSION__ < 200 */
/*
 * Scalar vstore_half_rtn / vstorea_half_rtn, double source.
 *
 * Each helper converts v with __cvt_f64_to_f16_rtn (defined elsewhere; the
 * rounding it applies is whatever that routine implements) and writes the
 * resulting 16-bit pattern to p + i. Both public names are weak aliases of
 * the same static helper, one helper per address space.
 */
extern __attribute__((pure)) ushort __cvt_f64_to_f16_rtn(double);

/* Unqualified-pointer variant. */
__attribute__((always_inline)) static void
vsthpf64n(double v, size_t i, half *p)
{
    ushort *dst = (ushort *)(p + i);
    *dst = __cvt_f64_to_f16_rtn(v);
}
extern __attribute__((overloadable, weak, alias("vsthpf64n"))) void vstore_half_rtn(double, size_t, half *);
extern __attribute__((overloadable, weak, alias("vsthpf64n"))) void vstorea_half_rtn(double, size_t, half *);

/* The __global and __local variants are compiled only before OpenCL C 2.0. */
#if __OPENCL_C_VERSION__ < 200
__attribute__((always_inline)) static void
vsthgf64n(double v, size_t i, __global half *p)
{
    __global ushort *dst = (__global ushort *)(p + i);
    *dst = __cvt_f64_to_f16_rtn(v);
}
extern __attribute__((overloadable, weak, alias("vsthgf64n"))) void vstore_half_rtn(double, size_t, __global half *);
extern __attribute__((overloadable, weak, alias("vsthgf64n"))) void vstorea_half_rtn(double, size_t, __global half *);

__attribute__((always_inline)) static void
vsthlf64n(double v, size_t i, __local half *p)
{
    __local ushort *dst = (__local ushort *)(p + i);
    *dst = __cvt_f64_to_f16_rtn(v);
}
extern __attribute__((overloadable, weak, alias("vsthlf64n"))) void vstore_half_rtn(double, size_t, __local half *);
extern __attribute__((overloadable, weak, alias("vsthlf64n"))) void vstorea_half_rtn(double, size_t, __local half *);
#endif /* __OPENCL_C_VERSION__ < 200 */
/*
 * Scalar vstore_half_rtz / vstorea_half_rtz, double source.
 *
 * Each helper converts v with __cvt_f64_to_f16_rtz (defined elsewhere; the
 * rounding it applies is whatever that routine implements) and writes the
 * resulting 16-bit pattern to p + i. Both public names are weak aliases of
 * the same static helper, one helper per address space.
 */
extern __attribute__((pure)) ushort __cvt_f64_to_f16_rtz(double);

/* Unqualified-pointer variant. */
__attribute__((always_inline)) static void
vsthpf64z(double v, size_t i, half *p)
{
    ushort *dst = (ushort *)(p + i);
    *dst = __cvt_f64_to_f16_rtz(v);
}
extern __attribute__((overloadable, weak, alias("vsthpf64z"))) void vstore_half_rtz(double, size_t, half *);
extern __attribute__((overloadable, weak, alias("vsthpf64z"))) void vstorea_half_rtz(double, size_t, half *);

/* The __global and __local variants are compiled only before OpenCL C 2.0. */
#if __OPENCL_C_VERSION__ < 200
__attribute__((always_inline)) static void
vsthgf64z(double v, size_t i, __global half *p)
{
    __global ushort *dst = (__global ushort *)(p + i);
    *dst = __cvt_f64_to_f16_rtz(v);
}
extern __attribute__((overloadable, weak, alias("vsthgf64z"))) void vstore_half_rtz(double, size_t, __global half *);
extern __attribute__((overloadable, weak, alias("vsthgf64z"))) void vstorea_half_rtz(double, size_t, __global half *);

__attribute__((always_inline)) static void
vsthlf64z(double v, size_t i, __local half *p)
{
    __local ushort *dst = (__local ushort *)(p + i);
    *dst = __cvt_f64_to_f16_rtz(v);
}
extern __attribute__((overloadable, weak, alias("vsthlf64z"))) void vstore_half_rtz(double, size_t, __local half *);
extern __attribute__((overloadable, weak, alias("vsthlf64z"))) void vstorea_half_rtz(double, size_t, __local half *);
#endif /* __OPENCL_C_VERSION__ < 200 */
/*
 * vstore_half2: convert the float2 v to a ushort2 of 16-bit patterns with
 * __cvt_2f32_to_2f16_cur (defined elsewhere) and write it out with
 * vstore2. One overload per writable address space.
 */
extern __attribute__((pure)) ushort2 __cvt_2f32_to_2f16_cur(float2);

__attribute__((overloadable, always_inline, weak)) void
vstore_half2(float2 v, size_t i, half *p)
{
    ushort2 bits = __cvt_2f32_to_2f16_cur(v);
    vstore2(bits, i, (ushort *)p);
}

/* The __global and __local overloads are compiled only before OpenCL C 2.0. */
#if __OPENCL_C_VERSION__ < 200
__attribute__((overloadable, always_inline, weak)) void
vstore_half2(float2 v, size_t i, __global half *p)
{
    ushort2 bits = __cvt_2f32_to_2f16_cur(v);
    vstore2(bits, i, (__global ushort *)p);
}

__attribute__((overloadable, always_inline, weak)) void
vstore_half2(float2 v, size_t i, __local half *p)
{
    ushort2 bits = __cvt_2f32_to_2f16_cur(v);
    vstore2(bits, i, (__local ushort *)p);
}
#endif /* __OPENCL_C_VERSION__ < 200 */
/*
 * vstore_half2_rte: convert the float2 v to a ushort2 of 16-bit patterns
 * with __cvt_2f32_to_2f16_rte (defined elsewhere) and write it out with
 * vstore2. One overload per writable address space.
 */
extern __attribute__((pure)) ushort2 __cvt_2f32_to_2f16_rte(float2);

__attribute__((overloadable, always_inline, weak)) void
vstore_half2_rte(float2 v, size_t i, half *p)
{
    ushort2 bits = __cvt_2f32_to_2f16_rte(v);
    vstore2(bits, i, (ushort *)p);
}

/* The __global and __local overloads are compiled only before OpenCL C 2.0. */
#if __OPENCL_C_VERSION__ < 200
__attribute__((overloadable, always_inline, weak)) void
vstore_half2_rte(float2 v, size_t i, __global half *p)
{
    ushort2 bits = __cvt_2f32_to_2f16_rte(v);
    vstore2(bits, i, (__global ushort *)p);
}

__attribute__((overloadable, always_inline, weak)) void
vstore_half2_rte(float2 v, size_t i, __local half *p)
{
    ushort2 bits = __cvt_2f32_to_2f16_rte(v);
    vstore2(bits, i, (__local ushort *)p);
}
#endif /* __OPENCL_C_VERSION__ < 200 */
/*
 * vstore_half2_rtp: convert the float2 v to a ushort2 of 16-bit patterns
 * with __cvt_2f32_to_2f16_rtp (defined elsewhere) and write it out with
 * vstore2. One overload per writable address space.
 */
extern __attribute__((pure)) ushort2 __cvt_2f32_to_2f16_rtp(float2);

__attribute__((overloadable, always_inline, weak)) void
vstore_half2_rtp(float2 v, size_t i, half *p)
{
    ushort2 bits = __cvt_2f32_to_2f16_rtp(v);
    vstore2(bits, i, (ushort *)p);
}

/* The __global and __local overloads are compiled only before OpenCL C 2.0. */
#if __OPENCL_C_VERSION__ < 200
__attribute__((overloadable, always_inline, weak)) void
vstore_half2_rtp(float2 v, size_t i, __global half *p)
{
    ushort2 bits = __cvt_2f32_to_2f16_rtp(v);
    vstore2(bits, i, (__global ushort *)p);
}

__attribute__((overloadable, always_inline, weak)) void
vstore_half2_rtp(float2 v, size_t i, __local half *p)
{
    ushort2 bits = __cvt_2f32_to_2f16_rtp(v);
    vstore2(bits, i, (__local ushort *)p);
}
#endif /* __OPENCL_C_VERSION__ < 200 */
/*
 * vstore_half2_rtn: convert the float2 v to a ushort2 of 16-bit patterns
 * with __cvt_2f32_to_2f16_rtn (defined elsewhere) and write it out with
 * vstore2. One overload per writable address space.
 */
extern __attribute__((pure)) ushort2 __cvt_2f32_to_2f16_rtn(float2);

__attribute__((overloadable, always_inline, weak)) void
vstore_half2_rtn(float2 v, size_t i, half *p)
{
    ushort2 bits = __cvt_2f32_to_2f16_rtn(v);
    vstore2(bits, i, (ushort *)p);
}

/* The __global and __local overloads are compiled only before OpenCL C 2.0. */
#if __OPENCL_C_VERSION__ < 200
__attribute__((overloadable, always_inline, weak)) void
vstore_half2_rtn(float2 v, size_t i, __global half *p)
{
    ushort2 bits = __cvt_2f32_to_2f16_rtn(v);
    vstore2(bits, i, (__global ushort *)p);
}

__attribute__((overloadable, always_inline, weak)) void
vstore_half2_rtn(float2 v, size_t i, __local half *p)
{
    ushort2 bits = __cvt_2f32_to_2f16_rtn(v);
    vstore2(bits, i, (__local ushort *)p);
}
#endif /* __OPENCL_C_VERSION__ < 200 */
/*
 * vstore_half2_rtz: convert the float2 v to a ushort2 of 16-bit patterns
 * with __cvt_2f32_to_2f16_rtz (defined elsewhere) and write it out with
 * vstore2. One overload per writable address space.
 */
extern __attribute__((pure)) ushort2 __cvt_2f32_to_2f16_rtz(float2);

__attribute__((overloadable, always_inline, weak)) void
vstore_half2_rtz(float2 v, size_t i, half *p)
{
    ushort2 bits = __cvt_2f32_to_2f16_rtz(v);
    vstore2(bits, i, (ushort *)p);
}

/* The __global and __local overloads are compiled only before OpenCL C 2.0. */
#if __OPENCL_C_VERSION__ < 200
__attribute__((overloadable, always_inline, weak)) void
vstore_half2_rtz(float2 v, size_t i, __global half *p)
{
    ushort2 bits = __cvt_2f32_to_2f16_rtz(v);
    vstore2(bits, i, (__global ushort *)p);
}

__attribute__((overloadable, always_inline, weak)) void
vstore_half2_rtz(float2 v, size_t i, __local half *p)
{
    ushort2 bits = __cvt_2f32_to_2f16_rtz(v);
    vstore2(bits, i, (__local ushort *)p);
}
#endif /* __OPENCL_C_VERSION__ < 200 */
/*
 * vstore_half3: convert the float3 v to a ushort3 of 16-bit patterns with
 * __cvt_3f32_to_3f16_cur (defined elsewhere) and write it out with
 * vstore3. One overload per writable address space.
 */
extern __attribute__((pure)) ushort3 __cvt_3f32_to_3f16_cur(float3);

__attribute__((overloadable, always_inline, weak)) void
vstore_half3(float3 v, size_t i, half *p)
{
    ushort3 bits = __cvt_3f32_to_3f16_cur(v);
    vstore3(bits, i, (ushort *)p);
}

/* The __global and __local overloads are compiled only before OpenCL C 2.0. */
#if __OPENCL_C_VERSION__ < 200
__attribute__((overloadable, always_inline, weak)) void
vstore_half3(float3 v, size_t i, __global half *p)
{
    ushort3 bits = __cvt_3f32_to_3f16_cur(v);
    vstore3(bits, i, (__global ushort *)p);
}

__attribute__((overloadable, always_inline, weak)) void
vstore_half3(float3 v, size_t i, __local half *p)
{
    ushort3 bits = __cvt_3f32_to_3f16_cur(v);
    vstore3(bits, i, (__local ushort *)p);
}
#endif /* __OPENCL_C_VERSION__ < 200 */
/* Unqualified half * overload: run v through __cvt_3f32_to_3f16_rte, then vstore3 the result at index i. */
extern __attribute__((pure)) ushort3 __cvt_3f32_to_3f16_rte(float3);
__attribute__((overloadable, always_inline, weak)) void
vstore_half3_rte(float3 v, size_t i, half *p)
{
    ushort *dst = (ushort *)p;
    ushort3 bits = __cvt_3f32_to_3f16_rte(v);
    vstore3(bits, i, dst);
}
#if __OPENCL_C_VERSION__ < 200
/* __global overload, built only when __OPENCL_C_VERSION__ < 200: run v through __cvt_3f32_to_3f16_rte, then vstore3 the result at index i. */
extern __attribute__((pure)) ushort3 __cvt_3f32_to_3f16_rte(float3);
__attribute__((overloadable, always_inline, weak)) void
vstore_half3_rte(float3 v, size_t i, __global half *p)
{
    __global ushort *dst = (__global ushort *)p;
    ushort3 bits = __cvt_3f32_to_3f16_rte(v);
    vstore3(bits, i, dst);
}
#endif
#if __OPENCL_C_VERSION__ < 200
/* __local overload, built only when __OPENCL_C_VERSION__ < 200: run v through __cvt_3f32_to_3f16_rte, then vstore3 the result at index i. */
extern __attribute__((pure)) ushort3 __cvt_3f32_to_3f16_rte(float3);
__attribute__((overloadable, always_inline, weak)) void
vstore_half3_rte(float3 v, size_t i, __local half *p)
{
    __local ushort *dst = (__local ushort *)p;
    ushort3 bits = __cvt_3f32_to_3f16_rte(v);
    vstore3(bits, i, dst);
}
#endif
/* Unqualified half * overload: run v through __cvt_3f32_to_3f16_rtp, then vstore3 the result at index i. */
extern __attribute__((pure)) ushort3 __cvt_3f32_to_3f16_rtp(float3);
__attribute__((overloadable, always_inline, weak)) void
vstore_half3_rtp(float3 v, size_t i, half *p)
{
    ushort *dst = (ushort *)p;
    ushort3 bits = __cvt_3f32_to_3f16_rtp(v);
    vstore3(bits, i, dst);
}
#if __OPENCL_C_VERSION__ < 200
/* __global overload, built only when __OPENCL_C_VERSION__ < 200: run v through __cvt_3f32_to_3f16_rtp, then vstore3 the result at index i. */
extern __attribute__((pure)) ushort3 __cvt_3f32_to_3f16_rtp(float3);
__attribute__((overloadable, always_inline, weak)) void
vstore_half3_rtp(float3 v, size_t i, __global half *p)
{
    __global ushort *dst = (__global ushort *)p;
    ushort3 bits = __cvt_3f32_to_3f16_rtp(v);
    vstore3(bits, i, dst);
}
#endif
#if __OPENCL_C_VERSION__ < 200
/* __local overload, built only when __OPENCL_C_VERSION__ < 200: run v through __cvt_3f32_to_3f16_rtp, then vstore3 the result at index i. */
extern __attribute__((pure)) ushort3 __cvt_3f32_to_3f16_rtp(float3);
__attribute__((overloadable, always_inline, weak)) void
vstore_half3_rtp(float3 v, size_t i, __local half *p)
{
    __local ushort *dst = (__local ushort *)p;
    ushort3 bits = __cvt_3f32_to_3f16_rtp(v);
    vstore3(bits, i, dst);
}
#endif
/* Unqualified half * overload: run v through __cvt_3f32_to_3f16_rtn, then vstore3 the result at index i. */
extern __attribute__((pure)) ushort3 __cvt_3f32_to_3f16_rtn(float3);
__attribute__((overloadable, always_inline, weak)) void
vstore_half3_rtn(float3 v, size_t i, half *p)
{
    ushort *dst = (ushort *)p;
    ushort3 bits = __cvt_3f32_to_3f16_rtn(v);
    vstore3(bits, i, dst);
}
#if __OPENCL_C_VERSION__ < 200
/* __global overload, built only when __OPENCL_C_VERSION__ < 200: run v through __cvt_3f32_to_3f16_rtn, then vstore3 the result at index i. */
extern __attribute__((pure)) ushort3 __cvt_3f32_to_3f16_rtn(float3);
__attribute__((overloadable, always_inline, weak)) void
vstore_half3_rtn(float3 v, size_t i, __global half *p)
{
    __global ushort *dst = (__global ushort *)p;
    ushort3 bits = __cvt_3f32_to_3f16_rtn(v);
    vstore3(bits, i, dst);
}
#endif
#if __OPENCL_C_VERSION__ < 200
/* __local overload, built only when __OPENCL_C_VERSION__ < 200: run v through __cvt_3f32_to_3f16_rtn, then vstore3 the result at index i. */
extern __attribute__((pure)) ushort3 __cvt_3f32_to_3f16_rtn(float3);
__attribute__((overloadable, always_inline, weak)) void
vstore_half3_rtn(float3 v, size_t i, __local half *p)
{
    __local ushort *dst = (__local ushort *)p;
    ushort3 bits = __cvt_3f32_to_3f16_rtn(v);
    vstore3(bits, i, dst);
}
#endif
/* Unqualified half * overload: run v through __cvt_3f32_to_3f16_rtz, then vstore3 the result at index i. */
extern __attribute__((pure)) ushort3 __cvt_3f32_to_3f16_rtz(float3);
__attribute__((overloadable, always_inline, weak)) void
vstore_half3_rtz(float3 v, size_t i, half *p)
{
    ushort *dst = (ushort *)p;
    ushort3 bits = __cvt_3f32_to_3f16_rtz(v);
    vstore3(bits, i, dst);
}
#if __OPENCL_C_VERSION__ < 200
/* __global overload, built only when __OPENCL_C_VERSION__ < 200: run v through __cvt_3f32_to_3f16_rtz, then vstore3 the result at index i. */
extern __attribute__((pure)) ushort3 __cvt_3f32_to_3f16_rtz(float3);
__attribute__((overloadable, always_inline, weak)) void
vstore_half3_rtz(float3 v, size_t i, __global half *p)
{
    __global ushort *dst = (__global ushort *)p;
    ushort3 bits = __cvt_3f32_to_3f16_rtz(v);
    vstore3(bits, i, dst);
}
#endif
#if __OPENCL_C_VERSION__ < 200
/* __local overload, built only when __OPENCL_C_VERSION__ < 200: run v through __cvt_3f32_to_3f16_rtz, then vstore3 the result at index i. */
extern __attribute__((pure)) ushort3 __cvt_3f32_to_3f16_rtz(float3);
__attribute__((overloadable, always_inline, weak)) void
vstore_half3_rtz(float3 v, size_t i, __local half *p)
{
    __local ushort *dst = (__local ushort *)p;
    ushort3 bits = __cvt_3f32_to_3f16_rtz(v);
    vstore3(bits, i, dst);
}
#endif
/* Unqualified half * overload: run v through __cvt_4f32_to_4f16_cur, then vstore4 the result at index i. */
extern __attribute__((pure)) ushort4 __cvt_4f32_to_4f16_cur(float4);
__attribute__((overloadable, always_inline, weak)) void
vstore_half4(float4 v, size_t i, half *p)
{
    ushort *dst = (ushort *)p;
    ushort4 bits = __cvt_4f32_to_4f16_cur(v);
    vstore4(bits, i, dst);
}
#if __OPENCL_C_VERSION__ < 200
/* __global overload, built only when __OPENCL_C_VERSION__ < 200: run v through __cvt_4f32_to_4f16_cur, then vstore4 the result at index i. */
extern __attribute__((pure)) ushort4 __cvt_4f32_to_4f16_cur(float4);
__attribute__((overloadable, always_inline, weak)) void
vstore_half4(float4 v, size_t i, __global half *p)
{
    __global ushort *dst = (__global ushort *)p;
    ushort4 bits = __cvt_4f32_to_4f16_cur(v);
    vstore4(bits, i, dst);
}
#endif
#if __OPENCL_C_VERSION__ < 200
/* __local overload, built only when __OPENCL_C_VERSION__ < 200: run v through __cvt_4f32_to_4f16_cur, then vstore4 the result at index i. */
extern __attribute__((pure)) ushort4 __cvt_4f32_to_4f16_cur(float4);
__attribute__((overloadable, always_inline, weak)) void
vstore_half4(float4 v, size_t i, __local half *p)
{
    __local ushort *dst = (__local ushort *)p;
    ushort4 bits = __cvt_4f32_to_4f16_cur(v);
    vstore4(bits, i, dst);
}
#endif
/* Unqualified half * overload: run v through __cvt_4f32_to_4f16_rte, then vstore4 the result at index i. */
extern __attribute__((pure)) ushort4 __cvt_4f32_to_4f16_rte(float4);
__attribute__((overloadable, always_inline, weak)) void
vstore_half4_rte(float4 v, size_t i, half *p)
{
    ushort *dst = (ushort *)p;
    ushort4 bits = __cvt_4f32_to_4f16_rte(v);
    vstore4(bits, i, dst);
}
#if __OPENCL_C_VERSION__ < 200
/* __global overload, built only when __OPENCL_C_VERSION__ < 200: run v through __cvt_4f32_to_4f16_rte, then vstore4 the result at index i. */
extern __attribute__((pure)) ushort4 __cvt_4f32_to_4f16_rte(float4);
__attribute__((overloadable, always_inline, weak)) void
vstore_half4_rte(float4 v, size_t i, __global half *p)
{
    __global ushort *dst = (__global ushort *)p;
    ushort4 bits = __cvt_4f32_to_4f16_rte(v);
    vstore4(bits, i, dst);
}
#endif
#if __OPENCL_C_VERSION__ < 200
/* __local overload, built only when __OPENCL_C_VERSION__ < 200: run v through __cvt_4f32_to_4f16_rte, then vstore4 the result at index i. */
extern __attribute__((pure)) ushort4 __cvt_4f32_to_4f16_rte(float4);
__attribute__((overloadable, always_inline, weak)) void
vstore_half4_rte(float4 v, size_t i, __local half *p)
{
    __local ushort *dst = (__local ushort *)p;
    ushort4 bits = __cvt_4f32_to_4f16_rte(v);
    vstore4(bits, i, dst);
}
#endif
/* Unqualified half * overload: run v through __cvt_4f32_to_4f16_rtp, then vstore4 the result at index i. */
extern __attribute__((pure)) ushort4 __cvt_4f32_to_4f16_rtp(float4);
__attribute__((overloadable, always_inline, weak)) void
vstore_half4_rtp(float4 v, size_t i, half *p)
{
    ushort *dst = (ushort *)p;
    ushort4 bits = __cvt_4f32_to_4f16_rtp(v);
    vstore4(bits, i, dst);
}
#if __OPENCL_C_VERSION__ < 200
/* __global overload, built only when __OPENCL_C_VERSION__ < 200: run v through __cvt_4f32_to_4f16_rtp, then vstore4 the result at index i. */
extern __attribute__((pure)) ushort4 __cvt_4f32_to_4f16_rtp(float4);
__attribute__((overloadable, always_inline, weak)) void
vstore_half4_rtp(float4 v, size_t i, __global half *p)
{
    __global ushort *dst = (__global ushort *)p;
    ushort4 bits = __cvt_4f32_to_4f16_rtp(v);
    vstore4(bits, i, dst);
}
#endif
#if __OPENCL_C_VERSION__ < 200
/* __local overload, built only when __OPENCL_C_VERSION__ < 200: run v through __cvt_4f32_to_4f16_rtp, then vstore4 the result at index i. */
extern __attribute__((pure)) ushort4 __cvt_4f32_to_4f16_rtp(float4);
__attribute__((overloadable, always_inline, weak)) void
vstore_half4_rtp(float4 v, size_t i, __local half *p)
{
    __local ushort *dst = (__local ushort *)p;
    ushort4 bits = __cvt_4f32_to_4f16_rtp(v);
    vstore4(bits, i, dst);
}
#endif
/* Unqualified half * overload: run v through __cvt_4f32_to_4f16_rtn, then vstore4 the result at index i. */
extern __attribute__((pure)) ushort4 __cvt_4f32_to_4f16_rtn(float4);
__attribute__((overloadable, always_inline, weak)) void
vstore_half4_rtn(float4 v, size_t i, half *p)
{
    ushort *dst = (ushort *)p;
    ushort4 bits = __cvt_4f32_to_4f16_rtn(v);
    vstore4(bits, i, dst);
}
#if __OPENCL_C_VERSION__ < 200
/* __global overload, built only when __OPENCL_C_VERSION__ < 200: run v through __cvt_4f32_to_4f16_rtn, then vstore4 the result at index i. */
extern __attribute__((pure)) ushort4 __cvt_4f32_to_4f16_rtn(float4);
__attribute__((overloadable, always_inline, weak)) void
vstore_half4_rtn(float4 v, size_t i, __global half *p)
{
    __global ushort *dst = (__global ushort *)p;
    ushort4 bits = __cvt_4f32_to_4f16_rtn(v);
    vstore4(bits, i, dst);
}
#endif
#if __OPENCL_C_VERSION__ < 200
/* __local overload, built only when __OPENCL_C_VERSION__ < 200: run v through __cvt_4f32_to_4f16_rtn, then vstore4 the result at index i. */
extern __attribute__((pure)) ushort4 __cvt_4f32_to_4f16_rtn(float4);
__attribute__((overloadable, always_inline, weak)) void
vstore_half4_rtn(float4 v, size_t i, __local half *p)
{
    __local ushort *dst = (__local ushort *)p;
    ushort4 bits = __cvt_4f32_to_4f16_rtn(v);
    vstore4(bits, i, dst);
}
#endif
/* Unqualified half * overload: run v through __cvt_4f32_to_4f16_rtz, then vstore4 the result at index i. */
extern __attribute__((pure)) ushort4 __cvt_4f32_to_4f16_rtz(float4);
__attribute__((overloadable, always_inline, weak)) void
vstore_half4_rtz(float4 v, size_t i, half *p)
{
    ushort *dst = (ushort *)p;
    ushort4 bits = __cvt_4f32_to_4f16_rtz(v);
    vstore4(bits, i, dst);
}
#if __OPENCL_C_VERSION__ < 200
/* __global overload, built only when __OPENCL_C_VERSION__ < 200: run v through __cvt_4f32_to_4f16_rtz, then vstore4 the result at index i. */
extern __attribute__((pure)) ushort4 __cvt_4f32_to_4f16_rtz(float4);
__attribute__((overloadable, always_inline, weak)) void
vstore_half4_rtz(float4 v, size_t i, __global half *p)
{
    __global ushort *dst = (__global ushort *)p;
    ushort4 bits = __cvt_4f32_to_4f16_rtz(v);
    vstore4(bits, i, dst);
}
#endif
#if __OPENCL_C_VERSION__ < 200
/* __local overload, built only when __OPENCL_C_VERSION__ < 200: run v through __cvt_4f32_to_4f16_rtz, then vstore4 the result at index i. */
extern __attribute__((pure)) ushort4 __cvt_4f32_to_4f16_rtz(float4);
__attribute__((overloadable, always_inline, weak)) void
vstore_half4_rtz(float4 v, size_t i, __local half *p)
{
    __local ushort *dst = (__local ushort *)p;
    ushort4 bits = __cvt_4f32_to_4f16_rtz(v);
    vstore4(bits, i, dst);
}
#endif
/* Unqualified half * overload: run v through __cvt_8f32_to_8f16_cur, then vstore8 the result at index i. */
extern __attribute__((pure)) ushort8 __cvt_8f32_to_8f16_cur(float8);
__attribute__((overloadable, always_inline, weak)) void
vstore_half8(float8 v, size_t i, half *p)
{
    ushort *dst = (ushort *)p;
    ushort8 bits = __cvt_8f32_to_8f16_cur(v);
    vstore8(bits, i, dst);
}
#if __OPENCL_C_VERSION__ < 200
/* __global overload, built only when __OPENCL_C_VERSION__ < 200: run v through __cvt_8f32_to_8f16_cur, then vstore8 the result at index i. */
extern __attribute__((pure)) ushort8 __cvt_8f32_to_8f16_cur(float8);
__attribute__((overloadable, always_inline, weak)) void
vstore_half8(float8 v, size_t i, __global half *p)
{
    __global ushort *dst = (__global ushort *)p;
    ushort8 bits = __cvt_8f32_to_8f16_cur(v);
    vstore8(bits, i, dst);
}
#endif
#if __OPENCL_C_VERSION__ < 200
/* __local overload, built only when __OPENCL_C_VERSION__ < 200: run v through __cvt_8f32_to_8f16_cur, then vstore8 the result at index i. */
extern __attribute__((pure)) ushort8 __cvt_8f32_to_8f16_cur(float8);
__attribute__((overloadable, always_inline, weak)) void
vstore_half8(float8 v, size_t i, __local half *p)
{
    __local ushort *dst = (__local ushort *)p;
    ushort8 bits = __cvt_8f32_to_8f16_cur(v);
    vstore8(bits, i, dst);
}
#endif
/* Unqualified half * overload: run v through __cvt_8f32_to_8f16_rte, then vstore8 the result at index i. */
extern __attribute__((pure)) ushort8 __cvt_8f32_to_8f16_rte(float8);
__attribute__((overloadable, always_inline, weak)) void
vstore_half8_rte(float8 v, size_t i, half *p)
{
    ushort *dst = (ushort *)p;
    ushort8 bits = __cvt_8f32_to_8f16_rte(v);
    vstore8(bits, i, dst);
}
#if __OPENCL_C_VERSION__ < 200
/* __global overload, built only when __OPENCL_C_VERSION__ < 200: run v through __cvt_8f32_to_8f16_rte, then vstore8 the result at index i. */
extern __attribute__((pure)) ushort8 __cvt_8f32_to_8f16_rte(float8);
__attribute__((overloadable, always_inline, weak)) void
vstore_half8_rte(float8 v, size_t i, __global half *p)
{
    __global ushort *dst = (__global ushort *)p;
    ushort8 bits = __cvt_8f32_to_8f16_rte(v);
    vstore8(bits, i, dst);
}
#endif
#if __OPENCL_C_VERSION__ < 200
/* __local overload, built only when __OPENCL_C_VERSION__ < 200: run v through __cvt_8f32_to_8f16_rte, then vstore8 the result at index i. */
extern __attribute__((pure)) ushort8 __cvt_8f32_to_8f16_rte(float8);
__attribute__((overloadable, always_inline, weak)) void
vstore_half8_rte(float8 v, size_t i, __local half *p)
{
    __local ushort *dst = (__local ushort *)p;
    ushort8 bits = __cvt_8f32_to_8f16_rte(v);
    vstore8(bits, i, dst);
}
#endif
/* Unqualified half * overload: run v through __cvt_8f32_to_8f16_rtp, then vstore8 the result at index i. */
extern __attribute__((pure)) ushort8 __cvt_8f32_to_8f16_rtp(float8);
__attribute__((overloadable, always_inline, weak)) void
vstore_half8_rtp(float8 v, size_t i, half *p)
{
    ushort *dst = (ushort *)p;
    ushort8 bits = __cvt_8f32_to_8f16_rtp(v);
    vstore8(bits, i, dst);
}
#if __OPENCL_C_VERSION__ < 200
/* __global overload, built only when __OPENCL_C_VERSION__ < 200: run v through __cvt_8f32_to_8f16_rtp, then vstore8 the result at index i. */
extern __attribute__((pure)) ushort8 __cvt_8f32_to_8f16_rtp(float8);
__attribute__((overloadable, always_inline, weak)) void
vstore_half8_rtp(float8 v, size_t i, __global half *p)
{
    __global ushort *dst = (__global ushort *)p;
    ushort8 bits = __cvt_8f32_to_8f16_rtp(v);
    vstore8(bits, i, dst);
}
#endif
#if __OPENCL_C_VERSION__ < 200
/* __local overload, built only when __OPENCL_C_VERSION__ < 200: run v through __cvt_8f32_to_8f16_rtp, then vstore8 the result at index i. */
extern __attribute__((pure)) ushort8 __cvt_8f32_to_8f16_rtp(float8);
__attribute__((overloadable, always_inline, weak)) void
vstore_half8_rtp(float8 v, size_t i, __local half *p)
{
    __local ushort *dst = (__local ushort *)p;
    ushort8 bits = __cvt_8f32_to_8f16_rtp(v);
    vstore8(bits, i, dst);
}
#endif
/* Unqualified half * overload: run v through __cvt_8f32_to_8f16_rtn, then vstore8 the result at index i. */
extern __attribute__((pure)) ushort8 __cvt_8f32_to_8f16_rtn(float8);
__attribute__((overloadable, always_inline, weak)) void
vstore_half8_rtn(float8 v, size_t i, half *p)
{
    ushort *dst = (ushort *)p;
    ushort8 bits = __cvt_8f32_to_8f16_rtn(v);
    vstore8(bits, i, dst);
}
#if __OPENCL_C_VERSION__ < 200
/* __global overload, built only when __OPENCL_C_VERSION__ < 200: run v through __cvt_8f32_to_8f16_rtn, then vstore8 the result at index i. */
extern __attribute__((pure)) ushort8 __cvt_8f32_to_8f16_rtn(float8);
__attribute__((overloadable, always_inline, weak)) void
vstore_half8_rtn(float8 v, size_t i, __global half *p)
{
    __global ushort *dst = (__global ushort *)p;
    ushort8 bits = __cvt_8f32_to_8f16_rtn(v);
    vstore8(bits, i, dst);
}
#endif
#if __OPENCL_C_VERSION__ < 200
/* __local overload, built only when __OPENCL_C_VERSION__ < 200: run v through __cvt_8f32_to_8f16_rtn, then vstore8 the result at index i. */
extern __attribute__((pure)) ushort8 __cvt_8f32_to_8f16_rtn(float8);
__attribute__((overloadable, always_inline, weak)) void
vstore_half8_rtn(float8 v, size_t i, __local half *p)
{
    __local ushort *dst = (__local ushort *)p;
    ushort8 bits = __cvt_8f32_to_8f16_rtn(v);
    vstore8(bits, i, dst);
}
#endif
/* Unqualified half * overload: run v through __cvt_8f32_to_8f16_rtz, then vstore8 the result at index i. */
extern __attribute__((pure)) ushort8 __cvt_8f32_to_8f16_rtz(float8);
__attribute__((overloadable, always_inline, weak)) void
vstore_half8_rtz(float8 v, size_t i, half *p)
{
    ushort *dst = (ushort *)p;
    ushort8 bits = __cvt_8f32_to_8f16_rtz(v);
    vstore8(bits, i, dst);
}
#if __OPENCL_C_VERSION__ < 200
/* __global overload, built only when __OPENCL_C_VERSION__ < 200: run v through __cvt_8f32_to_8f16_rtz, then vstore8 the result at index i. */
extern __attribute__((pure)) ushort8 __cvt_8f32_to_8f16_rtz(float8);
__attribute__((overloadable, always_inline, weak)) void
vstore_half8_rtz(float8 v, size_t i, __global half *p)
{
    __global ushort *dst = (__global ushort *)p;
    ushort8 bits = __cvt_8f32_to_8f16_rtz(v);
    vstore8(bits, i, dst);
}
#endif
#if __OPENCL_C_VERSION__ < 200
/* __local overload, built only when __OPENCL_C_VERSION__ < 200: run v through __cvt_8f32_to_8f16_rtz, then vstore8 the result at index i. */
extern __attribute__((pure)) ushort8 __cvt_8f32_to_8f16_rtz(float8);
__attribute__((overloadable, always_inline, weak)) void
vstore_half8_rtz(float8 v, size_t i, __local half *p)
{
    __local ushort *dst = (__local ushort *)p;
    ushort8 bits = __cvt_8f32_to_8f16_rtz(v);
    vstore8(bits, i, dst);
}
#endif
/* Unqualified half * overload: run v through __cvt_16f32_to_16f16_cur, then vstore16 the result at index i. */
extern __attribute__((pure)) ushort16 __cvt_16f32_to_16f16_cur(float16);
__attribute__((overloadable, always_inline, weak)) void
vstore_half16(float16 v, size_t i, half *p)
{
    ushort *dst = (ushort *)p;
    ushort16 bits = __cvt_16f32_to_16f16_cur(v);
    vstore16(bits, i, dst);
}
#if __OPENCL_C_VERSION__ < 200
/* __global overload, built only when __OPENCL_C_VERSION__ < 200: run v through __cvt_16f32_to_16f16_cur, then vstore16 the result at index i. */
extern __attribute__((pure)) ushort16 __cvt_16f32_to_16f16_cur(float16);
__attribute__((overloadable, always_inline, weak)) void
vstore_half16(float16 v, size_t i, __global half *p)
{
    __global ushort *dst = (__global ushort *)p;
    ushort16 bits = __cvt_16f32_to_16f16_cur(v);
    vstore16(bits, i, dst);
}
#endif
#if __OPENCL_C_VERSION__ < 200
/* __local overload, built only when __OPENCL_C_VERSION__ < 200: run v through __cvt_16f32_to_16f16_cur, then vstore16 the result at index i. */
extern __attribute__((pure)) ushort16 __cvt_16f32_to_16f16_cur(float16);
__attribute__((overloadable, always_inline, weak)) void
vstore_half16(float16 v, size_t i, __local half *p)
{
    __local ushort *dst = (__local ushort *)p;
    ushort16 bits = __cvt_16f32_to_16f16_cur(v);
    vstore16(bits, i, dst);
}
#endif
/* Unqualified half * overload: run v through __cvt_16f32_to_16f16_rte, then vstore16 the result at index i. */
extern __attribute__((pure)) ushort16 __cvt_16f32_to_16f16_rte(float16);
__attribute__((overloadable, always_inline, weak)) void
vstore_half16_rte(float16 v, size_t i, half *p)
{
    ushort *dst = (ushort *)p;
    ushort16 bits = __cvt_16f32_to_16f16_rte(v);
    vstore16(bits, i, dst);
}
#if __OPENCL_C_VERSION__ < 200
/* __global overload, built only when __OPENCL_C_VERSION__ < 200: run v through __cvt_16f32_to_16f16_rte, then vstore16 the result at index i. */
extern __attribute__((pure)) ushort16 __cvt_16f32_to_16f16_rte(float16);
__attribute__((overloadable, always_inline, weak)) void
vstore_half16_rte(float16 v, size_t i, __global half *p)
{
    __global ushort *dst = (__global ushort *)p;
    ushort16 bits = __cvt_16f32_to_16f16_rte(v);
    vstore16(bits, i, dst);
}
#endif
#if __OPENCL_C_VERSION__ < 200
/* __local overload, built only when __OPENCL_C_VERSION__ < 200: run v through __cvt_16f32_to_16f16_rte, then vstore16 the result at index i. */
extern __attribute__((pure)) ushort16 __cvt_16f32_to_16f16_rte(float16);
__attribute__((overloadable, always_inline, weak)) void
vstore_half16_rte(float16 v, size_t i, __local half *p)
{
    __local ushort *dst = (__local ushort *)p;
    ushort16 bits = __cvt_16f32_to_16f16_rte(v);
    vstore16(bits, i, dst);
}
#endif
/* Unqualified half * overload: run v through __cvt_16f32_to_16f16_rtp, then vstore16 the result at index i. */
extern __attribute__((pure)) ushort16 __cvt_16f32_to_16f16_rtp(float16);
__attribute__((overloadable, always_inline, weak)) void
vstore_half16_rtp(float16 v, size_t i, half *p)
{
    ushort *dst = (ushort *)p;
    ushort16 bits = __cvt_16f32_to_16f16_rtp(v);
    vstore16(bits, i, dst);
}
#if __OPENCL_C_VERSION__ < 200
/* __global overload, built only when __OPENCL_C_VERSION__ < 200: run v through __cvt_16f32_to_16f16_rtp, then vstore16 the result at index i. */
extern __attribute__((pure)) ushort16 __cvt_16f32_to_16f16_rtp(float16);
__attribute__((overloadable, always_inline, weak)) void
vstore_half16_rtp(float16 v, size_t i, __global half *p)
{
    __global ushort *dst = (__global ushort *)p;
    ushort16 bits = __cvt_16f32_to_16f16_rtp(v);
    vstore16(bits, i, dst);
}
#endif
#if __OPENCL_C_VERSION__ < 200
/* __local overload, built only when __OPENCL_C_VERSION__ < 200: run v through __cvt_16f32_to_16f16_rtp, then vstore16 the result at index i. */
extern __attribute__((pure)) ushort16 __cvt_16f32_to_16f16_rtp(float16);
__attribute__((overloadable, always_inline, weak)) void
vstore_half16_rtp(float16 v, size_t i, __local half *p)
{
    __local ushort *dst = (__local ushort *)p;
    ushort16 bits = __cvt_16f32_to_16f16_rtp(v);
    vstore16(bits, i, dst);
}
#endif
/* Unqualified half * overload: run v through __cvt_16f32_to_16f16_rtn, then vstore16 the result at index i. */
extern __attribute__((pure)) ushort16 __cvt_16f32_to_16f16_rtn(float16);
__attribute__((overloadable, always_inline, weak)) void
vstore_half16_rtn(float16 v, size_t i, half *p)
{
    ushort *dst = (ushort *)p;
    ushort16 bits = __cvt_16f32_to_16f16_rtn(v);
    vstore16(bits, i, dst);
}
#if __OPENCL_C_VERSION__ < 200
/* __global overload, built only when __OPENCL_C_VERSION__ < 200: run v through __cvt_16f32_to_16f16_rtn, then vstore16 the result at index i. */
extern __attribute__((pure)) ushort16 __cvt_16f32_to_16f16_rtn(float16);
__attribute__((overloadable, always_inline, weak)) void
vstore_half16_rtn(float16 v, size_t i, __global half *p)
{
    __global ushort *dst = (__global ushort *)p;
    ushort16 bits = __cvt_16f32_to_16f16_rtn(v);
    vstore16(bits, i, dst);
}
#endif
#if __OPENCL_C_VERSION__ < 200
/* __local overload, built only when __OPENCL_C_VERSION__ < 200: run v through __cvt_16f32_to_16f16_rtn, then vstore16 the result at index i. */
extern __attribute__((pure)) ushort16 __cvt_16f32_to_16f16_rtn(float16);
__attribute__((overloadable, always_inline, weak)) void
vstore_half16_rtn(float16 v, size_t i, __local half *p)
{
    __local ushort *dst = (__local ushort *)p;
    ushort16 bits = __cvt_16f32_to_16f16_rtn(v);
    vstore16(bits, i, dst);
}
#endif
/* Unqualified half * overload: run v through __cvt_16f32_to_16f16_rtz, then vstore16 the result at index i. */
extern __attribute__((pure)) ushort16 __cvt_16f32_to_16f16_rtz(float16);
__attribute__((overloadable, always_inline, weak)) void
vstore_half16_rtz(float16 v, size_t i, half *p)
{
    ushort *dst = (ushort *)p;
    ushort16 bits = __cvt_16f32_to_16f16_rtz(v);
    vstore16(bits, i, dst);
}
#if __OPENCL_C_VERSION__ < 200
/* __global overload, built only when __OPENCL_C_VERSION__ < 200: run v through __cvt_16f32_to_16f16_rtz, then vstore16 the result at index i. */
extern __attribute__((pure)) ushort16 __cvt_16f32_to_16f16_rtz(float16);
__attribute__((overloadable, always_inline, weak)) void
vstore_half16_rtz(float16 v, size_t i, __global half *p)
{
    __global ushort *dst = (__global ushort *)p;
    ushort16 bits = __cvt_16f32_to_16f16_rtz(v);
    vstore16(bits, i, dst);
}
#endif
#if __OPENCL_C_VERSION__ < 200
/* __local overload, built only when __OPENCL_C_VERSION__ < 200: run v through __cvt_16f32_to_16f16_rtz, then vstore16 the result at index i. */
extern __attribute__((pure)) ushort16 __cvt_16f32_to_16f16_rtz(float16);
__attribute__((overloadable, always_inline, weak)) void
vstore_half16_rtz(float16 v, size_t i, __local half *p)
{
    __local ushort *dst = (__local ushort *)p;
    ushort16 bits = __cvt_16f32_to_16f16_rtz(v);
    vstore16(bits, i, dst);
}
#endif
/* Unqualified half * overload: run v through __cvt_2f64_to_2f16_cur, then vstore2 the result at index i. */
extern __attribute__((pure)) ushort2 __cvt_2f64_to_2f16_cur(double2);
__attribute__((overloadable, always_inline, weak)) void
vstore_half2(double2 v, size_t i, half *p)
{
    ushort *dst = (ushort *)p;
    ushort2 bits = __cvt_2f64_to_2f16_cur(v);
    vstore2(bits, i, dst);
}
#if __OPENCL_C_VERSION__ < 200
/* __global overload, built only when __OPENCL_C_VERSION__ < 200: run v through __cvt_2f64_to_2f16_cur, then vstore2 the result at index i. */
extern __attribute__((pure)) ushort2 __cvt_2f64_to_2f16_cur(double2);
__attribute__((overloadable, always_inline, weak)) void
vstore_half2(double2 v, size_t i, __global half *p)
{
    __global ushort *dst = (__global ushort *)p;
    ushort2 bits = __cvt_2f64_to_2f16_cur(v);
    vstore2(bits, i, dst);
}
#endif
#if __OPENCL_C_VERSION__ < 200
/* __local overload, built only when __OPENCL_C_VERSION__ < 200: run v through __cvt_2f64_to_2f16_cur, then vstore2 the result at index i. */
extern __attribute__((pure)) ushort2 __cvt_2f64_to_2f16_cur(double2);
__attribute__((overloadable, always_inline, weak)) void
vstore_half2(double2 v, size_t i, __local half *p)
{
    __local ushort *dst = (__local ushort *)p;
    ushort2 bits = __cvt_2f64_to_2f16_cur(v);
    vstore2(bits, i, dst);
}
#endif
/* Unqualified half * overload: run v through __cvt_2f64_to_2f16_rte, then vstore2 the result at index i. */
extern __attribute__((pure)) ushort2 __cvt_2f64_to_2f16_rte(double2);
__attribute__((overloadable, always_inline, weak)) void
vstore_half2_rte(double2 v, size_t i, half *p)
{
    ushort *dst = (ushort *)p;
    ushort2 bits = __cvt_2f64_to_2f16_rte(v);
    vstore2(bits, i, dst);
}
#if __OPENCL_C_VERSION__ < 200
/* __global overload, built only when __OPENCL_C_VERSION__ < 200: run v through __cvt_2f64_to_2f16_rte, then vstore2 the result at index i. */
extern __attribute__((pure)) ushort2 __cvt_2f64_to_2f16_rte(double2);
__attribute__((overloadable, always_inline, weak)) void
vstore_half2_rte(double2 v, size_t i, __global half *p)
{
    __global ushort *dst = (__global ushort *)p;
    ushort2 bits = __cvt_2f64_to_2f16_rte(v);
    vstore2(bits, i, dst);
}
#endif
#if __OPENCL_C_VERSION__ < 200
/* __local overload, built only when __OPENCL_C_VERSION__ < 200: run v through __cvt_2f64_to_2f16_rte, then vstore2 the result at index i. */
extern __attribute__((pure)) ushort2 __cvt_2f64_to_2f16_rte(double2);
__attribute__((overloadable, always_inline, weak)) void
vstore_half2_rte(double2 v, size_t i, __local half *p)
{
    __local ushort *dst = (__local ushort *)p;
    ushort2 bits = __cvt_2f64_to_2f16_rte(v);
    vstore2(bits, i, dst);
}
#endif
/* Unqualified half * overload: run v through __cvt_2f64_to_2f16_rtp, then vstore2 the result at index i. */
extern __attribute__((pure)) ushort2 __cvt_2f64_to_2f16_rtp(double2);
__attribute__((overloadable, always_inline, weak)) void
vstore_half2_rtp(double2 v, size_t i, half *p)
{
    ushort *dst = (ushort *)p;
    ushort2 bits = __cvt_2f64_to_2f16_rtp(v);
    vstore2(bits, i, dst);
}
#if __OPENCL_C_VERSION__ < 200
/* __global overload, built only when __OPENCL_C_VERSION__ < 200: run v through __cvt_2f64_to_2f16_rtp, then vstore2 the result at index i. */
extern __attribute__((pure)) ushort2 __cvt_2f64_to_2f16_rtp(double2);
__attribute__((overloadable, always_inline, weak)) void
vstore_half2_rtp(double2 v, size_t i, __global half *p)
{
    __global ushort *dst = (__global ushort *)p;
    ushort2 bits = __cvt_2f64_to_2f16_rtp(v);
    vstore2(bits, i, dst);
}
#endif
#if __OPENCL_C_VERSION__ < 200
/* __local overload, built only when __OPENCL_C_VERSION__ < 200: run v through __cvt_2f64_to_2f16_rtp, then vstore2 the result at index i. */
extern __attribute__((pure)) ushort2 __cvt_2f64_to_2f16_rtp(double2);
__attribute__((overloadable, always_inline, weak)) void
vstore_half2_rtp(double2 v, size_t i, __local half *p)
{
    __local ushort *dst = (__local ushort *)p;
    ushort2 bits = __cvt_2f64_to_2f16_rtp(v);
    vstore2(bits, i, dst);
}
#endif
/* Unqualified half * overload: run v through __cvt_2f64_to_2f16_rtn, then vstore2 the result at index i. */
extern __attribute__((pure)) ushort2 __cvt_2f64_to_2f16_rtn(double2);
__attribute__((overloadable, always_inline, weak)) void
vstore_half2_rtn(double2 v, size_t i, half *p)
{
    ushort *dst = (ushort *)p;
    ushort2 bits = __cvt_2f64_to_2f16_rtn(v);
    vstore2(bits, i, dst);
}
#if __OPENCL_C_VERSION__ < 200
/* __global overload, built only when __OPENCL_C_VERSION__ < 200: run v through __cvt_2f64_to_2f16_rtn, then vstore2 the result at index i. */
extern __attribute__((pure)) ushort2 __cvt_2f64_to_2f16_rtn(double2);
__attribute__((overloadable, always_inline, weak)) void
vstore_half2_rtn(double2 v, size_t i, __global half *p)
{
    __global ushort *dst = (__global ushort *)p;
    ushort2 bits = __cvt_2f64_to_2f16_rtn(v);
    vstore2(bits, i, dst);
}
#endif
#if __OPENCL_C_VERSION__ < 200
/* __local overload, built only when __OPENCL_C_VERSION__ < 200: run v through __cvt_2f64_to_2f16_rtn, then vstore2 the result at index i. */
extern __attribute__((pure)) ushort2 __cvt_2f64_to_2f16_rtn(double2);
__attribute__((overloadable, always_inline, weak)) void
vstore_half2_rtn(double2 v, size_t i, __local half *p)
{
    __local ushort *dst = (__local ushort *)p;
    ushort2 bits = __cvt_2f64_to_2f16_rtn(v);
    vstore2(bits, i, dst);
}
#endif
/* Unqualified half * overload: run v through __cvt_2f64_to_2f16_rtz, then vstore2 the result at index i. */
extern __attribute__((pure)) ushort2 __cvt_2f64_to_2f16_rtz(double2);
__attribute__((overloadable, always_inline, weak)) void
vstore_half2_rtz(double2 v, size_t i, half *p)
{
    ushort *dst = (ushort *)p;
    ushort2 bits = __cvt_2f64_to_2f16_rtz(v);
    vstore2(bits, i, dst);
}
#if __OPENCL_C_VERSION__ < 200
/* __global overload, built only when __OPENCL_C_VERSION__ < 200: run v through __cvt_2f64_to_2f16_rtz, then vstore2 the result at index i. */
extern __attribute__((pure)) ushort2 __cvt_2f64_to_2f16_rtz(double2);
__attribute__((overloadable, always_inline, weak)) void
vstore_half2_rtz(double2 v, size_t i, __global half *p)
{
    __global ushort *dst = (__global ushort *)p;
    ushort2 bits = __cvt_2f64_to_2f16_rtz(v);
    vstore2(bits, i, dst);
}
#endif
#if __OPENCL_C_VERSION__ < 200
/* __local overload, built only when __OPENCL_C_VERSION__ < 200: run v through __cvt_2f64_to_2f16_rtz, then vstore2 the result at index i. */
extern __attribute__((pure)) ushort2 __cvt_2f64_to_2f16_rtz(double2);
__attribute__((overloadable, always_inline, weak)) void
vstore_half2_rtz(double2 v, size_t i, __local half *p)
{
    __local ushort *dst = (__local ushort *)p;
    ushort2 bits = __cvt_2f64_to_2f16_rtz(v);
    vstore2(bits, i, dst);
}
#endif
/* Unqualified half * overload: run v through __cvt_3f64_to_3f16_cur, then vstore3 the result at index i. */
extern __attribute__((pure)) ushort3 __cvt_3f64_to_3f16_cur(double3);
__attribute__((overloadable, always_inline, weak)) void
vstore_half3(double3 v, size_t i, half *p)
{
    ushort *dst = (ushort *)p;
    ushort3 bits = __cvt_3f64_to_3f16_cur(v);
    vstore3(bits, i, dst);
}
#if __OPENCL_C_VERSION__ < 200
/* __global overload, built only when __OPENCL_C_VERSION__ < 200: run v through __cvt_3f64_to_3f16_cur, then vstore3 the result at index i. */
extern __attribute__((pure)) ushort3 __cvt_3f64_to_3f16_cur(double3);
__attribute__((overloadable, always_inline, weak)) void
vstore_half3(double3 v, size_t i, __global half *p)
{
    __global ushort *dst = (__global ushort *)p;
    ushort3 bits = __cvt_3f64_to_3f16_cur(v);
    vstore3(bits, i, dst);
}
#endif
#if __OPENCL_C_VERSION__ < 200
/* __local overload, built only when __OPENCL_C_VERSION__ < 200: run v through __cvt_3f64_to_3f16_cur, then vstore3 the result at index i. */
extern __attribute__((pure)) ushort3 __cvt_3f64_to_3f16_cur(double3);
__attribute__((overloadable, always_inline, weak)) void
vstore_half3(double3 v, size_t i, __local half *p)
{
    __local ushort *dst = (__local ushort *)p;
    ushort3 bits = __cvt_3f64_to_3f16_cur(v);
    vstore3(bits, i, dst);
}
#endif
/* Unqualified half * overload: run v through __cvt_3f64_to_3f16_rte, then vstore3 the result at index i. */
extern __attribute__((pure)) ushort3 __cvt_3f64_to_3f16_rte(double3);
__attribute__((overloadable, always_inline, weak)) void
vstore_half3_rte(double3 v, size_t i, half *p)
{
    ushort *dst = (ushort *)p;
    ushort3 bits = __cvt_3f64_to_3f16_rte(v);
    vstore3(bits, i, dst);
}
#if __OPENCL_C_VERSION__ < 200
/* __global overload, built only when __OPENCL_C_VERSION__ < 200: run v through __cvt_3f64_to_3f16_rte, then vstore3 the result at index i. */
extern __attribute__((pure)) ushort3 __cvt_3f64_to_3f16_rte(double3);
__attribute__((overloadable, always_inline, weak)) void
vstore_half3_rte(double3 v, size_t i, __global half *p)
{
    __global ushort *dst = (__global ushort *)p;
    ushort3 bits = __cvt_3f64_to_3f16_rte(v);
    vstore3(bits, i, dst);
}
#endif
#if __OPENCL_C_VERSION__ < 200
/* __local overload, built only when __OPENCL_C_VERSION__ < 200: run v through __cvt_3f64_to_3f16_rte, then vstore3 the result at index i. */
extern __attribute__((pure)) ushort3 __cvt_3f64_to_3f16_rte(double3);
__attribute__((overloadable, always_inline, weak)) void
vstore_half3_rte(double3 v, size_t i, __local half *p)
{
    __local ushort *dst = (__local ushort *)p;
    ushort3 bits = __cvt_3f64_to_3f16_rte(v);
    vstore3(bits, i, dst);
}
#endif
/* Unqualified half * overload: run v through __cvt_3f64_to_3f16_rtp, then vstore3 the result at index i. */
extern __attribute__((pure)) ushort3 __cvt_3f64_to_3f16_rtp(double3);
__attribute__((overloadable, always_inline, weak)) void
vstore_half3_rtp(double3 v, size_t i, half *p)
{
    ushort *dst = (ushort *)p;
    ushort3 bits = __cvt_3f64_to_3f16_rtp(v);
    vstore3(bits, i, dst);
}
#if __OPENCL_C_VERSION__ < 200
/* __global overload, built only when __OPENCL_C_VERSION__ < 200: run v through __cvt_3f64_to_3f16_rtp, then vstore3 the result at index i. */
extern __attribute__((pure)) ushort3 __cvt_3f64_to_3f16_rtp(double3);
__attribute__((overloadable, always_inline, weak)) void
vstore_half3_rtp(double3 v, size_t i, __global half *p)
{
    __global ushort *dst = (__global ushort *)p;
    ushort3 bits = __cvt_3f64_to_3f16_rtp(v);
    vstore3(bits, i, dst);
}
#endif
#if __OPENCL_C_VERSION__ < 200
/* __local overload, built only when __OPENCL_C_VERSION__ < 200: run v through __cvt_3f64_to_3f16_rtp, then vstore3 the result at index i. */
extern __attribute__((pure)) ushort3 __cvt_3f64_to_3f16_rtp(double3);
__attribute__((overloadable, always_inline, weak)) void
vstore_half3_rtp(double3 v, size_t i, __local half *p)
{
    __local ushort *dst = (__local ushort *)p;
    ushort3 bits = __cvt_3f64_to_3f16_rtp(v);
    vstore3(bits, i, dst);
}
#endif
/* Unqualified half * overload: run v through __cvt_3f64_to_3f16_rtn, then vstore3 the result at index i. */
extern __attribute__((pure)) ushort3 __cvt_3f64_to_3f16_rtn(double3);
__attribute__((overloadable, always_inline, weak)) void
vstore_half3_rtn(double3 v, size_t i, half *p)
{
    ushort *dst = (ushort *)p;
    ushort3 bits = __cvt_3f64_to_3f16_rtn(v);
    vstore3(bits, i, dst);
}
#if __OPENCL_C_VERSION__ < 200
/* __global overload, built only when __OPENCL_C_VERSION__ < 200: run v through __cvt_3f64_to_3f16_rtn, then vstore3 the result at index i. */
extern __attribute__((pure)) ushort3 __cvt_3f64_to_3f16_rtn(double3);
__attribute__((overloadable, always_inline, weak)) void
vstore_half3_rtn(double3 v, size_t i, __global half *p)
{
    __global ushort *dst = (__global ushort *)p;
    ushort3 bits = __cvt_3f64_to_3f16_rtn(v);
    vstore3(bits, i, dst);
}
#endif
#if __OPENCL_C_VERSION__ < 200
/* __local overload, built only when __OPENCL_C_VERSION__ < 200: run v through __cvt_3f64_to_3f16_rtn, then vstore3 the result at index i. */
extern __attribute__((pure)) ushort3 __cvt_3f64_to_3f16_rtn(double3);
__attribute__((overloadable, always_inline, weak)) void
vstore_half3_rtn(double3 v, size_t i, __local half *p)
{
    __local ushort *dst = (__local ushort *)p;
    ushort3 bits = __cvt_3f64_to_3f16_rtn(v);
    vstore3(bits, i, dst);
}
#endif
/* Unqualified half * overload: run v through __cvt_3f64_to_3f16_rtz, then vstore3 the result at index i. */
extern __attribute__((pure)) ushort3 __cvt_3f64_to_3f16_rtz(double3);
__attribute__((overloadable, always_inline, weak)) void
vstore_half3_rtz(double3 v, size_t i, half *p)
{
    ushort *dst = (ushort *)p;
    ushort3 bits = __cvt_3f64_to_3f16_rtz(v);
    vstore3(bits, i, dst);
}
#if __OPENCL_C_VERSION__ < 200
/* __global overload, built only when __OPENCL_C_VERSION__ < 200: run v through __cvt_3f64_to_3f16_rtz, then vstore3 the result at index i. */
extern __attribute__((pure)) ushort3 __cvt_3f64_to_3f16_rtz(double3);
__attribute__((overloadable, always_inline, weak)) void
vstore_half3_rtz(double3 v, size_t i, __global half *p)
{
    __global ushort *dst = (__global ushort *)p;
    ushort3 bits = __cvt_3f64_to_3f16_rtz(v);
    vstore3(bits, i, dst);
}
#endif
#if __OPENCL_C_VERSION__ < 200
/* __local overload, built only when __OPENCL_C_VERSION__ < 200: run v through __cvt_3f64_to_3f16_rtz, then vstore3 the result at index i. */
extern __attribute__((pure)) ushort3 __cvt_3f64_to_3f16_rtz(double3);
__attribute__((overloadable, always_inline, weak)) void
vstore_half3_rtz(double3 v, size_t i, __local half *p)
{
    __local ushort *dst = (__local ushort *)p;
    ushort3 bits = __cvt_3f64_to_3f16_rtz(v);
    vstore3(bits, i, dst);
}
#endif
/* Unqualified half * overload: run v through __cvt_4f64_to_4f16_cur, then vstore4 the result at index i. */
extern __attribute__((pure)) ushort4 __cvt_4f64_to_4f16_cur(double4);
__attribute__((overloadable, always_inline, weak)) void
vstore_half4(double4 v, size_t i, half *p)
{
    ushort *dst = (ushort *)p;
    ushort4 bits = __cvt_4f64_to_4f16_cur(v);
    vstore4(bits, i, dst);
}
#if __OPENCL_C_VERSION__ < 200
/* __global overload, built only when __OPENCL_C_VERSION__ < 200: run v through __cvt_4f64_to_4f16_cur, then vstore4 the result at index i. */
extern __attribute__((pure)) ushort4 __cvt_4f64_to_4f16_cur(double4);
__attribute__((overloadable, always_inline, weak)) void
vstore_half4(double4 v, size_t i, __global half *p)
{
    __global ushort *dst = (__global ushort *)p;
    ushort4 bits = __cvt_4f64_to_4f16_cur(v);
    vstore4(bits, i, dst);
}
#endif
#if __OPENCL_C_VERSION__ < 200
/* __local overload, built only when __OPENCL_C_VERSION__ < 200: run v through __cvt_4f64_to_4f16_cur, then vstore4 the result at index i. */
extern __attribute__((pure)) ushort4 __cvt_4f64_to_4f16_cur(double4);
__attribute__((overloadable, always_inline, weak)) void
vstore_half4(double4 v, size_t i, __local half *p)
{
    __local ushort *dst = (__local ushort *)p;
    ushort4 bits = __cvt_4f64_to_4f16_cur(v);
    vstore4(bits, i, dst);
}
#endif
/* Unqualified half * overload: run v through __cvt_4f64_to_4f16_rte, then vstore4 the result at index i. */
extern __attribute__((pure)) ushort4 __cvt_4f64_to_4f16_rte(double4);
__attribute__((overloadable, always_inline, weak)) void
vstore_half4_rte(double4 v, size_t i, half *p)
{
    ushort *dst = (ushort *)p;
    ushort4 bits = __cvt_4f64_to_4f16_rte(v);
    vstore4(bits, i, dst);
}
#if __OPENCL_C_VERSION__ < 200
/* __global overload, built only when __OPENCL_C_VERSION__ < 200: run v through __cvt_4f64_to_4f16_rte, then vstore4 the result at index i. */
extern __attribute__((pure)) ushort4 __cvt_4f64_to_4f16_rte(double4);
__attribute__((overloadable, always_inline, weak)) void
vstore_half4_rte(double4 v, size_t i, __global half *p)
{
    __global ushort *dst = (__global ushort *)p;
    ushort4 bits = __cvt_4f64_to_4f16_rte(v);
    vstore4(bits, i, dst);
}
#endif
#if __OPENCL_C_VERSION__ < 200
/* __local overload, built only when __OPENCL_C_VERSION__ < 200: run v through __cvt_4f64_to_4f16_rte, then vstore4 the result at index i. */
extern __attribute__((pure)) ushort4 __cvt_4f64_to_4f16_rte(double4);
__attribute__((overloadable, always_inline, weak)) void
vstore_half4_rte(double4 v, size_t i, __local half *p)
{
    __local ushort *dst = (__local ushort *)p;
    ushort4 bits = __cvt_4f64_to_4f16_rte(v);
    vstore4(bits, i, dst);
}
#endif
/* Unqualified half * overload: run v through __cvt_4f64_to_4f16_rtp, then vstore4 the result at index i. */
extern __attribute__((pure)) ushort4 __cvt_4f64_to_4f16_rtp(double4);
__attribute__((overloadable, always_inline, weak)) void
vstore_half4_rtp(double4 v, size_t i, half *p)
{
    ushort *dst = (ushort *)p;
    ushort4 bits = __cvt_4f64_to_4f16_rtp(v);
    vstore4(bits, i, dst);
}
#if __OPENCL_C_VERSION__ < 200
/* __global overload, built only when __OPENCL_C_VERSION__ < 200: run v through __cvt_4f64_to_4f16_rtp, then vstore4 the result at index i. */
extern __attribute__((pure)) ushort4 __cvt_4f64_to_4f16_rtp(double4);
__attribute__((overloadable, always_inline, weak)) void
vstore_half4_rtp(double4 v, size_t i, __global half *p)
{
    __global ushort *dst = (__global ushort *)p;
    ushort4 bits = __cvt_4f64_to_4f16_rtp(v);
    vstore4(bits, i, dst);
}
#endif
#if __OPENCL_C_VERSION__ < 200
/* __local overload, built only when __OPENCL_C_VERSION__ < 200: run v through __cvt_4f64_to_4f16_rtp, then vstore4 the result at index i. */
extern __attribute__((pure)) ushort4 __cvt_4f64_to_4f16_rtp(double4);
__attribute__((overloadable, always_inline, weak)) void
vstore_half4_rtp(double4 v, size_t i, __local half *p)
{
    __local ushort *dst = (__local ushort *)p;
    ushort4 bits = __cvt_4f64_to_4f16_rtp(v);
    vstore4(bits, i, dst);
}
#endif
/* Unqualified half * overload: run v through __cvt_4f64_to_4f16_rtn, then vstore4 the result at index i. */
extern __attribute__((pure)) ushort4 __cvt_4f64_to_4f16_rtn(double4);
__attribute__((overloadable, always_inline, weak)) void
vstore_half4_rtn(double4 v, size_t i, half *p)
{
    ushort *dst = (ushort *)p;
    ushort4 bits = __cvt_4f64_to_4f16_rtn(v);
    vstore4(bits, i, dst);
}
#if __OPENCL_C_VERSION__ < 200
/* __global overload, built only when __OPENCL_C_VERSION__ < 200: run v through __cvt_4f64_to_4f16_rtn, then vstore4 the result at index i. */
extern __attribute__((pure)) ushort4 __cvt_4f64_to_4f16_rtn(double4);
__attribute__((overloadable, always_inline, weak)) void
vstore_half4_rtn(double4 v, size_t i, __global half *p)
{
    __global ushort *dst = (__global ushort *)p;
    ushort4 bits = __cvt_4f64_to_4f16_rtn(v);
    vstore4(bits, i, dst);
}
#endif
#if __OPENCL_C_VERSION__ < 200
/* __local overload, built only when __OPENCL_C_VERSION__ < 200: run v through __cvt_4f64_to_4f16_rtn, then vstore4 the result at index i. */
extern __attribute__((pure)) ushort4 __cvt_4f64_to_4f16_rtn(double4);
__attribute__((overloadable, always_inline, weak)) void
vstore_half4_rtn(double4 v, size_t i, __local half *p)
{
    __local ushort *dst = (__local ushort *)p;
    ushort4 bits = __cvt_4f64_to_4f16_rtn(v);
    vstore4(bits, i, dst);
}
#endif
/* Unqualified half * overload: run v through __cvt_4f64_to_4f16_rtz, then vstore4 the result at index i. */
extern __attribute__((pure)) ushort4 __cvt_4f64_to_4f16_rtz(double4);
__attribute__((overloadable, always_inline, weak)) void
vstore_half4_rtz(double4 v, size_t i, half *p)
{
    ushort *dst = (ushort *)p;
    ushort4 bits = __cvt_4f64_to_4f16_rtz(v);
    vstore4(bits, i, dst);
}
#if __OPENCL_C_VERSION__ < 200
/* __global overload, built only when __OPENCL_C_VERSION__ < 200: run v through __cvt_4f64_to_4f16_rtz, then vstore4 the result at index i. */
extern __attribute__((pure)) ushort4 __cvt_4f64_to_4f16_rtz(double4);
__attribute__((overloadable, always_inline, weak)) void
vstore_half4_rtz(double4 v, size_t i, __global half *p)
{
    __global ushort *dst = (__global ushort *)p;
    ushort4 bits = __cvt_4f64_to_4f16_rtz(v);
    vstore4(bits, i, dst);
}
#endif
#if __OPENCL_C_VERSION__ < 200
/* __local overload, built only when __OPENCL_C_VERSION__ < 200: run v through __cvt_4f64_to_4f16_rtz, then vstore4 the result at index i. */
extern __attribute__((pure)) ushort4 __cvt_4f64_to_4f16_rtz(double4);
__attribute__((overloadable, always_inline, weak)) void
vstore_half4_rtz(double4 v, size_t i, __local half *p)
{
    __local ushort *dst = (__local ushort *)p;
    ushort4 bits = __cvt_4f64_to_4f16_rtz(v);
    vstore4(bits, i, dst);
}
#endif
/* Unqualified half * overload: run v through __cvt_8f64_to_8f16_cur, then vstore8 the result at index i. */
extern __attribute__((pure)) ushort8 __cvt_8f64_to_8f16_cur(double8);
__attribute__((overloadable, always_inline, weak)) void
vstore_half8(double8 v, size_t i, half *p)
{
    ushort *dst = (ushort *)p;
    ushort8 bits = __cvt_8f64_to_8f16_cur(v);
    vstore8(bits, i, dst);
}
#if __OPENCL_C_VERSION__ < 200
/* __global overload, built only when __OPENCL_C_VERSION__ < 200: run v through __cvt_8f64_to_8f16_cur, then vstore8 the result at index i. */
extern __attribute__((pure)) ushort8 __cvt_8f64_to_8f16_cur(double8);
__attribute__((overloadable, always_inline, weak)) void
vstore_half8(double8 v, size_t i, __global half *p)
{
    __global ushort *dst = (__global ushort *)p;
    ushort8 bits = __cvt_8f64_to_8f16_cur(v);
    vstore8(bits, i, dst);
}
#endif
#if __OPENCL_C_VERSION__ < 200
/* __local overload, built only when __OPENCL_C_VERSION__ < 200: run v through __cvt_8f64_to_8f16_cur, then vstore8 the result at index i. */
extern __attribute__((pure)) ushort8 __cvt_8f64_to_8f16_cur(double8);
__attribute__((overloadable, always_inline, weak)) void
vstore_half8(double8 v, size_t i, __local half *p)
{
    __local ushort *dst = (__local ushort *)p;
    ushort8 bits = __cvt_8f64_to_8f16_cur(v);
    vstore8(bits, i, dst);
}
#endif
/* Unqualified half * overload: run v through __cvt_8f64_to_8f16_rte, then vstore8 the result at index i. */
extern __attribute__((pure)) ushort8 __cvt_8f64_to_8f16_rte(double8);
__attribute__((overloadable, always_inline, weak)) void
vstore_half8_rte(double8 v, size_t i, half *p)
{
    ushort *dst = (ushort *)p;
    ushort8 bits = __cvt_8f64_to_8f16_rte(v);
    vstore8(bits, i, dst);
}
#if __OPENCL_C_VERSION__ < 200
/* __global overload, built only when __OPENCL_C_VERSION__ < 200: run v through __cvt_8f64_to_8f16_rte, then vstore8 the result at index i. */
extern __attribute__((pure)) ushort8 __cvt_8f64_to_8f16_rte(double8);
__attribute__((overloadable, always_inline, weak)) void
vstore_half8_rte(double8 v, size_t i, __global half *p)
{
    __global ushort *dst = (__global ushort *)p;
    ushort8 bits = __cvt_8f64_to_8f16_rte(v);
    vstore8(bits, i, dst);
}
#endif
#if __OPENCL_C_VERSION__ < 200
/* __local overload, built only when __OPENCL_C_VERSION__ < 200: run v through __cvt_8f64_to_8f16_rte, then vstore8 the result at index i. */
extern __attribute__((pure)) ushort8 __cvt_8f64_to_8f16_rte(double8);
__attribute__((overloadable, always_inline, weak)) void
vstore_half8_rte(double8 v, size_t i, __local half *p)
{
    __local ushort *dst = (__local ushort *)p;
    ushort8 bits = __cvt_8f64_to_8f16_rte(v);
    vstore8(bits, i, dst);
}
#endif
/* Unqualified half * overload: run v through __cvt_8f64_to_8f16_rtp, then vstore8 the result at index i. */
extern __attribute__((pure)) ushort8 __cvt_8f64_to_8f16_rtp(double8);
__attribute__((overloadable, always_inline, weak)) void
vstore_half8_rtp(double8 v, size_t i, half *p)
{
    ushort *dst = (ushort *)p;
    ushort8 bits = __cvt_8f64_to_8f16_rtp(v);
    vstore8(bits, i, dst);
}
#if __OPENCL_C_VERSION__ < 200
/* __global overload, built only when __OPENCL_C_VERSION__ < 200: run v through __cvt_8f64_to_8f16_rtp, then vstore8 the result at index i. */
extern __attribute__((pure)) ushort8 __cvt_8f64_to_8f16_rtp(double8);
__attribute__((overloadable, always_inline, weak)) void
vstore_half8_rtp(double8 v, size_t i, __global half *p)
{
    __global ushort *dst = (__global ushort *)p;
    ushort8 bits = __cvt_8f64_to_8f16_rtp(v);
    vstore8(bits, i, dst);
}
#endif
#if __OPENCL_C_VERSION__ < 200
/* __local overload, built only when __OPENCL_C_VERSION__ < 200: run v through __cvt_8f64_to_8f16_rtp, then vstore8 the result at index i. */
extern __attribute__((pure)) ushort8 __cvt_8f64_to_8f16_rtp(double8);
__attribute__((overloadable, always_inline, weak)) void
vstore_half8_rtp(double8 v, size_t i, __local half *p)
{
    __local ushort *dst = (__local ushort *)p;
    ushort8 bits = __cvt_8f64_to_8f16_rtp(v);
    vstore8(bits, i, dst);
}
#endif
/* Unqualified half * overload: run v through __cvt_8f64_to_8f16_rtn, then vstore8 the result at index i. */
extern __attribute__((pure)) ushort8 __cvt_8f64_to_8f16_rtn(double8);
__attribute__((overloadable, always_inline, weak)) void
vstore_half8_rtn(double8 v, size_t i, half *p)
{
    ushort *dst = (ushort *)p;
    ushort8 bits = __cvt_8f64_to_8f16_rtn(v);
    vstore8(bits, i, dst);
}
#if __OPENCL_C_VERSION__ < 200
/* __global overload, built only when __OPENCL_C_VERSION__ < 200: run v through __cvt_8f64_to_8f16_rtn, then vstore8 the result at index i. */
extern __attribute__((pure)) ushort8 __cvt_8f64_to_8f16_rtn(double8);
__attribute__((overloadable, always_inline, weak)) void
vstore_half8_rtn(double8 v, size_t i, __global half *p)
{
    __global ushort *dst = (__global ushort *)p;
    ushort8 bits = __cvt_8f64_to_8f16_rtn(v);
    vstore8(bits, i, dst);
}
#endif
#if __OPENCL_C_VERSION__ < 200
/* __local overload, built only when __OPENCL_C_VERSION__ < 200: run v through __cvt_8f64_to_8f16_rtn, then vstore8 the result at index i. */
extern __attribute__((pure)) ushort8 __cvt_8f64_to_8f16_rtn(double8);
__attribute__((overloadable, always_inline, weak)) void
vstore_half8_rtn(double8 v, size_t i, __local half *p)
{
    __local ushort *dst = (__local ushort *)p;
    ushort8 bits = __cvt_8f64_to_8f16_rtn(v);
    vstore8(bits, i, dst);
}
#endif
/* Unqualified half * overload: run v through __cvt_8f64_to_8f16_rtz, then vstore8 the result at index i. */
extern __attribute__((pure)) ushort8 __cvt_8f64_to_8f16_rtz(double8);
__attribute__((overloadable, always_inline, weak)) void
vstore_half8_rtz(double8 v, size_t i, half *p)
{
    ushort *dst = (ushort *)p;
    ushort8 bits = __cvt_8f64_to_8f16_rtz(v);
    vstore8(bits, i, dst);
}
#if __OPENCL_C_VERSION__ < 200
/* __global overload, built only when __OPENCL_C_VERSION__ < 200: run v through __cvt_8f64_to_8f16_rtz, then vstore8 the result at index i. */
extern __attribute__((pure)) ushort8 __cvt_8f64_to_8f16_rtz(double8);
__attribute__((overloadable, always_inline, weak)) void
vstore_half8_rtz(double8 v, size_t i, __global half *p)
{
    __global ushort *dst = (__global ushort *)p;
    ushort8 bits = __cvt_8f64_to_8f16_rtz(v);
    vstore8(bits, i, dst);
}
#endif
#if __OPENCL_C_VERSION__ < 200
/* __local overload, built only when __OPENCL_C_VERSION__ < 200: run v through __cvt_8f64_to_8f16_rtz, then vstore8 the result at index i. */
extern __attribute__((pure)) ushort8 __cvt_8f64_to_8f16_rtz(double8);
__attribute__((overloadable, always_inline, weak)) void
vstore_half8_rtz(double8 v, size_t i, __local half *p)
{
    __local ushort *dst = (__local ushort *)p;
    ushort8 bits = __cvt_8f64_to_8f16_rtz(v);
    vstore8(bits, i, dst);
}
#endif
/* Unqualified half * overload: run v through __cvt_16f64_to_16f16_cur, then vstore16 the result at index i. */
extern __attribute__((pure)) ushort16 __cvt_16f64_to_16f16_cur(double16);
__attribute__((overloadable, always_inline, weak)) void
vstore_half16(double16 v, size_t i, half *p)
{
    ushort *dst = (ushort *)p;
    ushort16 bits = __cvt_16f64_to_16f16_cur(v);
    vstore16(bits, i, dst);
}
#if __OPENCL_C_VERSION__ < 200
/* __global overload, built only when __OPENCL_C_VERSION__ < 200: run v through __cvt_16f64_to_16f16_cur, then vstore16 the result at index i. */
extern __attribute__((pure)) ushort16 __cvt_16f64_to_16f16_cur(double16);
__attribute__((overloadable, always_inline, weak)) void
vstore_half16(double16 v, size_t i, __global half *p)
{
    __global ushort *dst = (__global ushort *)p;
    ushort16 bits = __cvt_16f64_to_16f16_cur(v);
    vstore16(bits, i, dst);
}
#endif
#if __OPENCL_C_VERSION__ < 200
/* __local overload, built only when __OPENCL_C_VERSION__ < 200: run v through __cvt_16f64_to_16f16_cur, then vstore16 the result at index i. */
extern __attribute__((pure)) ushort16 __cvt_16f64_to_16f16_cur(double16);
__attribute__((overloadable, always_inline, weak)) void
vstore_half16(double16 v, size_t i, __local half *p)
{
    __local ushort *dst = (__local ushort *)p;
    ushort16 bits = __cvt_16f64_to_16f16_cur(v);
    vstore16(bits, i, dst);
}
#endif
/* Unqualified half * overload: run v through __cvt_16f64_to_16f16_rte, then vstore16 the result at index i. */
extern __attribute__((pure)) ushort16 __cvt_16f64_to_16f16_rte(double16);
__attribute__((overloadable, always_inline, weak)) void
vstore_half16_rte(double16 v, size_t i, half *p)
{
    ushort *dst = (ushort *)p;
    ushort16 bits = __cvt_16f64_to_16f16_rte(v);
    vstore16(bits, i, dst);
}
#if __OPENCL_C_VERSION__ < 200
extern __attribute__((pure)) ushort16 __cvt_16f64_to_16f16_rte(double16);
/* __global variant, compiled only when __OPENCL_C_VERSION__ < 200: convert v via __cvt_16f64_to_16f16_rte, then vstore16 the result at index i through p. */
__attribute__((overloadable, always_inline, weak)) void
vstore_half16_rte(double16 v, size_t i, __global half *p)
{
    ushort16 bits = __cvt_16f64_to_16f16_rte(v);
    vstore16(bits, i, (__global ushort *)p);
}
#endif
#if __OPENCL_C_VERSION__ < 200
extern __attribute__((pure)) ushort16 __cvt_16f64_to_16f16_rte(double16);
/* __local variant, compiled only when __OPENCL_C_VERSION__ < 200: convert v via __cvt_16f64_to_16f16_rte, then vstore16 the result at index i through p. */
__attribute__((overloadable, always_inline, weak)) void
vstore_half16_rte(double16 v, size_t i, __local half *p)
{
    ushort16 bits = __cvt_16f64_to_16f16_rte(v);
    vstore16(bits, i, (__local ushort *)p);
}
#endif
extern __attribute__((pure)) ushort16 __cvt_16f64_to_16f16_rtp(double16);
/* Convert v via __cvt_16f64_to_16f16_rtp, then vstore16 the ushort16 result at index i through p. */
__attribute__((overloadable, always_inline, weak)) void
vstore_half16_rtp(double16 v, size_t i, half *p)
{
    ushort16 bits = __cvt_16f64_to_16f16_rtp(v);
    vstore16(bits, i, (ushort *)p);
}
#if __OPENCL_C_VERSION__ < 200
extern __attribute__((pure)) ushort16 __cvt_16f64_to_16f16_rtp(double16);
/* __global variant, compiled only when __OPENCL_C_VERSION__ < 200: convert v via __cvt_16f64_to_16f16_rtp, then vstore16 the result at index i through p. */
__attribute__((overloadable, always_inline, weak)) void
vstore_half16_rtp(double16 v, size_t i, __global half *p)
{
    ushort16 bits = __cvt_16f64_to_16f16_rtp(v);
    vstore16(bits, i, (__global ushort *)p);
}
#endif
#if __OPENCL_C_VERSION__ < 200
extern __attribute__((pure)) ushort16 __cvt_16f64_to_16f16_rtp(double16);
/* __local variant, compiled only when __OPENCL_C_VERSION__ < 200: convert v via __cvt_16f64_to_16f16_rtp, then vstore16 the result at index i through p. */
__attribute__((overloadable, always_inline, weak)) void
vstore_half16_rtp(double16 v, size_t i, __local half *p)
{
    ushort16 bits = __cvt_16f64_to_16f16_rtp(v);
    vstore16(bits, i, (__local ushort *)p);
}
#endif
extern __attribute__((pure)) ushort16 __cvt_16f64_to_16f16_rtn(double16);
/* Convert v via __cvt_16f64_to_16f16_rtn, then vstore16 the ushort16 result at index i through p. */
__attribute__((overloadable, always_inline, weak)) void
vstore_half16_rtn(double16 v, size_t i, half *p)
{
    ushort16 bits = __cvt_16f64_to_16f16_rtn(v);
    vstore16(bits, i, (ushort *)p);
}
#if __OPENCL_C_VERSION__ < 200
extern __attribute__((pure)) ushort16 __cvt_16f64_to_16f16_rtn(double16);
/* __global variant, compiled only when __OPENCL_C_VERSION__ < 200: convert v via __cvt_16f64_to_16f16_rtn, then vstore16 the result at index i through p. */
__attribute__((overloadable, always_inline, weak)) void
vstore_half16_rtn(double16 v, size_t i, __global half *p)
{
    ushort16 bits = __cvt_16f64_to_16f16_rtn(v);
    vstore16(bits, i, (__global ushort *)p);
}
#endif
#if __OPENCL_C_VERSION__ < 200
extern __attribute__((pure)) ushort16 __cvt_16f64_to_16f16_rtn(double16);
/* __local variant, compiled only when __OPENCL_C_VERSION__ < 200: convert v via __cvt_16f64_to_16f16_rtn, then vstore16 the result at index i through p. */
__attribute__((overloadable, always_inline, weak)) void
vstore_half16_rtn(double16 v, size_t i, __local half *p)
{
    ushort16 bits = __cvt_16f64_to_16f16_rtn(v);
    vstore16(bits, i, (__local ushort *)p);
}
#endif
extern __attribute__((pure)) ushort16 __cvt_16f64_to_16f16_rtz(double16);
/* Convert v via __cvt_16f64_to_16f16_rtz, then vstore16 the ushort16 result at index i through p. */
__attribute__((overloadable, always_inline, weak)) void
vstore_half16_rtz(double16 v, size_t i, half *p)
{
    ushort16 bits = __cvt_16f64_to_16f16_rtz(v);
    vstore16(bits, i, (ushort *)p);
}
#if __OPENCL_C_VERSION__ < 200
extern __attribute__((pure)) ushort16 __cvt_16f64_to_16f16_rtz(double16);
/* __global variant, compiled only when __OPENCL_C_VERSION__ < 200: convert v via __cvt_16f64_to_16f16_rtz, then vstore16 the result at index i through p. */
__attribute__((overloadable, always_inline, weak)) void
vstore_half16_rtz(double16 v, size_t i, __global half *p)
{
    ushort16 bits = __cvt_16f64_to_16f16_rtz(v);
    vstore16(bits, i, (__global ushort *)p);
}
#endif
#if __OPENCL_C_VERSION__ < 200
extern __attribute__((pure)) ushort16 __cvt_16f64_to_16f16_rtz(double16);
/* __local variant, compiled only when __OPENCL_C_VERSION__ < 200: convert v via __cvt_16f64_to_16f16_rtz, then vstore16 the result at index i through p. */
__attribute__((overloadable, always_inline, weak)) void
vstore_half16_rtz(double16 v, size_t i, __local half *p)
{
    ushort16 bits = __cvt_16f64_to_16f16_rtz(v);
    vstore16(bits, i, (__local ushort *)p);
}
#endif
extern __attribute__((pure)) ushort2 __cvt_2f32_to_2f16_cur(float2);
/* Convert v via __cvt_2f32_to_2f16_cur and write the ushort2 result at p + i * 2. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half2(float2 v, size_t i, half *p)
{
    ushort2 *dst = (ushort2 *)(p + i * 2);
    *dst = __cvt_2f32_to_2f16_cur(v);
}
#if __OPENCL_C_VERSION__ < 200
extern __attribute__((pure)) ushort2 __cvt_2f32_to_2f16_cur(float2);
/* __global variant, compiled only when __OPENCL_C_VERSION__ < 200: convert v via __cvt_2f32_to_2f16_cur and write the result at p + i * 2. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half2(float2 v, size_t i, __global half *p)
{
    __global ushort2 *dst = (__global ushort2 *)(p + i * 2);
    *dst = __cvt_2f32_to_2f16_cur(v);
}
#endif
#if __OPENCL_C_VERSION__ < 200
extern __attribute__((pure)) ushort2 __cvt_2f32_to_2f16_cur(float2);
/* __local variant, compiled only when __OPENCL_C_VERSION__ < 200: convert v via __cvt_2f32_to_2f16_cur and write the result at p + i * 2. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half2(float2 v, size_t i, __local half *p)
{
    __local ushort2 *dst = (__local ushort2 *)(p + i * 2);
    *dst = __cvt_2f32_to_2f16_cur(v);
}
#endif
extern __attribute__((pure)) ushort2 __cvt_2f32_to_2f16_rte(float2);
/* Convert v via __cvt_2f32_to_2f16_rte and write the ushort2 result at p + i * 2. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half2_rte(float2 v, size_t i, half *p)
{
    ushort2 *dst = (ushort2 *)(p + i * 2);
    *dst = __cvt_2f32_to_2f16_rte(v);
}
#if __OPENCL_C_VERSION__ < 200
extern __attribute__((pure)) ushort2 __cvt_2f32_to_2f16_rte(float2);
/* __global variant, compiled only when __OPENCL_C_VERSION__ < 200: convert v via __cvt_2f32_to_2f16_rte and write the result at p + i * 2. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half2_rte(float2 v, size_t i, __global half *p)
{
    __global ushort2 *dst = (__global ushort2 *)(p + i * 2);
    *dst = __cvt_2f32_to_2f16_rte(v);
}
#endif
#if __OPENCL_C_VERSION__ < 200
extern __attribute__((pure)) ushort2 __cvt_2f32_to_2f16_rte(float2);
/* __local variant, compiled only when __OPENCL_C_VERSION__ < 200: convert v via __cvt_2f32_to_2f16_rte and write the result at p + i * 2. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half2_rte(float2 v, size_t i, __local half *p)
{
    __local ushort2 *dst = (__local ushort2 *)(p + i * 2);
    *dst = __cvt_2f32_to_2f16_rte(v);
}
#endif
extern __attribute__((pure)) ushort2 __cvt_2f32_to_2f16_rtp(float2);
/* Convert v via __cvt_2f32_to_2f16_rtp and write the ushort2 result at p + i * 2. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half2_rtp(float2 v, size_t i, half *p)
{
    ushort2 *dst = (ushort2 *)(p + i * 2);
    *dst = __cvt_2f32_to_2f16_rtp(v);
}
#if __OPENCL_C_VERSION__ < 200
extern __attribute__((pure)) ushort2 __cvt_2f32_to_2f16_rtp(float2);
/* __global variant, compiled only when __OPENCL_C_VERSION__ < 200: convert v via __cvt_2f32_to_2f16_rtp and write the result at p + i * 2. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half2_rtp(float2 v, size_t i, __global half *p)
{
    __global ushort2 *dst = (__global ushort2 *)(p + i * 2);
    *dst = __cvt_2f32_to_2f16_rtp(v);
}
#endif
#if __OPENCL_C_VERSION__ < 200
extern __attribute__((pure)) ushort2 __cvt_2f32_to_2f16_rtp(float2);
/* __local variant, compiled only when __OPENCL_C_VERSION__ < 200: convert v via __cvt_2f32_to_2f16_rtp and write the result at p + i * 2. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half2_rtp(float2 v, size_t i, __local half *p)
{
    __local ushort2 *dst = (__local ushort2 *)(p + i * 2);
    *dst = __cvt_2f32_to_2f16_rtp(v);
}
#endif
extern __attribute__((pure)) ushort2 __cvt_2f32_to_2f16_rtn(float2);
/* Convert v via __cvt_2f32_to_2f16_rtn and write the ushort2 result at p + i * 2. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half2_rtn(float2 v, size_t i, half *p)
{
    ushort2 *dst = (ushort2 *)(p + i * 2);
    *dst = __cvt_2f32_to_2f16_rtn(v);
}
#if __OPENCL_C_VERSION__ < 200
extern __attribute__((pure)) ushort2 __cvt_2f32_to_2f16_rtn(float2);
/* __global variant, compiled only when __OPENCL_C_VERSION__ < 200: convert v via __cvt_2f32_to_2f16_rtn and write the result at p + i * 2. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half2_rtn(float2 v, size_t i, __global half *p)
{
    __global ushort2 *dst = (__global ushort2 *)(p + i * 2);
    *dst = __cvt_2f32_to_2f16_rtn(v);
}
#endif
#if __OPENCL_C_VERSION__ < 200
extern __attribute__((pure)) ushort2 __cvt_2f32_to_2f16_rtn(float2);
/* __local variant, compiled only when __OPENCL_C_VERSION__ < 200: convert v via __cvt_2f32_to_2f16_rtn and write the result at p + i * 2. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half2_rtn(float2 v, size_t i, __local half *p)
{
    __local ushort2 *dst = (__local ushort2 *)(p + i * 2);
    *dst = __cvt_2f32_to_2f16_rtn(v);
}
#endif
extern __attribute__((pure)) ushort2 __cvt_2f32_to_2f16_rtz(float2);
/* Convert v via __cvt_2f32_to_2f16_rtz and write the ushort2 result at p + i * 2. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half2_rtz(float2 v, size_t i, half *p)
{
    ushort2 *dst = (ushort2 *)(p + i * 2);
    *dst = __cvt_2f32_to_2f16_rtz(v);
}
#if __OPENCL_C_VERSION__ < 200
extern __attribute__((pure)) ushort2 __cvt_2f32_to_2f16_rtz(float2);
/* __global variant, compiled only when __OPENCL_C_VERSION__ < 200: convert v via __cvt_2f32_to_2f16_rtz and write the result at p + i * 2. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half2_rtz(float2 v, size_t i, __global half *p)
{
    __global ushort2 *dst = (__global ushort2 *)(p + i * 2);
    *dst = __cvt_2f32_to_2f16_rtz(v);
}
#endif
#if __OPENCL_C_VERSION__ < 200
extern __attribute__((pure)) ushort2 __cvt_2f32_to_2f16_rtz(float2);
/* __local variant, compiled only when __OPENCL_C_VERSION__ < 200: convert v via __cvt_2f32_to_2f16_rtz and write the result at p + i * 2. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half2_rtz(float2 v, size_t i, __local half *p)
{
    __local ushort2 *dst = (__local ushort2 *)(p + i * 2);
    *dst = __cvt_2f32_to_2f16_rtz(v);
}
#endif
extern __attribute__((pure)) ushort3 __cvt_3f32_to_3f16_cur(float3);
/* Convert v via __cvt_3f32_to_3f16_cur into lanes 0-2 of a ushort4 and store all four lanes at p + i * 4; lane 3 is never assigned. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half3(float3 v, size_t i, half *p)
{
    ushort4 packed;
    packed.s012 = __cvt_3f32_to_3f16_cur(v);
    ushort4 *dst = (ushort4 *)(p + i * 4);
    *dst = packed;
}
#if __OPENCL_C_VERSION__ < 200
extern __attribute__((pure)) ushort3 __cvt_3f32_to_3f16_cur(float3);
/* __global variant, compiled only when __OPENCL_C_VERSION__ < 200: convert v via __cvt_3f32_to_3f16_cur into lanes 0-2 of a ushort4 and store all four lanes at p + i * 4; lane 3 is never assigned. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half3(float3 v, size_t i, __global half *p)
{
    ushort4 packed;
    packed.s012 = __cvt_3f32_to_3f16_cur(v);
    __global ushort4 *dst = (__global ushort4 *)(p + i * 4);
    *dst = packed;
}
#endif
#if __OPENCL_C_VERSION__ < 200
extern __attribute__((pure)) ushort3 __cvt_3f32_to_3f16_cur(float3);
/* __local variant, compiled only when __OPENCL_C_VERSION__ < 200: convert v via __cvt_3f32_to_3f16_cur into lanes 0-2 of a ushort4 and store all four lanes at p + i * 4; lane 3 is never assigned. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half3(float3 v, size_t i, __local half *p)
{
    ushort4 packed;
    packed.s012 = __cvt_3f32_to_3f16_cur(v);
    __local ushort4 *dst = (__local ushort4 *)(p + i * 4);
    *dst = packed;
}
#endif
extern __attribute__((pure)) ushort3 __cvt_3f32_to_3f16_rte(float3);
/* Convert v via __cvt_3f32_to_3f16_rte into lanes 0-2 of a ushort4 and store all four lanes at p + i * 4; lane 3 is never assigned. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half3_rte(float3 v, size_t i, half *p)
{
    ushort4 packed;
    packed.s012 = __cvt_3f32_to_3f16_rte(v);
    ushort4 *dst = (ushort4 *)(p + i * 4);
    *dst = packed;
}
#if __OPENCL_C_VERSION__ < 200
extern __attribute__((pure)) ushort3 __cvt_3f32_to_3f16_rte(float3);
/* __global variant, compiled only when __OPENCL_C_VERSION__ < 200: convert v via __cvt_3f32_to_3f16_rte into lanes 0-2 of a ushort4 and store all four lanes at p + i * 4; lane 3 is never assigned. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half3_rte(float3 v, size_t i, __global half *p)
{
    ushort4 packed;
    packed.s012 = __cvt_3f32_to_3f16_rte(v);
    __global ushort4 *dst = (__global ushort4 *)(p + i * 4);
    *dst = packed;
}
#endif
#if __OPENCL_C_VERSION__ < 200
extern __attribute__((pure)) ushort3 __cvt_3f32_to_3f16_rte(float3);
/* __local variant, compiled only when __OPENCL_C_VERSION__ < 200: convert v via __cvt_3f32_to_3f16_rte into lanes 0-2 of a ushort4 and store all four lanes at p + i * 4; lane 3 is never assigned. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half3_rte(float3 v, size_t i, __local half *p)
{
    ushort4 packed;
    packed.s012 = __cvt_3f32_to_3f16_rte(v);
    __local ushort4 *dst = (__local ushort4 *)(p + i * 4);
    *dst = packed;
}
#endif
extern __attribute__((pure)) ushort3 __cvt_3f32_to_3f16_rtp(float3);
/* Convert v via __cvt_3f32_to_3f16_rtp into lanes 0-2 of a ushort4 and store all four lanes at p + i * 4; lane 3 is never assigned. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half3_rtp(float3 v, size_t i, half *p)
{
    ushort4 packed;
    packed.s012 = __cvt_3f32_to_3f16_rtp(v);
    ushort4 *dst = (ushort4 *)(p + i * 4);
    *dst = packed;
}
#if __OPENCL_C_VERSION__ < 200
extern __attribute__((pure)) ushort3 __cvt_3f32_to_3f16_rtp(float3);
/* __global variant, compiled only when __OPENCL_C_VERSION__ < 200: convert v via __cvt_3f32_to_3f16_rtp into lanes 0-2 of a ushort4 and store all four lanes at p + i * 4; lane 3 is never assigned. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half3_rtp(float3 v, size_t i, __global half *p)
{
    ushort4 packed;
    packed.s012 = __cvt_3f32_to_3f16_rtp(v);
    __global ushort4 *dst = (__global ushort4 *)(p + i * 4);
    *dst = packed;
}
#endif
#if __OPENCL_C_VERSION__ < 200
extern __attribute__((pure)) ushort3 __cvt_3f32_to_3f16_rtp(float3);
/* __local variant, compiled only when __OPENCL_C_VERSION__ < 200: convert v via __cvt_3f32_to_3f16_rtp into lanes 0-2 of a ushort4 and store all four lanes at p + i * 4; lane 3 is never assigned. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half3_rtp(float3 v, size_t i, __local half *p)
{
    ushort4 packed;
    packed.s012 = __cvt_3f32_to_3f16_rtp(v);
    __local ushort4 *dst = (__local ushort4 *)(p + i * 4);
    *dst = packed;
}
#endif
extern __attribute__((pure)) ushort3 __cvt_3f32_to_3f16_rtn(float3);
/* Convert v via __cvt_3f32_to_3f16_rtn into lanes 0-2 of a ushort4 and store all four lanes at p + i * 4; lane 3 is never assigned. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half3_rtn(float3 v, size_t i, half *p)
{
    ushort4 packed;
    packed.s012 = __cvt_3f32_to_3f16_rtn(v);
    ushort4 *dst = (ushort4 *)(p + i * 4);
    *dst = packed;
}
#if __OPENCL_C_VERSION__ < 200
extern __attribute__((pure)) ushort3 __cvt_3f32_to_3f16_rtn(float3);
/* __global variant, compiled only when __OPENCL_C_VERSION__ < 200: convert v via __cvt_3f32_to_3f16_rtn into lanes 0-2 of a ushort4 and store all four lanes at p + i * 4; lane 3 is never assigned. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half3_rtn(float3 v, size_t i, __global half *p)
{
    ushort4 packed;
    packed.s012 = __cvt_3f32_to_3f16_rtn(v);
    __global ushort4 *dst = (__global ushort4 *)(p + i * 4);
    *dst = packed;
}
#endif
#if __OPENCL_C_VERSION__ < 200
extern __attribute__((pure)) ushort3 __cvt_3f32_to_3f16_rtn(float3);
/* __local variant, compiled only when __OPENCL_C_VERSION__ < 200: convert v via __cvt_3f32_to_3f16_rtn into lanes 0-2 of a ushort4 and store all four lanes at p + i * 4; lane 3 is never assigned. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half3_rtn(float3 v, size_t i, __local half *p)
{
    ushort4 packed;
    packed.s012 = __cvt_3f32_to_3f16_rtn(v);
    __local ushort4 *dst = (__local ushort4 *)(p + i * 4);
    *dst = packed;
}
#endif
extern __attribute__((pure)) ushort3 __cvt_3f32_to_3f16_rtz(float3);
/* Convert v via __cvt_3f32_to_3f16_rtz into lanes 0-2 of a ushort4 and store all four lanes at p + i * 4; lane 3 is never assigned. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half3_rtz(float3 v, size_t i, half *p)
{
    ushort4 packed;
    packed.s012 = __cvt_3f32_to_3f16_rtz(v);
    ushort4 *dst = (ushort4 *)(p + i * 4);
    *dst = packed;
}
#if __OPENCL_C_VERSION__ < 200
extern __attribute__((pure)) ushort3 __cvt_3f32_to_3f16_rtz(float3);
/* __global variant, compiled only when __OPENCL_C_VERSION__ < 200: convert v via __cvt_3f32_to_3f16_rtz into lanes 0-2 of a ushort4 and store all four lanes at p + i * 4; lane 3 is never assigned. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half3_rtz(float3 v, size_t i, __global half *p)
{
    ushort4 packed;
    packed.s012 = __cvt_3f32_to_3f16_rtz(v);
    __global ushort4 *dst = (__global ushort4 *)(p + i * 4);
    *dst = packed;
}
#endif
#if __OPENCL_C_VERSION__ < 200
extern __attribute__((pure)) ushort3 __cvt_3f32_to_3f16_rtz(float3);
/* __local variant, compiled only when __OPENCL_C_VERSION__ < 200: convert v via __cvt_3f32_to_3f16_rtz into lanes 0-2 of a ushort4 and store all four lanes at p + i * 4; lane 3 is never assigned. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half3_rtz(float3 v, size_t i, __local half *p)
{
    ushort4 packed;
    packed.s012 = __cvt_3f32_to_3f16_rtz(v);
    __local ushort4 *dst = (__local ushort4 *)(p + i * 4);
    *dst = packed;
}
#endif
extern __attribute__((pure)) ushort4 __cvt_4f32_to_4f16_cur(float4);
/* Convert v via __cvt_4f32_to_4f16_cur and write the ushort4 result at p + i * 4. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half4(float4 v, size_t i, half *p)
{
    ushort4 *dst = (ushort4 *)(p + i * 4);
    *dst = __cvt_4f32_to_4f16_cur(v);
}
#if __OPENCL_C_VERSION__ < 200
extern __attribute__((pure)) ushort4 __cvt_4f32_to_4f16_cur(float4);
/* __global variant, compiled only when __OPENCL_C_VERSION__ < 200: convert v via __cvt_4f32_to_4f16_cur and write the result at p + i * 4. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half4(float4 v, size_t i, __global half *p)
{
    __global ushort4 *dst = (__global ushort4 *)(p + i * 4);
    *dst = __cvt_4f32_to_4f16_cur(v);
}
#endif
#if __OPENCL_C_VERSION__ < 200
extern __attribute__((pure)) ushort4 __cvt_4f32_to_4f16_cur(float4);
/* __local variant, compiled only when __OPENCL_C_VERSION__ < 200: convert v via __cvt_4f32_to_4f16_cur and write the result at p + i * 4. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half4(float4 v, size_t i, __local half *p)
{
    __local ushort4 *dst = (__local ushort4 *)(p + i * 4);
    *dst = __cvt_4f32_to_4f16_cur(v);
}
#endif
extern __attribute__((pure)) ushort4 __cvt_4f32_to_4f16_rte(float4);
/* Convert v via __cvt_4f32_to_4f16_rte and write the ushort4 result at p + i * 4. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half4_rte(float4 v, size_t i, half *p)
{
    ushort4 *dst = (ushort4 *)(p + i * 4);
    *dst = __cvt_4f32_to_4f16_rte(v);
}
#if __OPENCL_C_VERSION__ < 200
extern __attribute__((pure)) ushort4 __cvt_4f32_to_4f16_rte(float4);
/* __global variant, compiled only when __OPENCL_C_VERSION__ < 200: convert v via __cvt_4f32_to_4f16_rte and write the result at p + i * 4. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half4_rte(float4 v, size_t i, __global half *p)
{
    __global ushort4 *dst = (__global ushort4 *)(p + i * 4);
    *dst = __cvt_4f32_to_4f16_rte(v);
}
#endif
#if __OPENCL_C_VERSION__ < 200
extern __attribute__((pure)) ushort4 __cvt_4f32_to_4f16_rte(float4);
/* __local variant, compiled only when __OPENCL_C_VERSION__ < 200: convert v via __cvt_4f32_to_4f16_rte and write the result at p + i * 4. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half4_rte(float4 v, size_t i, __local half *p)
{
    __local ushort4 *dst = (__local ushort4 *)(p + i * 4);
    *dst = __cvt_4f32_to_4f16_rte(v);
}
#endif
extern __attribute__((pure)) ushort4 __cvt_4f32_to_4f16_rtp(float4);
/* Convert v via __cvt_4f32_to_4f16_rtp and write the ushort4 result at p + i * 4. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half4_rtp(float4 v, size_t i, half *p)
{
    ushort4 *dst = (ushort4 *)(p + i * 4);
    *dst = __cvt_4f32_to_4f16_rtp(v);
}
#if __OPENCL_C_VERSION__ < 200
extern __attribute__((pure)) ushort4 __cvt_4f32_to_4f16_rtp(float4);
/* __global variant, compiled only when __OPENCL_C_VERSION__ < 200: convert v via __cvt_4f32_to_4f16_rtp and write the result at p + i * 4. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half4_rtp(float4 v, size_t i, __global half *p)
{
    __global ushort4 *dst = (__global ushort4 *)(p + i * 4);
    *dst = __cvt_4f32_to_4f16_rtp(v);
}
#endif
#if __OPENCL_C_VERSION__ < 200
extern __attribute__((pure)) ushort4 __cvt_4f32_to_4f16_rtp(float4);
/* __local variant, compiled only when __OPENCL_C_VERSION__ < 200: convert v via __cvt_4f32_to_4f16_rtp and write the result at p + i * 4. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half4_rtp(float4 v, size_t i, __local half *p)
{
    __local ushort4 *dst = (__local ushort4 *)(p + i * 4);
    *dst = __cvt_4f32_to_4f16_rtp(v);
}
#endif
extern __attribute__((pure)) ushort4 __cvt_4f32_to_4f16_rtn(float4);
/* Convert v via __cvt_4f32_to_4f16_rtn and write the ushort4 result at p + i * 4. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half4_rtn(float4 v, size_t i, half *p)
{
    ushort4 *dst = (ushort4 *)(p + i * 4);
    *dst = __cvt_4f32_to_4f16_rtn(v);
}
#if __OPENCL_C_VERSION__ < 200
extern __attribute__((pure)) ushort4 __cvt_4f32_to_4f16_rtn(float4);
/* __global variant, compiled only when __OPENCL_C_VERSION__ < 200: convert v via __cvt_4f32_to_4f16_rtn and write the result at p + i * 4. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half4_rtn(float4 v, size_t i, __global half *p)
{
    __global ushort4 *dst = (__global ushort4 *)(p + i * 4);
    *dst = __cvt_4f32_to_4f16_rtn(v);
}
#endif
#if __OPENCL_C_VERSION__ < 200
extern __attribute__((pure)) ushort4 __cvt_4f32_to_4f16_rtn(float4);
/* __local variant, compiled only when __OPENCL_C_VERSION__ < 200: convert v via __cvt_4f32_to_4f16_rtn and write the result at p + i * 4. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half4_rtn(float4 v, size_t i, __local half *p)
{
    __local ushort4 *dst = (__local ushort4 *)(p + i * 4);
    *dst = __cvt_4f32_to_4f16_rtn(v);
}
#endif
extern __attribute__((pure)) ushort4 __cvt_4f32_to_4f16_rtz(float4);
/* Convert v via __cvt_4f32_to_4f16_rtz and write the ushort4 result at p + i * 4. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half4_rtz(float4 v, size_t i, half *p)
{
    ushort4 *dst = (ushort4 *)(p + i * 4);
    *dst = __cvt_4f32_to_4f16_rtz(v);
}
#if __OPENCL_C_VERSION__ < 200
extern __attribute__((pure)) ushort4 __cvt_4f32_to_4f16_rtz(float4);
/* __global variant, compiled only when __OPENCL_C_VERSION__ < 200: convert v via __cvt_4f32_to_4f16_rtz and write the result at p + i * 4. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half4_rtz(float4 v, size_t i, __global half *p)
{
    __global ushort4 *dst = (__global ushort4 *)(p + i * 4);
    *dst = __cvt_4f32_to_4f16_rtz(v);
}
#endif
#if __OPENCL_C_VERSION__ < 200
extern __attribute__((pure)) ushort4 __cvt_4f32_to_4f16_rtz(float4);
/* __local variant, compiled only when __OPENCL_C_VERSION__ < 200: convert v via __cvt_4f32_to_4f16_rtz and write the result at p + i * 4. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half4_rtz(float4 v, size_t i, __local half *p)
{
    __local ushort4 *dst = (__local ushort4 *)(p + i * 4);
    *dst = __cvt_4f32_to_4f16_rtz(v);
}
#endif
extern __attribute__((pure)) ushort8 __cvt_8f32_to_8f16_cur(float8);
/* Convert v via __cvt_8f32_to_8f16_cur and write the ushort8 result at p + i * 8. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half8(float8 v, size_t i, half *p)
{
    ushort8 *dst = (ushort8 *)(p + i * 8);
    *dst = __cvt_8f32_to_8f16_cur(v);
}
#if __OPENCL_C_VERSION__ < 200
extern __attribute__((pure)) ushort8 __cvt_8f32_to_8f16_cur(float8);
/* __global variant, compiled only when __OPENCL_C_VERSION__ < 200: convert v via __cvt_8f32_to_8f16_cur and write the result at p + i * 8. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half8(float8 v, size_t i, __global half *p)
{
    __global ushort8 *dst = (__global ushort8 *)(p + i * 8);
    *dst = __cvt_8f32_to_8f16_cur(v);
}
#endif
#if __OPENCL_C_VERSION__ < 200
extern __attribute__((pure)) ushort8 __cvt_8f32_to_8f16_cur(float8);
/* __local variant, compiled only when __OPENCL_C_VERSION__ < 200: convert v via __cvt_8f32_to_8f16_cur and write the result at p + i * 8. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half8(float8 v, size_t i, __local half *p)
{
    __local ushort8 *dst = (__local ushort8 *)(p + i * 8);
    *dst = __cvt_8f32_to_8f16_cur(v);
}
#endif
extern __attribute__((pure)) ushort8 __cvt_8f32_to_8f16_rte(float8);
/* Convert v via __cvt_8f32_to_8f16_rte and write the ushort8 result at p + i * 8. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half8_rte(float8 v, size_t i, half *p)
{
    ushort8 *dst = (ushort8 *)(p + i * 8);
    *dst = __cvt_8f32_to_8f16_rte(v);
}
#if __OPENCL_C_VERSION__ < 200
extern __attribute__((pure)) ushort8 __cvt_8f32_to_8f16_rte(float8);
/* __global variant, compiled only when __OPENCL_C_VERSION__ < 200: convert v via __cvt_8f32_to_8f16_rte and write the result at p + i * 8. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half8_rte(float8 v, size_t i, __global half *p)
{
    __global ushort8 *dst = (__global ushort8 *)(p + i * 8);
    *dst = __cvt_8f32_to_8f16_rte(v);
}
#endif
#if __OPENCL_C_VERSION__ < 200
extern __attribute__((pure)) ushort8 __cvt_8f32_to_8f16_rte(float8);
/* __local variant, compiled only when __OPENCL_C_VERSION__ < 200: convert v via __cvt_8f32_to_8f16_rte and write the result at p + i * 8. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half8_rte(float8 v, size_t i, __local half *p)
{
    __local ushort8 *dst = (__local ushort8 *)(p + i * 8);
    *dst = __cvt_8f32_to_8f16_rte(v);
}
#endif
extern __attribute__((pure)) ushort8 __cvt_8f32_to_8f16_rtp(float8);
/* Convert v via __cvt_8f32_to_8f16_rtp and write the ushort8 result at p + i * 8. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half8_rtp(float8 v, size_t i, half *p)
{
    ushort8 *dst = (ushort8 *)(p + i * 8);
    *dst = __cvt_8f32_to_8f16_rtp(v);
}
#if __OPENCL_C_VERSION__ < 200
extern __attribute__((pure)) ushort8 __cvt_8f32_to_8f16_rtp(float8);
/* __global variant, compiled only when __OPENCL_C_VERSION__ < 200: convert v via __cvt_8f32_to_8f16_rtp and write the result at p + i * 8. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half8_rtp(float8 v, size_t i, __global half *p)
{
    __global ushort8 *dst = (__global ushort8 *)(p + i * 8);
    *dst = __cvt_8f32_to_8f16_rtp(v);
}
#endif
#if __OPENCL_C_VERSION__ < 200
extern __attribute__((pure)) ushort8 __cvt_8f32_to_8f16_rtp(float8);
/* __local variant, compiled only when __OPENCL_C_VERSION__ < 200: convert v via __cvt_8f32_to_8f16_rtp and write the result at p + i * 8. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half8_rtp(float8 v, size_t i, __local half *p)
{
    __local ushort8 *dst = (__local ushort8 *)(p + i * 8);
    *dst = __cvt_8f32_to_8f16_rtp(v);
}
#endif
extern __attribute__((pure)) ushort8 __cvt_8f32_to_8f16_rtn(float8);
/* Convert v via __cvt_8f32_to_8f16_rtn and write the ushort8 result at p + i * 8. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half8_rtn(float8 v, size_t i, half *p)
{
    ushort8 *dst = (ushort8 *)(p + i * 8);
    *dst = __cvt_8f32_to_8f16_rtn(v);
}
#if __OPENCL_C_VERSION__ < 200
extern __attribute__((pure)) ushort8 __cvt_8f32_to_8f16_rtn(float8);
/* __global variant, compiled only when __OPENCL_C_VERSION__ < 200: convert v via __cvt_8f32_to_8f16_rtn and write the result at p + i * 8. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half8_rtn(float8 v, size_t i, __global half *p)
{
    __global ushort8 *dst = (__global ushort8 *)(p + i * 8);
    *dst = __cvt_8f32_to_8f16_rtn(v);
}
#endif
#if __OPENCL_C_VERSION__ < 200
extern __attribute__((pure)) ushort8 __cvt_8f32_to_8f16_rtn(float8);
/* __local variant, compiled only when __OPENCL_C_VERSION__ < 200: convert v via __cvt_8f32_to_8f16_rtn and write the result at p + i * 8. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half8_rtn(float8 v, size_t i, __local half *p)
{
    __local ushort8 *dst = (__local ushort8 *)(p + i * 8);
    *dst = __cvt_8f32_to_8f16_rtn(v);
}
#endif
extern __attribute__((pure)) ushort8 __cvt_8f32_to_8f16_rtz(float8);
/* Convert v via __cvt_8f32_to_8f16_rtz and write the ushort8 result at p + i * 8. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half8_rtz(float8 v, size_t i, half *p)
{
    ushort8 *dst = (ushort8 *)(p + i * 8);
    *dst = __cvt_8f32_to_8f16_rtz(v);
}
#if __OPENCL_C_VERSION__ < 200
extern __attribute__((pure)) ushort8 __cvt_8f32_to_8f16_rtz(float8);
/* __global variant, compiled only when __OPENCL_C_VERSION__ < 200: convert v via __cvt_8f32_to_8f16_rtz and write the result at p + i * 8. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half8_rtz(float8 v, size_t i, __global half *p)
{
    __global ushort8 *dst = (__global ushort8 *)(p + i * 8);
    *dst = __cvt_8f32_to_8f16_rtz(v);
}
#endif
#if __OPENCL_C_VERSION__ < 200
extern __attribute__((pure)) ushort8 __cvt_8f32_to_8f16_rtz(float8);
/* __local variant, compiled only when __OPENCL_C_VERSION__ < 200: convert v via __cvt_8f32_to_8f16_rtz and write the result at p + i * 8. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half8_rtz(float8 v, size_t i, __local half *p)
{
    __local ushort8 *dst = (__local ushort8 *)(p + i * 8);
    *dst = __cvt_8f32_to_8f16_rtz(v);
}
#endif
extern __attribute__((pure)) ushort16 __cvt_16f32_to_16f16_cur(float16);
/* Convert v via __cvt_16f32_to_16f16_cur and write the ushort16 result at p + i * 16. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half16(float16 v, size_t i, half *p)
{
    ushort16 *dst = (ushort16 *)(p + i * 16);
    *dst = __cvt_16f32_to_16f16_cur(v);
}
#if __OPENCL_C_VERSION__ < 200
extern __attribute__((pure)) ushort16 __cvt_16f32_to_16f16_cur(float16);
/* __global variant, compiled only when __OPENCL_C_VERSION__ < 200: convert v via __cvt_16f32_to_16f16_cur and write the result at p + i * 16. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half16(float16 v, size_t i, __global half *p)
{
    __global ushort16 *dst = (__global ushort16 *)(p + i * 16);
    *dst = __cvt_16f32_to_16f16_cur(v);
}
#endif
#if __OPENCL_C_VERSION__ < 200
extern __attribute__((pure)) ushort16 __cvt_16f32_to_16f16_cur(float16);
/* __local variant, compiled only when __OPENCL_C_VERSION__ < 200: convert v via __cvt_16f32_to_16f16_cur and write the result at p + i * 16. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half16(float16 v, size_t i, __local half *p)
{
    __local ushort16 *dst = (__local ushort16 *)(p + i * 16);
    *dst = __cvt_16f32_to_16f16_cur(v);
}
#endif
extern __attribute__((pure)) ushort16 __cvt_16f32_to_16f16_rte(float16);
/* Convert v via __cvt_16f32_to_16f16_rte and write the ushort16 result at p + i * 16. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half16_rte(float16 v, size_t i, half *p)
{
    ushort16 *dst = (ushort16 *)(p + i * 16);
    *dst = __cvt_16f32_to_16f16_rte(v);
}
#if __OPENCL_C_VERSION__ < 200
extern __attribute__((pure)) ushort16 __cvt_16f32_to_16f16_rte(float16);
/* __global variant, compiled only when __OPENCL_C_VERSION__ < 200: convert v via __cvt_16f32_to_16f16_rte and write the result at p + i * 16. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half16_rte(float16 v, size_t i, __global half *p)
{
    __global ushort16 *dst = (__global ushort16 *)(p + i * 16);
    *dst = __cvt_16f32_to_16f16_rte(v);
}
#endif
#if __OPENCL_C_VERSION__ < 200
extern __attribute__((pure)) ushort16 __cvt_16f32_to_16f16_rte(float16);
/* __local variant, compiled only when __OPENCL_C_VERSION__ < 200: convert v via __cvt_16f32_to_16f16_rte and write the result at p + i * 16. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half16_rte(float16 v, size_t i, __local half *p)
{
    __local ushort16 *dst = (__local ushort16 *)(p + i * 16);
    *dst = __cvt_16f32_to_16f16_rte(v);
}
#endif
extern __attribute__((pure)) ushort16 __cvt_16f32_to_16f16_rtp(float16);
/* Convert v via __cvt_16f32_to_16f16_rtp and write the ushort16 result at p + i * 16. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half16_rtp(float16 v, size_t i, half *p)
{
    ushort16 *dst = (ushort16 *)(p + i * 16);
    *dst = __cvt_16f32_to_16f16_rtp(v);
}
#if __OPENCL_C_VERSION__ < 200
extern __attribute__((pure)) ushort16 __cvt_16f32_to_16f16_rtp(float16);
/* __global variant, compiled only when __OPENCL_C_VERSION__ < 200: convert v via __cvt_16f32_to_16f16_rtp and write the result at p + i * 16. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half16_rtp(float16 v, size_t i, __global half *p)
{
    __global ushort16 *dst = (__global ushort16 *)(p + i * 16);
    *dst = __cvt_16f32_to_16f16_rtp(v);
}
#endif
#if __OPENCL_C_VERSION__ < 200
extern __attribute__((pure)) ushort16 __cvt_16f32_to_16f16_rtp(float16);
/* __local variant, compiled only when __OPENCL_C_VERSION__ < 200: convert v via __cvt_16f32_to_16f16_rtp and write the result at p + i * 16. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half16_rtp(float16 v, size_t i, __local half *p)
{
    __local ushort16 *dst = (__local ushort16 *)(p + i * 16);
    *dst = __cvt_16f32_to_16f16_rtp(v);
}
#endif
extern __attribute__((pure)) ushort16 __cvt_16f32_to_16f16_rtn(float16);
/* Convert v via __cvt_16f32_to_16f16_rtn and write the ushort16 result at p + i * 16. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half16_rtn(float16 v, size_t i, half *p)
{
    ushort16 *dst = (ushort16 *)(p + i * 16);
    *dst = __cvt_16f32_to_16f16_rtn(v);
}
#if __OPENCL_C_VERSION__ < 200
extern __attribute__((pure)) ushort16 __cvt_16f32_to_16f16_rtn(float16);
/* __global variant, compiled only when __OPENCL_C_VERSION__ < 200: convert v via __cvt_16f32_to_16f16_rtn and write the result at p + i * 16. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half16_rtn(float16 v, size_t i, __global half *p)
{
    __global ushort16 *dst = (__global ushort16 *)(p + i * 16);
    *dst = __cvt_16f32_to_16f16_rtn(v);
}
#endif
#if __OPENCL_C_VERSION__ < 200
extern __attribute__((pure)) ushort16 __cvt_16f32_to_16f16_rtn(float16);
/* __local variant, compiled only when __OPENCL_C_VERSION__ < 200: convert v via __cvt_16f32_to_16f16_rtn and write the result at p + i * 16. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half16_rtn(float16 v, size_t i, __local half *p)
{
    __local ushort16 *dst = (__local ushort16 *)(p + i * 16);
    *dst = __cvt_16f32_to_16f16_rtn(v);
}
#endif
extern __attribute__((pure)) ushort16 __cvt_16f32_to_16f16_rtz(float16);
/* Convert v via __cvt_16f32_to_16f16_rtz and write the ushort16 result at p + i * 16. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half16_rtz(float16 v, size_t i, half *p)
{
    ushort16 *dst = (ushort16 *)(p + i * 16);
    *dst = __cvt_16f32_to_16f16_rtz(v);
}
#if __OPENCL_C_VERSION__ < 200
extern __attribute__((pure)) ushort16 __cvt_16f32_to_16f16_rtz(float16);
/* __global variant, compiled only when __OPENCL_C_VERSION__ < 200: convert v via __cvt_16f32_to_16f16_rtz and write the result at p + i * 16. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half16_rtz(float16 v, size_t i, __global half *p)
{
    __global ushort16 *dst = (__global ushort16 *)(p + i * 16);
    *dst = __cvt_16f32_to_16f16_rtz(v);
}
#endif
#if __OPENCL_C_VERSION__ < 200
extern __attribute__((pure)) ushort16 __cvt_16f32_to_16f16_rtz(float16);
/* __local variant, compiled only when __OPENCL_C_VERSION__ < 200: convert v via __cvt_16f32_to_16f16_rtz and write the result at p + i * 16. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half16_rtz(float16 v, size_t i, __local half *p)
{
    __local ushort16 *dst = (__local ushort16 *)(p + i * 16);
    *dst = __cvt_16f32_to_16f16_rtz(v);
}
#endif
extern __attribute__((pure)) ushort2 __cvt_2f64_to_2f16_cur(double2);
/* Convert v via __cvt_2f64_to_2f16_cur and write the ushort2 result at p + i * 2. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half2(double2 v, size_t i, half *p)
{
    ushort2 *dst = (ushort2 *)(p + i * 2);
    *dst = __cvt_2f64_to_2f16_cur(v);
}
#if __OPENCL_C_VERSION__ < 200
extern __attribute__((pure)) ushort2 __cvt_2f64_to_2f16_cur(double2);
/* __global variant, compiled only when __OPENCL_C_VERSION__ < 200: convert v via __cvt_2f64_to_2f16_cur and write the result at p + i * 2. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half2(double2 v, size_t i, __global half *p)
{
    __global ushort2 *dst = (__global ushort2 *)(p + i * 2);
    *dst = __cvt_2f64_to_2f16_cur(v);
}
#endif
#if __OPENCL_C_VERSION__ < 200
extern __attribute__((pure)) ushort2 __cvt_2f64_to_2f16_cur(double2);
/* __local variant, compiled only when __OPENCL_C_VERSION__ < 200: convert v via __cvt_2f64_to_2f16_cur and write the result at p + i * 2. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half2(double2 v, size_t i, __local half *p)
{
    __local ushort2 *dst = (__local ushort2 *)(p + i * 2);
    *dst = __cvt_2f64_to_2f16_cur(v);
}
#endif
extern __attribute__((pure)) ushort2 __cvt_2f64_to_2f16_rte(double2);
/* Convert v via __cvt_2f64_to_2f16_rte and write the ushort2 result at p + i * 2. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half2_rte(double2 v, size_t i, half *p)
{
    ushort2 *dst = (ushort2 *)(p + i * 2);
    *dst = __cvt_2f64_to_2f16_rte(v);
}
#if __OPENCL_C_VERSION__ < 200
extern __attribute__((pure)) ushort2 __cvt_2f64_to_2f16_rte(double2);
/* __global variant, compiled only when __OPENCL_C_VERSION__ < 200: convert v via __cvt_2f64_to_2f16_rte and write the result at p + i * 2. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half2_rte(double2 v, size_t i, __global half *p)
{
    __global ushort2 *dst = (__global ushort2 *)(p + i * 2);
    *dst = __cvt_2f64_to_2f16_rte(v);
}
#endif
#if __OPENCL_C_VERSION__ < 200
extern __attribute__((pure)) ushort2 __cvt_2f64_to_2f16_rte(double2);
/* __local variant, compiled only when __OPENCL_C_VERSION__ < 200: convert v via __cvt_2f64_to_2f16_rte and write the result at p + i * 2. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half2_rte(double2 v, size_t i, __local half *p)
{
    __local ushort2 *dst = (__local ushort2 *)(p + i * 2);
    *dst = __cvt_2f64_to_2f16_rte(v);
}
#endif
extern __attribute__((pure)) ushort2 __cvt_2f64_to_2f16_rtp(double2);
/* Convert v via __cvt_2f64_to_2f16_rtp and write the ushort2 result at p + i * 2. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half2_rtp(double2 v, size_t i, half *p)
{
    ushort2 *dst = (ushort2 *)(p + i * 2);
    *dst = __cvt_2f64_to_2f16_rtp(v);
}
#if __OPENCL_C_VERSION__ < 200
extern __attribute__((pure)) ushort2 __cvt_2f64_to_2f16_rtp(double2);
/* __global variant, compiled only when __OPENCL_C_VERSION__ < 200: convert v via __cvt_2f64_to_2f16_rtp and write the result at p + i * 2. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half2_rtp(double2 v, size_t i, __global half *p)
{
    __global ushort2 *dst = (__global ushort2 *)(p + i * 2);
    *dst = __cvt_2f64_to_2f16_rtp(v);
}
#endif
#if __OPENCL_C_VERSION__ < 200
extern __attribute__((pure)) ushort2 __cvt_2f64_to_2f16_rtp(double2);
/* __local variant, compiled only when __OPENCL_C_VERSION__ < 200: convert v via __cvt_2f64_to_2f16_rtp and write the result at p + i * 2. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half2_rtp(double2 v, size_t i, __local half *p)
{
    __local ushort2 *dst = (__local ushort2 *)(p + i * 2);
    *dst = __cvt_2f64_to_2f16_rtp(v);
}
#endif
extern __attribute__((pure)) ushort2 __cvt_2f64_to_2f16_rtn(double2);
/* Convert v via __cvt_2f64_to_2f16_rtn and write the ushort2 result at p + i * 2. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half2_rtn(double2 v, size_t i, half *p)
{
    ushort2 *dst = (ushort2 *)(p + i * 2);
    *dst = __cvt_2f64_to_2f16_rtn(v);
}
#if __OPENCL_C_VERSION__ < 200
extern __attribute__((pure)) ushort2 __cvt_2f64_to_2f16_rtn(double2);
/* __global variant, compiled only when __OPENCL_C_VERSION__ < 200: convert v via __cvt_2f64_to_2f16_rtn and write the result at p + i * 2. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half2_rtn(double2 v, size_t i, __global half *p)
{
    __global ushort2 *dst = (__global ushort2 *)(p + i * 2);
    *dst = __cvt_2f64_to_2f16_rtn(v);
}
#endif
#if __OPENCL_C_VERSION__ < 200
extern __attribute__((pure)) ushort2 __cvt_2f64_to_2f16_rtn(double2);
/* __local variant, compiled only when __OPENCL_C_VERSION__ < 200: convert v via __cvt_2f64_to_2f16_rtn and write the result at p + i * 2. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half2_rtn(double2 v, size_t i, __local half *p)
{
    __local ushort2 *dst = (__local ushort2 *)(p + i * 2);
    *dst = __cvt_2f64_to_2f16_rtn(v);
}
#endif
extern __attribute__((pure)) ushort2 __cvt_2f64_to_2f16_rtz(double2);
/* Convert v via __cvt_2f64_to_2f16_rtz and write the ushort2 result at p + i * 2. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half2_rtz(double2 v, size_t i, half *p)
{
    ushort2 *dst = (ushort2 *)(p + i * 2);
    *dst = __cvt_2f64_to_2f16_rtz(v);
}
#if __OPENCL_C_VERSION__ < 200
extern __attribute__((pure)) ushort2 __cvt_2f64_to_2f16_rtz(double2);
/* __global variant, compiled only when __OPENCL_C_VERSION__ < 200: convert v via __cvt_2f64_to_2f16_rtz and write the result at p + i * 2. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half2_rtz(double2 v, size_t i, __global half *p)
{
    __global ushort2 *dst = (__global ushort2 *)(p + i * 2);
    *dst = __cvt_2f64_to_2f16_rtz(v);
}
#endif
#if __OPENCL_C_VERSION__ < 200
extern __attribute__((pure)) ushort2 __cvt_2f64_to_2f16_rtz(double2);
/* __local variant, compiled only when __OPENCL_C_VERSION__ < 200: convert v via __cvt_2f64_to_2f16_rtz and write the result at p + i * 2. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half2_rtz(double2 v, size_t i, __local half *p)
{
    __local ushort2 *dst = (__local ushort2 *)(p + i * 2);
    *dst = __cvt_2f64_to_2f16_rtz(v);
}
#endif
extern __attribute__((pure)) ushort3 __cvt_3f64_to_3f16_cur(double3);
/* Convert v via __cvt_3f64_to_3f16_cur into lanes 0-2 of a ushort4 and store all four lanes at p + i * 4; lane 3 is never assigned. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half3(double3 v, size_t i, half *p)
{
    ushort4 packed;
    packed.s012 = __cvt_3f64_to_3f16_cur(v);
    ushort4 *dst = (ushort4 *)(p + i * 4);
    *dst = packed;
}
#if __OPENCL_C_VERSION__ < 200
extern __attribute__((pure)) ushort3 __cvt_3f64_to_3f16_cur(double3);
/* __global variant, compiled only when __OPENCL_C_VERSION__ < 200: convert v via __cvt_3f64_to_3f16_cur into lanes 0-2 of a ushort4 and store all four lanes at p + i * 4; lane 3 is never assigned. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half3(double3 v, size_t i, __global half *p)
{
    ushort4 packed;
    packed.s012 = __cvt_3f64_to_3f16_cur(v);
    __global ushort4 *dst = (__global ushort4 *)(p + i * 4);
    *dst = packed;
}
#endif
#if __OPENCL_C_VERSION__ < 200
extern __attribute__((pure)) ushort3 __cvt_3f64_to_3f16_cur(double3);
/* __local variant, compiled only when __OPENCL_C_VERSION__ < 200: convert v via __cvt_3f64_to_3f16_cur into lanes 0-2 of a ushort4 and store all four lanes at p + i * 4; lane 3 is never assigned. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half3(double3 v, size_t i, __local half *p)
{
    ushort4 packed;
    packed.s012 = __cvt_3f64_to_3f16_cur(v);
    __local ushort4 *dst = (__local ushort4 *)(p + i * 4);
    *dst = packed;
}
#endif
extern __attribute__((pure)) ushort3 __cvt_3f64_to_3f16_rte(double3);
/* Convert v via __cvt_3f64_to_3f16_rte into lanes 0-2 of a ushort4 and store all four lanes at p + i * 4; lane 3 is never assigned. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half3_rte(double3 v, size_t i, half *p)
{
    ushort4 packed;
    packed.s012 = __cvt_3f64_to_3f16_rte(v);
    ushort4 *dst = (ushort4 *)(p + i * 4);
    *dst = packed;
}
#if __OPENCL_C_VERSION__ < 200
extern __attribute__((pure)) ushort3 __cvt_3f64_to_3f16_rte(double3);
/* __global variant, compiled only when __OPENCL_C_VERSION__ < 200: convert v via __cvt_3f64_to_3f16_rte into lanes 0-2 of a ushort4 and store all four lanes at p + i * 4; lane 3 is never assigned. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half3_rte(double3 v, size_t i, __global half *p)
{
    ushort4 packed;
    packed.s012 = __cvt_3f64_to_3f16_rte(v);
    __global ushort4 *dst = (__global ushort4 *)(p + i * 4);
    *dst = packed;
}
#endif
#if __OPENCL_C_VERSION__ < 200
extern __attribute__((pure)) ushort3 __cvt_3f64_to_3f16_rte(double3);
/* __local variant, compiled only when __OPENCL_C_VERSION__ < 200: convert v via __cvt_3f64_to_3f16_rte into lanes 0-2 of a ushort4 and store all four lanes at p + i * 4; lane 3 is never assigned. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half3_rte(double3 v, size_t i, __local half *p)
{
    ushort4 packed;
    packed.s012 = __cvt_3f64_to_3f16_rte(v);
    __local ushort4 *dst = (__local ushort4 *)(p + i * 4);
    *dst = packed;
}
#endif
extern __attribute__((pure)) ushort3 __cvt_3f64_to_3f16_rtp(double3);
/* Convert v via __cvt_3f64_to_3f16_rtp into lanes 0-2 of a ushort4 and store all four lanes at p + i * 4; lane 3 is never assigned. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half3_rtp(double3 v, size_t i, half *p)
{
    ushort4 packed;
    packed.s012 = __cvt_3f64_to_3f16_rtp(v);
    ushort4 *dst = (ushort4 *)(p + i * 4);
    *dst = packed;
}
#if __OPENCL_C_VERSION__ < 200
extern __attribute__((pure)) ushort3 __cvt_3f64_to_3f16_rtp(double3);
/* __global variant, compiled only when __OPENCL_C_VERSION__ < 200: convert v via __cvt_3f64_to_3f16_rtp into lanes 0-2 of a ushort4 and store all four lanes at p + i * 4; lane 3 is never assigned. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half3_rtp(double3 v, size_t i, __global half *p)
{
    ushort4 packed;
    packed.s012 = __cvt_3f64_to_3f16_rtp(v);
    __global ushort4 *dst = (__global ushort4 *)(p + i * 4);
    *dst = packed;
}
#endif
#if __OPENCL_C_VERSION__ < 200
extern __attribute__((pure)) ushort3 __cvt_3f64_to_3f16_rtp(double3);
/* __local variant, compiled only when __OPENCL_C_VERSION__ < 200: convert v via __cvt_3f64_to_3f16_rtp into lanes 0-2 of a ushort4 and store all four lanes at p + i * 4; lane 3 is never assigned. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half3_rtp(double3 v, size_t i, __local half *p)
{
    ushort4 packed;
    packed.s012 = __cvt_3f64_to_3f16_rtp(v);
    __local ushort4 *dst = (__local ushort4 *)(p + i * 4);
    *dst = packed;
}
#endif
extern __attribute__((pure)) ushort3 __cvt_3f64_to_3f16_rtn(double3);
/* Convert v via __cvt_3f64_to_3f16_rtn into lanes 0-2 of a ushort4 and store all four lanes at p + i * 4; lane 3 is never assigned. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half3_rtn(double3 v, size_t i, half *p)
{
    ushort4 packed;
    packed.s012 = __cvt_3f64_to_3f16_rtn(v);
    ushort4 *dst = (ushort4 *)(p + i * 4);
    *dst = packed;
}
#if __OPENCL_C_VERSION__ < 200
extern __attribute__((pure)) ushort3 __cvt_3f64_to_3f16_rtn(double3);
/* __global variant, compiled only when __OPENCL_C_VERSION__ < 200: convert v via __cvt_3f64_to_3f16_rtn into lanes 0-2 of a ushort4 and store all four lanes at p + i * 4; lane 3 is never assigned. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half3_rtn(double3 v, size_t i, __global half *p)
{
    ushort4 packed;
    packed.s012 = __cvt_3f64_to_3f16_rtn(v);
    __global ushort4 *dst = (__global ushort4 *)(p + i * 4);
    *dst = packed;
}
#endif
#if __OPENCL_C_VERSION__ < 200
extern __attribute__((pure)) ushort3 __cvt_3f64_to_3f16_rtn(double3);
/* __local variant, compiled only when __OPENCL_C_VERSION__ < 200: convert v via __cvt_3f64_to_3f16_rtn into lanes 0-2 of a ushort4 and store all four lanes at p + i * 4; lane 3 is never assigned. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half3_rtn(double3 v, size_t i, __local half *p)
{
    ushort4 packed;
    packed.s012 = __cvt_3f64_to_3f16_rtn(v);
    __local ushort4 *dst = (__local ushort4 *)(p + i * 4);
    *dst = packed;
}
#endif
extern __attribute__((pure)) ushort3 __cvt_3f64_to_3f16_rtz(double3);
/* Convert v via __cvt_3f64_to_3f16_rtz into lanes 0-2 of a ushort4 and store all four lanes at p + i * 4; lane 3 is never assigned. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half3_rtz(double3 v, size_t i, half *p)
{
    ushort4 packed;
    packed.s012 = __cvt_3f64_to_3f16_rtz(v);
    ushort4 *dst = (ushort4 *)(p + i * 4);
    *dst = packed;
}
#if __OPENCL_C_VERSION__ < 200
extern __attribute__((pure)) ushort3 __cvt_3f64_to_3f16_rtz(double3);
/* __global variant, compiled only when __OPENCL_C_VERSION__ < 200: convert v via __cvt_3f64_to_3f16_rtz into lanes 0-2 of a ushort4 and store all four lanes at p + i * 4; lane 3 is never assigned. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half3_rtz(double3 v, size_t i, __global half *p)
{
    ushort4 packed;
    packed.s012 = __cvt_3f64_to_3f16_rtz(v);
    __global ushort4 *dst = (__global ushort4 *)(p + i * 4);
    *dst = packed;
}
#endif
#if __OPENCL_C_VERSION__ < 200
extern __attribute__((pure)) ushort3 __cvt_3f64_to_3f16_rtz(double3);
/* __local variant, compiled only when __OPENCL_C_VERSION__ < 200: convert v via __cvt_3f64_to_3f16_rtz into lanes 0-2 of a ushort4 and store all four lanes at p + i * 4; lane 3 is never assigned. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half3_rtz(double3 v, size_t i, __local half *p)
{
    ushort4 packed;
    packed.s012 = __cvt_3f64_to_3f16_rtz(v);
    __local ushort4 *dst = (__local ushort4 *)(p + i * 4);
    *dst = packed;
}
#endif
extern __attribute__((pure)) ushort4 __cvt_4f64_to_4f16_cur(double4);
/* Convert v via __cvt_4f64_to_4f16_cur and write the ushort4 result at p + i * 4. */
__attribute__((overloadable, always_inline, weak)) void
vstorea_half4(double4 v, size_t i, half *p)
{
    ushort4 *dst = (ushort4 *)(p + i * 4);
    *dst = __cvt_4f64_to_4f16_cur(v);
}
#if __OPENCL_C_VERSION__ < 200
/*
 * vstorea_half4, __global overload (built only when
 * __OPENCL_C_VERSION__ < 200). Converts v with __cvt_4f64_to_4f16_cur and
 * writes the ushort4 result at p + i * 4 (counted in half elements).
 */
extern __attribute__((pure)) ushort4 __cvt_4f64_to_4f16_cur(double4);
__attribute__((overloadable, always_inline, weak)) void
vstorea_half4(double4 v, size_t i, __global half *p)
{
    __global ushort4 *dst = (__global ushort4 *)(p + i * 4);
    const ushort4 bits = __cvt_4f64_to_4f16_cur(v);

    *dst = bits;
}
#endif
#if __OPENCL_C_VERSION__ < 200
/*
 * vstorea_half4, __local overload (built only when
 * __OPENCL_C_VERSION__ < 200). Converts v with __cvt_4f64_to_4f16_cur and
 * writes the ushort4 result at p + i * 4 (counted in half elements).
 */
extern __attribute__((pure)) ushort4 __cvt_4f64_to_4f16_cur(double4);
__attribute__((overloadable, always_inline, weak)) void
vstorea_half4(double4 v, size_t i, __local half *p)
{
    __local ushort4 *dst = (__local ushort4 *)(p + i * 4);
    const ushort4 bits = __cvt_4f64_to_4f16_cur(v);

    *dst = bits;
}
#endif
/*
 * vstorea_half4_rte, overload for an unqualified half pointer.
 * Converts v with __cvt_4f64_to_4f16_rte (declared here, defined elsewhere)
 * and writes the ushort4 result at p + i * 4 (counted in half elements).
 */
extern __attribute__((pure)) ushort4 __cvt_4f64_to_4f16_rte(double4);
__attribute__((overloadable, always_inline, weak)) void
vstorea_half4_rte(double4 v, size_t i, half *p)
{
    ushort4 *dst = (ushort4 *)(p + i * 4);
    const ushort4 bits = __cvt_4f64_to_4f16_rte(v);

    *dst = bits;
}
#if __OPENCL_C_VERSION__ < 200
/*
 * vstorea_half4_rte, __global overload (built only when
 * __OPENCL_C_VERSION__ < 200). Converts v with __cvt_4f64_to_4f16_rte and
 * writes the ushort4 result at p + i * 4 (counted in half elements).
 */
extern __attribute__((pure)) ushort4 __cvt_4f64_to_4f16_rte(double4);
__attribute__((overloadable, always_inline, weak)) void
vstorea_half4_rte(double4 v, size_t i, __global half *p)
{
    __global ushort4 *dst = (__global ushort4 *)(p + i * 4);
    const ushort4 bits = __cvt_4f64_to_4f16_rte(v);

    *dst = bits;
}
#endif
#if __OPENCL_C_VERSION__ < 200
/*
 * vstorea_half4_rte, __local overload (built only when
 * __OPENCL_C_VERSION__ < 200). Converts v with __cvt_4f64_to_4f16_rte and
 * writes the ushort4 result at p + i * 4 (counted in half elements).
 */
extern __attribute__((pure)) ushort4 __cvt_4f64_to_4f16_rte(double4);
__attribute__((overloadable, always_inline, weak)) void
vstorea_half4_rte(double4 v, size_t i, __local half *p)
{
    __local ushort4 *dst = (__local ushort4 *)(p + i * 4);
    const ushort4 bits = __cvt_4f64_to_4f16_rte(v);

    *dst = bits;
}
#endif
/*
 * vstorea_half4_rtp, overload for an unqualified half pointer.
 * Converts v with __cvt_4f64_to_4f16_rtp (declared here, defined elsewhere)
 * and writes the ushort4 result at p + i * 4 (counted in half elements).
 */
extern __attribute__((pure)) ushort4 __cvt_4f64_to_4f16_rtp(double4);
__attribute__((overloadable, always_inline, weak)) void
vstorea_half4_rtp(double4 v, size_t i, half *p)
{
    ushort4 *dst = (ushort4 *)(p + i * 4);
    const ushort4 bits = __cvt_4f64_to_4f16_rtp(v);

    *dst = bits;
}
#if __OPENCL_C_VERSION__ < 200
/*
 * vstorea_half4_rtp, __global overload (built only when
 * __OPENCL_C_VERSION__ < 200). Converts v with __cvt_4f64_to_4f16_rtp and
 * writes the ushort4 result at p + i * 4 (counted in half elements).
 */
extern __attribute__((pure)) ushort4 __cvt_4f64_to_4f16_rtp(double4);
__attribute__((overloadable, always_inline, weak)) void
vstorea_half4_rtp(double4 v, size_t i, __global half *p)
{
    __global ushort4 *dst = (__global ushort4 *)(p + i * 4);
    const ushort4 bits = __cvt_4f64_to_4f16_rtp(v);

    *dst = bits;
}
#endif
#if __OPENCL_C_VERSION__ < 200
/*
 * vstorea_half4_rtp, __local overload (built only when
 * __OPENCL_C_VERSION__ < 200). Converts v with __cvt_4f64_to_4f16_rtp and
 * writes the ushort4 result at p + i * 4 (counted in half elements).
 */
extern __attribute__((pure)) ushort4 __cvt_4f64_to_4f16_rtp(double4);
__attribute__((overloadable, always_inline, weak)) void
vstorea_half4_rtp(double4 v, size_t i, __local half *p)
{
    __local ushort4 *dst = (__local ushort4 *)(p + i * 4);
    const ushort4 bits = __cvt_4f64_to_4f16_rtp(v);

    *dst = bits;
}
#endif
/*
 * vstorea_half4_rtn, overload for an unqualified half pointer.
 * Converts v with __cvt_4f64_to_4f16_rtn (declared here, defined elsewhere)
 * and writes the ushort4 result at p + i * 4 (counted in half elements).
 */
extern __attribute__((pure)) ushort4 __cvt_4f64_to_4f16_rtn(double4);
__attribute__((overloadable, always_inline, weak)) void
vstorea_half4_rtn(double4 v, size_t i, half *p)
{
    ushort4 *dst = (ushort4 *)(p + i * 4);
    const ushort4 bits = __cvt_4f64_to_4f16_rtn(v);

    *dst = bits;
}
#if __OPENCL_C_VERSION__ < 200
/*
 * vstorea_half4_rtn, __global overload (built only when
 * __OPENCL_C_VERSION__ < 200). Converts v with __cvt_4f64_to_4f16_rtn and
 * writes the ushort4 result at p + i * 4 (counted in half elements).
 */
extern __attribute__((pure)) ushort4 __cvt_4f64_to_4f16_rtn(double4);
__attribute__((overloadable, always_inline, weak)) void
vstorea_half4_rtn(double4 v, size_t i, __global half *p)
{
    __global ushort4 *dst = (__global ushort4 *)(p + i * 4);
    const ushort4 bits = __cvt_4f64_to_4f16_rtn(v);

    *dst = bits;
}
#endif
#if __OPENCL_C_VERSION__ < 200
/*
 * vstorea_half4_rtn, __local overload (built only when
 * __OPENCL_C_VERSION__ < 200). Converts v with __cvt_4f64_to_4f16_rtn and
 * writes the ushort4 result at p + i * 4 (counted in half elements).
 */
extern __attribute__((pure)) ushort4 __cvt_4f64_to_4f16_rtn(double4);
__attribute__((overloadable, always_inline, weak)) void
vstorea_half4_rtn(double4 v, size_t i, __local half *p)
{
    __local ushort4 *dst = (__local ushort4 *)(p + i * 4);
    const ushort4 bits = __cvt_4f64_to_4f16_rtn(v);

    *dst = bits;
}
#endif
/*
 * vstorea_half4_rtz, overload for an unqualified half pointer.
 * Converts v with __cvt_4f64_to_4f16_rtz (declared here, defined elsewhere)
 * and writes the ushort4 result at p + i * 4 (counted in half elements).
 */
extern __attribute__((pure)) ushort4 __cvt_4f64_to_4f16_rtz(double4);
__attribute__((overloadable, always_inline, weak)) void
vstorea_half4_rtz(double4 v, size_t i, half *p)
{
    ushort4 *dst = (ushort4 *)(p + i * 4);
    const ushort4 bits = __cvt_4f64_to_4f16_rtz(v);

    *dst = bits;
}
#if __OPENCL_C_VERSION__ < 200
/*
 * vstorea_half4_rtz, __global overload (built only when
 * __OPENCL_C_VERSION__ < 200). Converts v with __cvt_4f64_to_4f16_rtz and
 * writes the ushort4 result at p + i * 4 (counted in half elements).
 */
extern __attribute__((pure)) ushort4 __cvt_4f64_to_4f16_rtz(double4);
__attribute__((overloadable, always_inline, weak)) void
vstorea_half4_rtz(double4 v, size_t i, __global half *p)
{
    __global ushort4 *dst = (__global ushort4 *)(p + i * 4);
    const ushort4 bits = __cvt_4f64_to_4f16_rtz(v);

    *dst = bits;
}
#endif
#if __OPENCL_C_VERSION__ < 200
/*
 * vstorea_half4_rtz, __local overload (built only when
 * __OPENCL_C_VERSION__ < 200). Converts v with __cvt_4f64_to_4f16_rtz and
 * writes the ushort4 result at p + i * 4 (counted in half elements).
 */
extern __attribute__((pure)) ushort4 __cvt_4f64_to_4f16_rtz(double4);
__attribute__((overloadable, always_inline, weak)) void
vstorea_half4_rtz(double4 v, size_t i, __local half *p)
{
    __local ushort4 *dst = (__local ushort4 *)(p + i * 4);
    const ushort4 bits = __cvt_4f64_to_4f16_rtz(v);

    *dst = bits;
}
#endif
/*
 * vstorea_half8, overload for an unqualified half pointer.
 * Converts v with __cvt_8f64_to_8f16_cur (declared here, defined elsewhere)
 * and writes the ushort8 result at p + i * 8 (counted in half elements).
 */
extern __attribute__((pure)) ushort8 __cvt_8f64_to_8f16_cur(double8);
__attribute__((overloadable, always_inline, weak)) void
vstorea_half8(double8 v, size_t i, half *p)
{
    ushort8 *dst = (ushort8 *)(p + i * 8);
    const ushort8 bits = __cvt_8f64_to_8f16_cur(v);

    *dst = bits;
}
#if __OPENCL_C_VERSION__ < 200
/*
 * vstorea_half8, __global overload (built only when
 * __OPENCL_C_VERSION__ < 200). Converts v with __cvt_8f64_to_8f16_cur and
 * writes the ushort8 result at p + i * 8 (counted in half elements).
 */
extern __attribute__((pure)) ushort8 __cvt_8f64_to_8f16_cur(double8);
__attribute__((overloadable, always_inline, weak)) void
vstorea_half8(double8 v, size_t i, __global half *p)
{
    __global ushort8 *dst = (__global ushort8 *)(p + i * 8);
    const ushort8 bits = __cvt_8f64_to_8f16_cur(v);

    *dst = bits;
}
#endif
#if __OPENCL_C_VERSION__ < 200
/*
 * vstorea_half8, __local overload (built only when
 * __OPENCL_C_VERSION__ < 200). Converts v with __cvt_8f64_to_8f16_cur and
 * writes the ushort8 result at p + i * 8 (counted in half elements).
 */
extern __attribute__((pure)) ushort8 __cvt_8f64_to_8f16_cur(double8);
__attribute__((overloadable, always_inline, weak)) void
vstorea_half8(double8 v, size_t i, __local half *p)
{
    __local ushort8 *dst = (__local ushort8 *)(p + i * 8);
    const ushort8 bits = __cvt_8f64_to_8f16_cur(v);

    *dst = bits;
}
#endif
/*
 * vstorea_half8_rte, overload for an unqualified half pointer.
 * Converts v with __cvt_8f64_to_8f16_rte (declared here, defined elsewhere)
 * and writes the ushort8 result at p + i * 8 (counted in half elements).
 */
extern __attribute__((pure)) ushort8 __cvt_8f64_to_8f16_rte(double8);
__attribute__((overloadable, always_inline, weak)) void
vstorea_half8_rte(double8 v, size_t i, half *p)
{
    ushort8 *dst = (ushort8 *)(p + i * 8);
    const ushort8 bits = __cvt_8f64_to_8f16_rte(v);

    *dst = bits;
}
#if __OPENCL_C_VERSION__ < 200
/*
 * vstorea_half8_rte, __global overload (built only when
 * __OPENCL_C_VERSION__ < 200). Converts v with __cvt_8f64_to_8f16_rte and
 * writes the ushort8 result at p + i * 8 (counted in half elements).
 */
extern __attribute__((pure)) ushort8 __cvt_8f64_to_8f16_rte(double8);
__attribute__((overloadable, always_inline, weak)) void
vstorea_half8_rte(double8 v, size_t i, __global half *p)
{
    __global ushort8 *dst = (__global ushort8 *)(p + i * 8);
    const ushort8 bits = __cvt_8f64_to_8f16_rte(v);

    *dst = bits;
}
#endif
#if __OPENCL_C_VERSION__ < 200
/*
 * vstorea_half8_rte, __local overload (built only when
 * __OPENCL_C_VERSION__ < 200). Converts v with __cvt_8f64_to_8f16_rte and
 * writes the ushort8 result at p + i * 8 (counted in half elements).
 */
extern __attribute__((pure)) ushort8 __cvt_8f64_to_8f16_rte(double8);
__attribute__((overloadable, always_inline, weak)) void
vstorea_half8_rte(double8 v, size_t i, __local half *p)
{
    __local ushort8 *dst = (__local ushort8 *)(p + i * 8);
    const ushort8 bits = __cvt_8f64_to_8f16_rte(v);

    *dst = bits;
}
#endif
/*
 * vstorea_half8_rtp, overload for an unqualified half pointer.
 * Converts v with __cvt_8f64_to_8f16_rtp (declared here, defined elsewhere)
 * and writes the ushort8 result at p + i * 8 (counted in half elements).
 */
extern __attribute__((pure)) ushort8 __cvt_8f64_to_8f16_rtp(double8);
__attribute__((overloadable, always_inline, weak)) void
vstorea_half8_rtp(double8 v, size_t i, half *p)
{
    ushort8 *dst = (ushort8 *)(p + i * 8);
    const ushort8 bits = __cvt_8f64_to_8f16_rtp(v);

    *dst = bits;
}
#if __OPENCL_C_VERSION__ < 200
/*
 * vstorea_half8_rtp, __global overload (built only when
 * __OPENCL_C_VERSION__ < 200). Converts v with __cvt_8f64_to_8f16_rtp and
 * writes the ushort8 result at p + i * 8 (counted in half elements).
 */
extern __attribute__((pure)) ushort8 __cvt_8f64_to_8f16_rtp(double8);
__attribute__((overloadable, always_inline, weak)) void
vstorea_half8_rtp(double8 v, size_t i, __global half *p)
{
    __global ushort8 *dst = (__global ushort8 *)(p + i * 8);
    const ushort8 bits = __cvt_8f64_to_8f16_rtp(v);

    *dst = bits;
}
#endif
#if __OPENCL_C_VERSION__ < 200
/*
 * vstorea_half8_rtp, __local overload (built only when
 * __OPENCL_C_VERSION__ < 200). Converts v with __cvt_8f64_to_8f16_rtp and
 * writes the ushort8 result at p + i * 8 (counted in half elements).
 */
extern __attribute__((pure)) ushort8 __cvt_8f64_to_8f16_rtp(double8);
__attribute__((overloadable, always_inline, weak)) void
vstorea_half8_rtp(double8 v, size_t i, __local half *p)
{
    __local ushort8 *dst = (__local ushort8 *)(p + i * 8);
    const ushort8 bits = __cvt_8f64_to_8f16_rtp(v);

    *dst = bits;
}
#endif
/*
 * vstorea_half8_rtn, overload for an unqualified half pointer.
 * Converts v with __cvt_8f64_to_8f16_rtn (declared here, defined elsewhere)
 * and writes the ushort8 result at p + i * 8 (counted in half elements).
 */
extern __attribute__((pure)) ushort8 __cvt_8f64_to_8f16_rtn(double8);
__attribute__((overloadable, always_inline, weak)) void
vstorea_half8_rtn(double8 v, size_t i, half *p)
{
    ushort8 *dst = (ushort8 *)(p + i * 8);
    const ushort8 bits = __cvt_8f64_to_8f16_rtn(v);

    *dst = bits;
}
#if __OPENCL_C_VERSION__ < 200
/*
 * vstorea_half8_rtn, __global overload (built only when
 * __OPENCL_C_VERSION__ < 200). Converts v with __cvt_8f64_to_8f16_rtn and
 * writes the ushort8 result at p + i * 8 (counted in half elements).
 */
extern __attribute__((pure)) ushort8 __cvt_8f64_to_8f16_rtn(double8);
__attribute__((overloadable, always_inline, weak)) void
vstorea_half8_rtn(double8 v, size_t i, __global half *p)
{
    __global ushort8 *dst = (__global ushort8 *)(p + i * 8);
    const ushort8 bits = __cvt_8f64_to_8f16_rtn(v);

    *dst = bits;
}
#endif
#if __OPENCL_C_VERSION__ < 200
/*
 * vstorea_half8_rtn, __local overload (built only when
 * __OPENCL_C_VERSION__ < 200). Converts v with __cvt_8f64_to_8f16_rtn and
 * writes the ushort8 result at p + i * 8 (counted in half elements).
 */
extern __attribute__((pure)) ushort8 __cvt_8f64_to_8f16_rtn(double8);
__attribute__((overloadable, always_inline, weak)) void
vstorea_half8_rtn(double8 v, size_t i, __local half *p)
{
    __local ushort8 *dst = (__local ushort8 *)(p + i * 8);
    const ushort8 bits = __cvt_8f64_to_8f16_rtn(v);

    *dst = bits;
}
#endif
/*
 * vstorea_half8_rtz, overload for an unqualified half pointer.
 * Converts v with __cvt_8f64_to_8f16_rtz (declared here, defined elsewhere)
 * and writes the ushort8 result at p + i * 8 (counted in half elements).
 */
extern __attribute__((pure)) ushort8 __cvt_8f64_to_8f16_rtz(double8);
__attribute__((overloadable, always_inline, weak)) void
vstorea_half8_rtz(double8 v, size_t i, half *p)
{
    ushort8 *dst = (ushort8 *)(p + i * 8);
    const ushort8 bits = __cvt_8f64_to_8f16_rtz(v);

    *dst = bits;
}
#if __OPENCL_C_VERSION__ < 200
/*
 * vstorea_half8_rtz, __global overload (built only when
 * __OPENCL_C_VERSION__ < 200). Converts v with __cvt_8f64_to_8f16_rtz and
 * writes the ushort8 result at p + i * 8 (counted in half elements).
 */
extern __attribute__((pure)) ushort8 __cvt_8f64_to_8f16_rtz(double8);
__attribute__((overloadable, always_inline, weak)) void
vstorea_half8_rtz(double8 v, size_t i, __global half *p)
{
    __global ushort8 *dst = (__global ushort8 *)(p + i * 8);
    const ushort8 bits = __cvt_8f64_to_8f16_rtz(v);

    *dst = bits;
}
#endif
#if __OPENCL_C_VERSION__ < 200
/*
 * vstorea_half8_rtz, __local overload (built only when
 * __OPENCL_C_VERSION__ < 200). Converts v with __cvt_8f64_to_8f16_rtz and
 * writes the ushort8 result at p + i * 8 (counted in half elements).
 */
extern __attribute__((pure)) ushort8 __cvt_8f64_to_8f16_rtz(double8);
__attribute__((overloadable, always_inline, weak)) void
vstorea_half8_rtz(double8 v, size_t i, __local half *p)
{
    __local ushort8 *dst = (__local ushort8 *)(p + i * 8);
    const ushort8 bits = __cvt_8f64_to_8f16_rtz(v);

    *dst = bits;
}
#endif
/*
 * vstorea_half16, overload for an unqualified half pointer.
 * Converts v with __cvt_16f64_to_16f16_cur (declared here, defined elsewhere)
 * and writes the ushort16 result at p + i * 16 (counted in half elements).
 */
extern __attribute__((pure)) ushort16 __cvt_16f64_to_16f16_cur(double16);
__attribute__((overloadable, always_inline, weak)) void
vstorea_half16(double16 v, size_t i, half *p)
{
    ushort16 *dst = (ushort16 *)(p + i * 16);
    const ushort16 bits = __cvt_16f64_to_16f16_cur(v);

    *dst = bits;
}
#if __OPENCL_C_VERSION__ < 200
/*
 * vstorea_half16, __global overload (built only when
 * __OPENCL_C_VERSION__ < 200). Converts v with __cvt_16f64_to_16f16_cur and
 * writes the ushort16 result at p + i * 16 (counted in half elements).
 */
extern __attribute__((pure)) ushort16 __cvt_16f64_to_16f16_cur(double16);
__attribute__((overloadable, always_inline, weak)) void
vstorea_half16(double16 v, size_t i, __global half *p)
{
    __global ushort16 *dst = (__global ushort16 *)(p + i * 16);
    const ushort16 bits = __cvt_16f64_to_16f16_cur(v);

    *dst = bits;
}
#endif
#if __OPENCL_C_VERSION__ < 200
/*
 * vstorea_half16, __local overload (built only when
 * __OPENCL_C_VERSION__ < 200). Converts v with __cvt_16f64_to_16f16_cur and
 * writes the ushort16 result at p + i * 16 (counted in half elements).
 */
extern __attribute__((pure)) ushort16 __cvt_16f64_to_16f16_cur(double16);
__attribute__((overloadable, always_inline, weak)) void
vstorea_half16(double16 v, size_t i, __local half *p)
{
    __local ushort16 *dst = (__local ushort16 *)(p + i * 16);
    const ushort16 bits = __cvt_16f64_to_16f16_cur(v);

    *dst = bits;
}
#endif
/*
 * vstorea_half16_rte, overload for an unqualified half pointer.
 * Converts v with __cvt_16f64_to_16f16_rte (declared here, defined elsewhere)
 * and writes the ushort16 result at p + i * 16 (counted in half elements).
 */
extern __attribute__((pure)) ushort16 __cvt_16f64_to_16f16_rte(double16);
__attribute__((overloadable, always_inline, weak)) void
vstorea_half16_rte(double16 v, size_t i, half *p)
{
    ushort16 *dst = (ushort16 *)(p + i * 16);
    const ushort16 bits = __cvt_16f64_to_16f16_rte(v);

    *dst = bits;
}
#if __OPENCL_C_VERSION__ < 200
/*
 * vstorea_half16_rte, __global overload (built only when
 * __OPENCL_C_VERSION__ < 200). Converts v with __cvt_16f64_to_16f16_rte and
 * writes the ushort16 result at p + i * 16 (counted in half elements).
 */
extern __attribute__((pure)) ushort16 __cvt_16f64_to_16f16_rte(double16);
__attribute__((overloadable, always_inline, weak)) void
vstorea_half16_rte(double16 v, size_t i, __global half *p)
{
    __global ushort16 *dst = (__global ushort16 *)(p + i * 16);
    const ushort16 bits = __cvt_16f64_to_16f16_rte(v);

    *dst = bits;
}
#endif
#if __OPENCL_C_VERSION__ < 200
/*
 * vstorea_half16_rte, __local overload (built only when
 * __OPENCL_C_VERSION__ < 200). Converts v with __cvt_16f64_to_16f16_rte and
 * writes the ushort16 result at p + i * 16 (counted in half elements).
 */
extern __attribute__((pure)) ushort16 __cvt_16f64_to_16f16_rte(double16);
__attribute__((overloadable, always_inline, weak)) void
vstorea_half16_rte(double16 v, size_t i, __local half *p)
{
    __local ushort16 *dst = (__local ushort16 *)(p + i * 16);
    const ushort16 bits = __cvt_16f64_to_16f16_rte(v);

    *dst = bits;
}
#endif
/*
 * vstorea_half16_rtp, overload for an unqualified half pointer.
 * Converts v with __cvt_16f64_to_16f16_rtp (declared here, defined elsewhere)
 * and writes the ushort16 result at p + i * 16 (counted in half elements).
 */
extern __attribute__((pure)) ushort16 __cvt_16f64_to_16f16_rtp(double16);
__attribute__((overloadable, always_inline, weak)) void
vstorea_half16_rtp(double16 v, size_t i, half *p)
{
    ushort16 *dst = (ushort16 *)(p + i * 16);
    const ushort16 bits = __cvt_16f64_to_16f16_rtp(v);

    *dst = bits;
}
#if __OPENCL_C_VERSION__ < 200
/*
 * vstorea_half16_rtp, __global overload (built only when
 * __OPENCL_C_VERSION__ < 200). Converts v with __cvt_16f64_to_16f16_rtp and
 * writes the ushort16 result at p + i * 16 (counted in half elements).
 */
extern __attribute__((pure)) ushort16 __cvt_16f64_to_16f16_rtp(double16);
__attribute__((overloadable, always_inline, weak)) void
vstorea_half16_rtp(double16 v, size_t i, __global half *p)
{
    __global ushort16 *dst = (__global ushort16 *)(p + i * 16);
    const ushort16 bits = __cvt_16f64_to_16f16_rtp(v);

    *dst = bits;
}
#endif
#if __OPENCL_C_VERSION__ < 200
/*
 * vstorea_half16_rtp, __local overload (built only when
 * __OPENCL_C_VERSION__ < 200). Converts v with __cvt_16f64_to_16f16_rtp and
 * writes the ushort16 result at p + i * 16 (counted in half elements).
 */
extern __attribute__((pure)) ushort16 __cvt_16f64_to_16f16_rtp(double16);
__attribute__((overloadable, always_inline, weak)) void
vstorea_half16_rtp(double16 v, size_t i, __local half *p)
{
    __local ushort16 *dst = (__local ushort16 *)(p + i * 16);
    const ushort16 bits = __cvt_16f64_to_16f16_rtp(v);

    *dst = bits;
}
#endif
/*
 * vstorea_half16_rtn, overload for an unqualified half pointer.
 * Converts v with __cvt_16f64_to_16f16_rtn (declared here, defined elsewhere)
 * and writes the ushort16 result at p + i * 16 (counted in half elements).
 */
extern __attribute__((pure)) ushort16 __cvt_16f64_to_16f16_rtn(double16);
__attribute__((overloadable, always_inline, weak)) void
vstorea_half16_rtn(double16 v, size_t i, half *p)
{
    ushort16 *dst = (ushort16 *)(p + i * 16);
    const ushort16 bits = __cvt_16f64_to_16f16_rtn(v);

    *dst = bits;
}
#if __OPENCL_C_VERSION__ < 200
/*
 * vstorea_half16_rtn, __global overload (built only when
 * __OPENCL_C_VERSION__ < 200). Converts v with __cvt_16f64_to_16f16_rtn and
 * writes the ushort16 result at p + i * 16 (counted in half elements).
 */
extern __attribute__((pure)) ushort16 __cvt_16f64_to_16f16_rtn(double16);
__attribute__((overloadable, always_inline, weak)) void
vstorea_half16_rtn(double16 v, size_t i, __global half *p)
{
    __global ushort16 *dst = (__global ushort16 *)(p + i * 16);
    const ushort16 bits = __cvt_16f64_to_16f16_rtn(v);

    *dst = bits;
}
#endif
#if __OPENCL_C_VERSION__ < 200
/*
 * vstorea_half16_rtn, __local overload (built only when
 * __OPENCL_C_VERSION__ < 200). Converts v with __cvt_16f64_to_16f16_rtn and
 * writes the ushort16 result at p + i * 16 (counted in half elements).
 */
extern __attribute__((pure)) ushort16 __cvt_16f64_to_16f16_rtn(double16);
__attribute__((overloadable, always_inline, weak)) void
vstorea_half16_rtn(double16 v, size_t i, __local half *p)
{
    __local ushort16 *dst = (__local ushort16 *)(p + i * 16);
    const ushort16 bits = __cvt_16f64_to_16f16_rtn(v);

    *dst = bits;
}
#endif
/*
 * vstorea_half16_rtz, overload for an unqualified half pointer.
 * Converts v with __cvt_16f64_to_16f16_rtz (declared here, defined elsewhere)
 * and writes the ushort16 result at p + i * 16 (counted in half elements).
 */
extern __attribute__((pure)) ushort16 __cvt_16f64_to_16f16_rtz(double16);
__attribute__((overloadable, always_inline, weak)) void
vstorea_half16_rtz(double16 v, size_t i, half *p)
{
    ushort16 *dst = (ushort16 *)(p + i * 16);
    const ushort16 bits = __cvt_16f64_to_16f16_rtz(v);

    *dst = bits;
}
#if __OPENCL_C_VERSION__ < 200
/*
 * vstorea_half16_rtz, __global overload (built only when
 * __OPENCL_C_VERSION__ < 200). Converts v with __cvt_16f64_to_16f16_rtz and
 * writes the ushort16 result at p + i * 16 (counted in half elements).
 */
extern __attribute__((pure)) ushort16 __cvt_16f64_to_16f16_rtz(double16);
__attribute__((overloadable, always_inline, weak)) void
vstorea_half16_rtz(double16 v, size_t i, __global half *p)
{
    __global ushort16 *dst = (__global ushort16 *)(p + i * 16);
    const ushort16 bits = __cvt_16f64_to_16f16_rtz(v);

    *dst = bits;
}
#endif
#if __OPENCL_C_VERSION__ < 200
/*
 * vstorea_half16_rtz, __local overload (built only when
 * __OPENCL_C_VERSION__ < 200). Converts v with __cvt_16f64_to_16f16_rtz and
 * writes the ushort16 result at p + i * 16 (counted in half elements).
 */
extern __attribute__((pure)) ushort16 __cvt_16f64_to_16f16_rtz(double16);
__attribute__((overloadable, always_inline, weak)) void
vstorea_half16_rtz(double16 v, size_t i, __local half *p)
{
    __local ushort16 *dst = (__local ushort16 *)(p + i * 16);
    const ushort16 bits = __cvt_16f64_to_16f16_rtz(v);

    *dst = bits;
}
#endif