14#if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0)
15#ifndef cl_khr_depth_images
16#define cl_khr_depth_images
20#if __OPENCL_C_VERSION__ < CL_VERSION_2_0
21#ifdef cl_khr_3d_image_writes
22#pragma OPENCL EXTENSION cl_khr_3d_image_writes : enable
26#if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_1_2)
27#pragma OPENCL EXTENSION cl_intel_planar_yuv : begin
28#pragma OPENCL EXTENSION cl_intel_planar_yuv : end
31#define __ovld __attribute__((overloadable))
32#define __conv __attribute__((convergent))
35#define __purefn __attribute__((pure))
36#define __cnfn __attribute__((const))
6344#define as_char(x) __builtin_astype((x), char)
6345#define as_char2(x) __builtin_astype((x), char2)
6346#define as_char3(x) __builtin_astype((x), char3)
6347#define as_char4(x) __builtin_astype((x), char4)
6348#define as_char8(x) __builtin_astype((x), char8)
6349#define as_char16(x) __builtin_astype((x), char16)
6351#define as_uchar(x) __builtin_astype((x), uchar)
6352#define as_uchar2(x) __builtin_astype((x), uchar2)
6353#define as_uchar3(x) __builtin_astype((x), uchar3)
6354#define as_uchar4(x) __builtin_astype((x), uchar4)
6355#define as_uchar8(x) __builtin_astype((x), uchar8)
6356#define as_uchar16(x) __builtin_astype((x), uchar16)
6358#define as_short(x) __builtin_astype((x), short)
6359#define as_short2(x) __builtin_astype((x), short2)
6360#define as_short3(x) __builtin_astype((x), short3)
6361#define as_short4(x) __builtin_astype((x), short4)
6362#define as_short8(x) __builtin_astype((x), short8)
6363#define as_short16(x) __builtin_astype((x), short16)
6365#define as_ushort(x) __builtin_astype((x), ushort)
6366#define as_ushort2(x) __builtin_astype((x), ushort2)
6367#define as_ushort3(x) __builtin_astype((x), ushort3)
6368#define as_ushort4(x) __builtin_astype((x), ushort4)
6369#define as_ushort8(x) __builtin_astype((x), ushort8)
6370#define as_ushort16(x) __builtin_astype((x), ushort16)
6372#define as_int(x) __builtin_astype((x), int)
6373#define as_int2(x) __builtin_astype((x), int2)
6374#define as_int3(x) __builtin_astype((x), int3)
6375#define as_int4(x) __builtin_astype((x), int4)
6376#define as_int8(x) __builtin_astype((x), int8)
6377#define as_int16(x) __builtin_astype((x), int16)
6379#define as_uint(x) __builtin_astype((x), uint)
6380#define as_uint2(x) __builtin_astype((x), uint2)
6381#define as_uint3(x) __builtin_astype((x), uint3)
6382#define as_uint4(x) __builtin_astype((x), uint4)
6383#define as_uint8(x) __builtin_astype((x), uint8)
6384#define as_uint16(x) __builtin_astype((x), uint16)
6386#define as_long(x) __builtin_astype((x), long)
6387#define as_long2(x) __builtin_astype((x), long2)
6388#define as_long3(x) __builtin_astype((x), long3)
6389#define as_long4(x) __builtin_astype((x), long4)
6390#define as_long8(x) __builtin_astype((x), long8)
6391#define as_long16(x) __builtin_astype((x), long16)
6393#define as_ulong(x) __builtin_astype((x), ulong)
6394#define as_ulong2(x) __builtin_astype((x), ulong2)
6395#define as_ulong3(x) __builtin_astype((x), ulong3)
6396#define as_ulong4(x) __builtin_astype((x), ulong4)
6397#define as_ulong8(x) __builtin_astype((x), ulong8)
6398#define as_ulong16(x) __builtin_astype((x), ulong16)
6400#define as_float(x) __builtin_astype((x), float)
6401#define as_float2(x) __builtin_astype((x), float2)
6402#define as_float3(x) __builtin_astype((x), float3)
6403#define as_float4(x) __builtin_astype((x), float4)
6404#define as_float8(x) __builtin_astype((x), float8)
6405#define as_float16(x) __builtin_astype((x), float16)
6408#define as_double(x) __builtin_astype((x), double)
6409#define as_double2(x) __builtin_astype((x), double2)
6410#define as_double3(x) __builtin_astype((x), double3)
6411#define as_double4(x) __builtin_astype((x), double4)
6412#define as_double8(x) __builtin_astype((x), double8)
6413#define as_double16(x) __builtin_astype((x), double16)
6417#define as_half(x) __builtin_astype((x), half)
6418#define as_half2(x) __builtin_astype((x), half2)
6419#define as_half3(x) __builtin_astype((x), half3)
6420#define as_half4(x) __builtin_astype((x), half4)
6421#define as_half8(x) __builtin_astype((x), half8)
6422#define as_half16(x) __builtin_astype((x), half16)
6427#define __kernel_exec(X, typen) __kernel \
6428 __attribute__((work_group_size_hint(X, 1, 1))) \
6429 __attribute__((vec_type_hint(typen)))
6427#define __kernel_exec(X, typen) __kernel \ …
6431#define kernel_exec(X, typen) __kernel \
6432 __attribute__((work_group_size_hint(X, 1, 1))) \
6433 __attribute__((vec_type_hint(typen)))
6431#define kernel_exec(X, typen) __kernel \ …
6520#if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0)
7355#if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0)
7380float2
__ovld fract(float2 x, __global float2 *iptr);
7381float3
__ovld fract(float3 x, __global float3 *iptr);
7382float4
__ovld fract(float4 x, __global float4 *iptr);
7383float8
__ovld fract(float8 x, __global float8 *iptr);
7384float16
__ovld fract(float16 x, __global float16 *iptr);
7386float2
__ovld fract(float2 x, __local float2 *iptr);
7387float3
__ovld fract(float3 x, __local float3 *iptr);
7388float4
__ovld fract(float4 x, __local float4 *iptr);
7389float8
__ovld fract(float8 x, __local float8 *iptr);
7390float16
__ovld fract(float16 x, __local float16 *iptr);
7391float __ovld fract(
float x, __private
float *iptr);
7392float2
__ovld fract(float2 x, __private float2 *iptr);
7393float3
__ovld fract(float3 x, __private float3 *iptr);
7394float4
__ovld fract(float4 x, __private float4 *iptr);
7395float8
__ovld fract(float8 x, __private float8 *iptr);
7396float16
__ovld fract(float16 x, __private float16 *iptr);
7398double __ovld fract(
double x, __global
double *iptr);
7399double2
__ovld fract(double2 x, __global double2 *iptr);
7400double3
__ovld fract(double3 x, __global double3 *iptr);
7401double4
__ovld fract(double4 x, __global double4 *iptr);
7402double8
__ovld fract(double8 x, __global double8 *iptr);
7403double16
__ovld fract(double16 x, __global double16 *iptr);
7404double __ovld fract(
double x, __local
double *iptr);
7405double2
__ovld fract(double2 x, __local double2 *iptr);
7406double3
__ovld fract(double3 x, __local double3 *iptr);
7407double4
__ovld fract(double4 x, __local double4 *iptr);
7408double8
__ovld fract(double8 x, __local double8 *iptr);
7409double16
__ovld fract(double16 x, __local double16 *iptr);
7410double __ovld fract(
double x, __private
double *iptr);
7411double2
__ovld fract(double2 x, __private double2 *iptr);
7412double3
__ovld fract(double3 x, __private double3 *iptr);
7413double4
__ovld fract(double4 x, __private double4 *iptr);
7414double8
__ovld fract(double8 x, __private double8 *iptr);
7415double16
__ovld fract(double16 x, __private double16 *iptr);
7423half16
__ovld fract(half16 x, __global half16 *iptr);
7429half16
__ovld fract(half16 x, __local half16 *iptr);
7431half2
__ovld fract(half2 x, __private half2 *iptr);
7432half3
__ovld fract(half3 x, __private half3 *iptr);
7433half4
__ovld fract(half4 x, __private half4 *iptr);
7434half8
__ovld fract(half8 x, __private half8 *iptr);
7435half16
__ovld fract(half16 x, __private half16 *iptr);
7445#if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0)
7652#if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0)
7958#if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0)
7967double2
__ovld modf(double2 x, double2 *iptr);
7968double3
__ovld modf(double3 x, double3 *iptr);
7969double4
__ovld modf(double4 x, double4 *iptr);
7970double8
__ovld modf(double8 x, double8 *iptr);
7971double16
__ovld modf(double16 x, double16 *iptr);
7982float __ovld modf(
float x, __global
float *iptr);
7983float2
__ovld modf(float2 x, __global float2 *iptr);
7984float3
__ovld modf(float3 x, __global float3 *iptr);
7985float4
__ovld modf(float4 x, __global float4 *iptr);
7986float8
__ovld modf(float8 x, __global float8 *iptr);
7987float16
__ovld modf(float16 x, __global float16 *iptr);
7988float __ovld modf(
float x, __local
float *iptr);
7989float2
__ovld modf(float2 x, __local float2 *iptr);
7990float3
__ovld modf(float3 x, __local float3 *iptr);
7991float4
__ovld modf(float4 x, __local float4 *iptr);
7992float8
__ovld modf(float8 x, __local float8 *iptr);
7993float16
__ovld modf(float16 x, __local float16 *iptr);
7994float __ovld modf(
float x, __private
float *iptr);
7995float2
__ovld modf(float2 x, __private float2 *iptr);
7996float3
__ovld modf(float3 x, __private float3 *iptr);
7997float4
__ovld modf(float4 x, __private float4 *iptr);
7998float8
__ovld modf(float8 x, __private float8 *iptr);
7999float16
__ovld modf(float16 x, __private float16 *iptr);
8001double __ovld modf(
double x, __global
double *iptr);
8002double2
__ovld modf(double2 x, __global double2 *iptr);
8003double3
__ovld modf(double3 x, __global double3 *iptr);
8004double4
__ovld modf(double4 x, __global double4 *iptr);
8005double8
__ovld modf(double8 x, __global double8 *iptr);
8006double16
__ovld modf(double16 x, __global double16 *iptr);
8007double __ovld modf(
double x, __local
double *iptr);
8008double2
__ovld modf(double2 x, __local double2 *iptr);
8009double3
__ovld modf(double3 x, __local double3 *iptr);
8010double4
__ovld modf(double4 x, __local double4 *iptr);
8011double8
__ovld modf(double8 x, __local double8 *iptr);
8012double16
__ovld modf(double16 x, __local double16 *iptr);
8013double __ovld modf(
double x, __private
double *iptr);
8014double2
__ovld modf(double2 x, __private double2 *iptr);
8015double3
__ovld modf(double3 x, __private double3 *iptr);
8016double4
__ovld modf(double4 x, __private double4 *iptr);
8017double8
__ovld modf(double8 x, __private double8 *iptr);
8018double16
__ovld modf(double16 x, __private double16 *iptr);
8021half
__ovld modf(half x, __global half *iptr);
8022half2
__ovld modf(half2 x, __global half2 *iptr);
8023half3
__ovld modf(half3 x, __global half3 *iptr);
8024half4
__ovld modf(half4 x, __global half4 *iptr);
8025half8
__ovld modf(half8 x, __global half8 *iptr);
8026half16
__ovld modf(half16 x, __global half16 *iptr);
8028half2
__ovld modf(half2 x, __local half2 *iptr);
8029half3
__ovld modf(half3 x, __local half3 *iptr);
8030half4
__ovld modf(half4 x, __local half4 *iptr);
8031half8
__ovld modf(half8 x, __local half8 *iptr);
8032half16
__ovld modf(half16 x, __local half16 *iptr);
8033half
__ovld modf(half x, __private half *iptr);
8034half2
__ovld modf(half2 x, __private half2 *iptr);
8035half3
__ovld modf(half3 x, __private half3 *iptr);
8036half4
__ovld modf(half4 x, __private half4 *iptr);
8037half8
__ovld modf(half8 x, __private half8 *iptr);
8038half16
__ovld modf(half16 x, __private half16 *iptr);
8218#if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0)
8243float __ovld remquo(
float x,
float y, __global
int *quo);
8244float2
__ovld remquo(float2 x, float2 y, __global int2 *quo);
8245float3
__ovld remquo(float3 x, float3 y, __global int3 *quo);
8246float4
__ovld remquo(float4 x, float4 y, __global int4 *quo);
8249float __ovld remquo(
float x,
float y, __local
int *quo);
8250float2
__ovld remquo(float2 x, float2 y, __local int2 *quo);
8251float3
__ovld remquo(float3 x, float3 y, __local int3 *quo);
8252float4
__ovld remquo(float4 x, float4 y, __local int4 *quo);
8255float __ovld remquo(
float x,
float y, __private
int *quo);
8256float2
__ovld remquo(float2 x, float2 y, __private int2 *quo);
8257float3
__ovld remquo(float3 x, float3 y, __private int3 *quo);
8258float4
__ovld remquo(float4 x, float4 y, __private int4 *quo);
8262double __ovld remquo(
double x,
double y, __global
int *quo);
8263double2
__ovld remquo(double2 x, double2 y, __global int2 *quo);
8264double3
__ovld remquo(double3 x, double3 y, __global int3 *quo);
8265double4
__ovld remquo(double4 x, double4 y, __global int4 *quo);
8268double __ovld remquo(
double x,
double y, __local
int *quo);
8269double2
__ovld remquo(double2 x, double2 y, __local int2 *quo);
8270double3
__ovld remquo(double3 x, double3 y, __local int3 *quo);
8271double4
__ovld remquo(double4 x, double4 y, __local int4 *quo);
8274double __ovld remquo(
double x,
double y, __private
int *quo);
8275double2
__ovld remquo(double2 x, double2 y, __private int2 *quo);
8276double3
__ovld remquo(double3 x, double3 y, __private int3 *quo);
8277double4
__ovld remquo(double4 x, double4 y, __private int4 *quo);
8283half2
__ovld remquo(half2 x, half2 y, __global int2 *quo);
8284half3
__ovld remquo(half3 x, half3 y, __global int3 *quo);
8285half4
__ovld remquo(half4 x, half4 y, __global int4 *quo);
8289half2
__ovld remquo(half2 x, half2 y, __local int2 *quo);
8290half3
__ovld remquo(half3 x, half3 y, __local int3 *quo);
8291half4
__ovld remquo(half4 x, half4 y, __local int4 *quo);
8295half2
__ovld remquo(half2 x, half2 y, __private int2 *quo);
8296half3
__ovld remquo(half3 x, half3 y, __private int3 *quo);
8297half4
__ovld remquo(half4 x, half4 y, __private int4 *quo);
8308float __ovld __cnfn rint(float);
8442#if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0)
8467float2
__ovld sincos(float2 x, __global float2 *cosval);
8468float3
__ovld sincos(float3 x, __global float3 *cosval);
8469float4
__ovld sincos(float4 x, __global float4 *cosval);
8470float8
__ovld sincos(float8 x, __global float8 *cosval);
8471float16
__ovld sincos(float16 x, __global float16 *cosval);
8477float16
__ovld sincos(float16 x, __local float16 *cosval);
8479float2
__ovld sincos(float2 x, __private float2 *cosval);
8480float3
__ovld sincos(float3 x, __private float3 *cosval);
8481float4
__ovld sincos(float4 x, __private float4 *cosval);
8482float8
__ovld sincos(float8 x, __private float8 *cosval);
8483float16
__ovld sincos(float16 x, __private float16 *cosval);
8485double __ovld sincos(
double x, __global
double *cosval);
8486double2
__ovld sincos(double2 x, __global double2 *cosval);
8487double3
__ovld sincos(double3 x, __global double3 *cosval);
8488double4
__ovld sincos(double4 x, __global double4 *cosval);
8489double8
__ovld sincos(double8 x, __global double8 *cosval);
8490double16
__ovld sincos(double16 x, __global double16 *cosval);
8492double2
__ovld sincos(double2 x, __local double2 *cosval);
8493double3
__ovld sincos(double3 x, __local double3 *cosval);
8494double4
__ovld sincos(double4 x, __local double4 *cosval);
8495double8
__ovld sincos(double8 x, __local double8 *cosval);
8496double16
__ovld sincos(double16 x, __local double16 *cosval);
8497double __ovld sincos(
double x, __private
double *cosval);
8498double2
__ovld sincos(double2 x, __private double2 *cosval);
8499double3
__ovld sincos(double3 x, __private double3 *cosval);
8500double4
__ovld sincos(double4 x, __private double4 *cosval);
8501double8
__ovld sincos(double8 x, __private double8 *cosval);
8502double16
__ovld sincos(double16 x, __private double16 *cosval);
8510half16
__ovld sincos(half16 x, __global half16 *cosval);
8522half16
__ovld sincos(half16 x, __private half16 *cosval);
9449#if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0)
11327double2
__ovld vload2(
size_t offset,
const __constant
double *p);
11328double3
__ovld vload3(
size_t offset,
const __constant
double *p);
11329double4
__ovld vload4(
size_t offset,
const __constant
double *p);
11330double8
__ovld vload8(
size_t offset,
const __constant
double *p);
11331double16
__ovld vload16(
size_t offset,
const __constant
double *p);
11335half
__ovld vload(
size_t offset,
const __constant half *p);
11336half2
__ovld vload2(
size_t offset,
const __constant half *p);
11337half3
__ovld vload3(
size_t offset,
const __constant half *p);
11338half4
__ovld vload4(
size_t offset,
const __constant half *p);
11339half8
__ovld vload8(
size_t offset,
const __constant half *p);
11340half16
__ovld vload16(
size_t offset,
const __constant half *p);
11343#if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0)
11399half
__ovld vload(
size_t offset,
const half *p);
11407char2
__ovld vload2(
size_t offset,
const __global
char *p);
11409short2
__ovld vload2(
size_t offset,
const __global
short *p);
11411int2
__ovld vload2(
size_t offset,
const __global
int *p);
11413long2
__ovld vload2(
size_t offset,
const __global
long *p);
11415float2
__ovld vload2(
size_t offset,
const __global
float *p);
11416char3
__ovld vload3(
size_t offset,
const __global
char *p);
11418short3
__ovld vload3(
size_t offset,
const __global
short *p);
11420int3
__ovld vload3(
size_t offset,
const __global
int *p);
11422long3
__ovld vload3(
size_t offset,
const __global
long *p);
11424float3
__ovld vload3(
size_t offset,
const __global
float *p);
11425char4
__ovld vload4(
size_t offset,
const __global
char *p);
11427short4
__ovld vload4(
size_t offset,
const __global
short *p);
11429int4
__ovld vload4(
size_t offset,
const __global
int *p);
11431long4
__ovld vload4(
size_t offset,
const __global
long *p);
11433float4
__ovld vload4(
size_t offset,
const __global
float *p);
11434char8
__ovld vload8(
size_t offset,
const __global
char *p);
11436short8
__ovld vload8(
size_t offset,
const __global
short *p);
11440long8
__ovld vload8(
size_t offset,
const __global
long *p);
11442float8
__ovld vload8(
size_t offset,
const __global
float *p);
11443char16
__ovld vload16(
size_t offset,
const __global
char *p);
11445short16
__ovld vload16(
size_t offset,
const __global
short *p);
11449long16
__ovld vload16(
size_t offset,
const __global
long *p);
11451float16
__ovld vload16(
size_t offset,
const __global
float *p);
11452char2
__ovld vload2(
size_t offset,
const __local
char *p);
11454short2
__ovld vload2(
size_t offset,
const __local
short *p);
11456int2
__ovld vload2(
size_t offset,
const __local
int *p);
11458long2
__ovld vload2(
size_t offset,
const __local
long *p);
11460float2
__ovld vload2(
size_t offset,
const __local
float *p);
11461char3
__ovld vload3(
size_t offset,
const __local
char *p);
11463short3
__ovld vload3(
size_t offset,
const __local
short *p);
11465int3
__ovld vload3(
size_t offset,
const __local
int *p);
11467long3
__ovld vload3(
size_t offset,
const __local
long *p);
11469float3
__ovld vload3(
size_t offset,
const __local
float *p);
11470char4
__ovld vload4(
size_t offset,
const __local
char *p);
11472short4
__ovld vload4(
size_t offset,
const __local
short *p);
11474int4
__ovld vload4(
size_t offset,
const __local
int *p);
11476long4
__ovld vload4(
size_t offset,
const __local
long *p);
11478float4
__ovld vload4(
size_t offset,
const __local
float *p);
11479char8
__ovld vload8(
size_t offset,
const __local
char *p);
11481short8
__ovld vload8(
size_t offset,
const __local
short *p);
11485long8
__ovld vload8(
size_t offset,
const __local
long *p);
11487float8
__ovld vload8(
size_t offset,
const __local
float *p);
11488char16
__ovld vload16(
size_t offset,
const __local
char *p);
11490short16
__ovld vload16(
size_t offset,
const __local
short *p);
11494long16
__ovld vload16(
size_t offset,
const __local
long *p);
11496float16
__ovld vload16(
size_t offset,
const __local
float *p);
11497char2
__ovld vload2(
size_t offset,
const __private
char *p);
11499short2
__ovld vload2(
size_t offset,
const __private
short *p);
11501int2
__ovld vload2(
size_t offset,
const __private
int *p);
11503long2
__ovld vload2(
size_t offset,
const __private
long *p);
11505float2
__ovld vload2(
size_t offset,
const __private
float *p);
11506char3
__ovld vload3(
size_t offset,
const __private
char *p);
11508short3
__ovld vload3(
size_t offset,
const __private
short *p);
11510int3
__ovld vload3(
size_t offset,
const __private
int *p);
11512long3
__ovld vload3(
size_t offset,
const __private
long *p);
11514float3
__ovld vload3(
size_t offset,
const __private
float *p);
11515char4
__ovld vload4(
size_t offset,
const __private
char *p);
11517short4
__ovld vload4(
size_t offset,
const __private
short *p);
11519int4
__ovld vload4(
size_t offset,
const __private
int *p);
11521long4
__ovld vload4(
size_t offset,
const __private
long *p);
11523float4
__ovld vload4(
size_t offset,
const __private
float *p);
11524char8
__ovld vload8(
size_t offset,
const __private
char *p);
11526short8
__ovld vload8(
size_t offset,
const __private
short *p);
11530long8
__ovld vload8(
size_t offset,
const __private
long *p);
11532float8
__ovld vload8(
size_t offset,
const __private
float *p);
11533char16
__ovld vload16(
size_t offset,
const __private
char *p);
11535short16
__ovld vload16(
size_t offset,
const __private
short *p);
11539long16
__ovld vload16(
size_t offset,
const __private
long *p);
11541float16
__ovld vload16(
size_t offset,
const __private
float *p);
11544double2
__ovld vload2(
size_t offset,
const __global
double *p);
11545double3
__ovld vload3(
size_t offset,
const __global
double *p);
11546double4
__ovld vload4(
size_t offset,
const __global
double *p);
11547double8
__ovld vload8(
size_t offset,
const __global
double *p);
11548double16
__ovld vload16(
size_t offset,
const __global
double *p);
11549double2
__ovld vload2(
size_t offset,
const __local
double *p);
11550double3
__ovld vload3(
size_t offset,
const __local
double *p);
11551double4
__ovld vload4(
size_t offset,
const __local
double *p);
11552double8
__ovld vload8(
size_t offset,
const __local
double *p);
11553double16
__ovld vload16(
size_t offset,
const __local
double *p);
11554double2
__ovld vload2(
size_t offset,
const __private
double *p);
11555double3
__ovld vload3(
size_t offset,
const __private
double *p);
11556double4
__ovld vload4(
size_t offset,
const __private
double *p);
11557double8
__ovld vload8(
size_t offset,
const __private
double *p);
11558double16
__ovld vload16(
size_t offset,
const __private
double *p);
11562half
__ovld vload(
size_t offset,
const __global half *p);
11563half2
__ovld vload2(
size_t offset,
const __global half *p);
11564half3
__ovld vload3(
size_t offset,
const __global half *p);
11565half4
__ovld vload4(
size_t offset,
const __global half *p);
11566half8
__ovld vload8(
size_t offset,
const __global half *p);
11567half16
__ovld vload16(
size_t offset,
const __global half *p);
11568half
__ovld vload(
size_t offset,
const __local half *p);
11569half2
__ovld vload2(
size_t offset,
const __local half *p);
11570half3
__ovld vload3(
size_t offset,
const __local half *p);
11571half4
__ovld vload4(
size_t offset,
const __local half *p);
11572half8
__ovld vload8(
size_t offset,
const __local half *p);
11573half16
__ovld vload16(
size_t offset,
const __local half *p);
11574half
__ovld vload(
size_t offset,
const __private half *p);
11575half2
__ovld vload2(
size_t offset,
const __private half *p);
11576half3
__ovld vload3(
size_t offset,
const __private half *p);
11577half4
__ovld vload4(
size_t offset,
const __private half *p);
11578half8
__ovld vload8(
size_t offset,
const __private half *p);
11579half16
__ovld vload16(
size_t offset,
const __private half *p);
11583#if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0)
11630void __ovld vstore2(double2 data,
size_t offset,
double *p);
11631void __ovld vstore3(double3 data,
size_t offset,
double *p);
11632void __ovld vstore4(double4 data,
size_t offset,
double *p);
11633void __ovld vstore8(double8 data,
size_t offset,
double *p);
11637void __ovld vstore(half data,
size_t offset, half *p);
11645void __ovld vstore2(char2 data,
size_t offset, __global
char *p);
11647void __ovld vstore2(short2 data,
size_t offset, __global
short *p);
11649void __ovld vstore2(int2 data,
size_t offset, __global
int *p);
11651void __ovld vstore2(long2 data,
size_t offset, __global
long *p);
11653void __ovld vstore2(float2 data,
size_t offset, __global
float *p);
11654void __ovld vstore3(char3 data,
size_t offset, __global
char *p);
11656void __ovld vstore3(short3 data,
size_t offset, __global
short *p);
11658void __ovld vstore3(int3 data,
size_t offset, __global
int *p);
11660void __ovld vstore3(long3 data,
size_t offset, __global
long *p);
11662void __ovld vstore3(float3 data,
size_t offset, __global
float *p);
11663void __ovld vstore4(char4 data,
size_t offset, __global
char *p);
11665void __ovld vstore4(short4 data,
size_t offset, __global
short *p);
11667void __ovld vstore4(int4 data,
size_t offset, __global
int *p);
11669void __ovld vstore4(long4 data,
size_t offset, __global
long *p);
11671void __ovld vstore4(float4 data,
size_t offset, __global
float *p);
11672void __ovld vstore8(char8 data,
size_t offset, __global
char *p);
11674void __ovld vstore8(short8 data,
size_t offset, __global
short *p);
11678void __ovld vstore8(long8 data,
size_t offset, __global
long *p);
11680void __ovld vstore8(float8 data,
size_t offset, __global
float *p);
11681void __ovld vstore16(char16 data,
size_t offset, __global
char *p);
11683void __ovld vstore16(short16 data,
size_t offset, __global
short *p);
11687void __ovld vstore16(long16 data,
size_t offset, __global
long *p);
11689void __ovld vstore16(float16 data,
size_t offset, __global
float *p);
11690void __ovld vstore2(char2 data,
size_t offset, __local
char *p);
11692void __ovld vstore2(short2 data,
size_t offset, __local
short *p);
11694void __ovld vstore2(int2 data,
size_t offset, __local
int *p);
11696void __ovld vstore2(long2 data,
size_t offset, __local
long *p);
11698void __ovld vstore2(float2 data,
size_t offset, __local
float *p);
11699void __ovld vstore3(char3 data,
size_t offset, __local
char *p);
11701void __ovld vstore3(short3 data,
size_t offset, __local
short *p);
11703void __ovld vstore3(int3 data,
size_t offset, __local
int *p);
11705void __ovld vstore3(long3 data,
size_t offset, __local
long *p);
11707void __ovld vstore3(float3 data,
size_t offset, __local
float *p);
11708void __ovld vstore4(char4 data,
size_t offset, __local
char *p);
11710void __ovld vstore4(short4 data,
size_t offset, __local
short *p);
11712void __ovld vstore4(int4 data,
size_t offset, __local
int *p);
11714void __ovld vstore4(long4 data,
size_t offset, __local
long *p);
11716void __ovld vstore4(float4 data,
size_t offset, __local
float *p);
11717void __ovld vstore8(char8 data,
size_t offset, __local
char *p);
11719void __ovld vstore8(short8 data,
size_t offset, __local
short *p);
11723void __ovld vstore8(long8 data,
size_t offset, __local
long *p);
11725void __ovld vstore8(float8 data,
size_t offset, __local
float *p);
11726void __ovld vstore16(char16 data,
size_t offset, __local
char *p);
11728void __ovld vstore16(short16 data,
size_t offset, __local
short *p);
11732void __ovld vstore16(long16 data,
size_t offset, __local
long *p);
11734void __ovld vstore16(float16 data,
size_t offset, __local
float *p);
11735void __ovld vstore2(char2 data,
size_t offset, __private
char *p);
11737void __ovld vstore2(short2 data,
size_t offset, __private
short *p);
11739void __ovld vstore2(int2 data,
size_t offset, __private
int *p);
11741void __ovld vstore2(long2 data,
size_t offset, __private
long *p);
11743void __ovld vstore2(float2 data,
size_t offset, __private
float *p);
11744void __ovld vstore3(char3 data,
size_t offset, __private
char *p);
11746void __ovld vstore3(short3 data,
size_t offset, __private
short *p);
11748void __ovld vstore3(int3 data,
size_t offset, __private
int *p);
11750void __ovld vstore3(long3 data,
size_t offset, __private
long *p);
11752void __ovld vstore3(float3 data,
size_t offset, __private
float *p);
11753void __ovld vstore4(char4 data,
size_t offset, __private
char *p);
11755void __ovld vstore4(short4 data,
size_t offset, __private
short *p);
11757void __ovld vstore4(int4 data,
size_t offset, __private
int *p);
11759void __ovld vstore4(long4 data,
size_t offset, __private
long *p);
11761void __ovld vstore4(float4 data,
size_t offset, __private
float *p);
11762void __ovld vstore8(char8 data,
size_t offset, __private
char *p);
11764void __ovld vstore8(short8 data,
size_t offset, __private
short *p);
11768void __ovld vstore8(long8 data,
size_t offset, __private
long *p);
11770void __ovld vstore8(float8 data,
size_t offset, __private
float *p);
11771void __ovld vstore16(char16 data,
size_t offset, __private
char *p);
11773void __ovld vstore16(short16 data,
size_t offset, __private
short *p);
11777void __ovld vstore16(long16 data,
size_t offset, __private
long *p);
11779void __ovld vstore16(float16 data,
size_t offset, __private
float *p);
11781void __ovld vstore2(double2 data,
size_t offset, __global
double *p);
11782void __ovld vstore3(double3 data,
size_t offset, __global
double *p);
11783void __ovld vstore4(double4 data,
size_t offset, __global
double *p);
11784void __ovld vstore8(double8 data,
size_t offset, __global
double *p);
11785void __ovld vstore16(double16 data,
size_t offset, __global
double *p);
11786void __ovld vstore2(double2 data,
size_t offset, __local
double *p);
11787void __ovld vstore3(double3 data,
size_t offset, __local
double *p);
11788void __ovld vstore4(double4 data,
size_t offset, __local
double *p);
11789void __ovld vstore8(double8 data,
size_t offset, __local
double *p);
11790void __ovld vstore16(double16 data,
size_t offset, __local
double *p);
11791void __ovld vstore2(double2 data,
size_t offset, __private
double *p);
11792void __ovld vstore3(double3 data,
size_t offset, __private
double *p);
11793void __ovld vstore4(double4 data,
size_t offset, __private
double *p);
11794void __ovld vstore8(double8 data,
size_t offset, __private
double *p);
11795void __ovld vstore16(double16 data,
size_t offset, __private
double *p);
11798void __ovld vstore(half data,
size_t offset, __global half *p);
11799void __ovld vstore2(half2 data,
size_t offset, __global half *p);
11800void __ovld vstore3(half3 data,
size_t offset, __global half *p);
11801void __ovld vstore4(half4 data,
size_t offset, __global half *p);
11802void __ovld vstore8(half8 data,
size_t offset, __global half *p);
11803void __ovld vstore16(half16 data,
size_t offset, __global half *p);
11804void __ovld vstore(half data,
size_t offset, __local half *p);
11805void __ovld vstore2(half2 data,
size_t offset, __local half *p);
11806void __ovld vstore3(half3 data,
size_t offset, __local half *p);
11807void __ovld vstore4(half4 data,
size_t offset, __local half *p);
11808void __ovld vstore8(half8 data,
size_t offset, __local half *p);
11809void __ovld vstore16(half16 data,
size_t offset, __local half *p);
11810void __ovld vstore(half data,
size_t offset, __private half *p);
11811void __ovld vstore2(half2 data,
size_t offset, __private half *p);
11812void __ovld vstore3(half3 data,
size_t offset, __private half *p);
11813void __ovld vstore4(half4 data,
size_t offset, __private half *p);
11814void __ovld vstore8(half8 data,
size_t offset, __private half *p);
11815void __ovld vstore16(half16 data,
size_t offset, __private half *p);
11828#if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0)
11849#if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0)
11884#if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0)
11943#if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0)
12170#if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0)
12214#if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0)
12535#if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0)
12583#if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0)
13000void __ovld prefetch(
const __global
double *p,
size_t num_elements);
13001void __ovld prefetch(
const __global double2 *p,
size_t num_elements);
13002void __ovld prefetch(
const __global double3 *p,
size_t num_elements);
13003void __ovld prefetch(
const __global double4 *p,
size_t num_elements);
13004void __ovld prefetch(
const __global double8 *p,
size_t num_elements);
13005void __ovld prefetch(
const __global double16 *p,
size_t num_elements);
13008void __ovld prefetch(
const __global half *p,
size_t num_elements);
13009void __ovld prefetch(
const __global half2 *p,
size_t num_elements);
13010void __ovld prefetch(
const __global half3 *p,
size_t num_elements);
13011void __ovld prefetch(
const __global half4 *p,
size_t num_elements);
13012void __ovld prefetch(
const __global half8 *p,
size_t num_elements);
13013void __ovld prefetch(
const __global half16 *p,
size_t num_elements);
13018#if defined(cl_khr_int64_base_atomics) && defined(cl_khr_int64_extended_atomics)
13019#pragma OPENCL EXTENSION cl_khr_int64_base_atomics : enable
13020#pragma OPENCL EXTENSION cl_khr_int64_extended_atomics : enable
13032#ifdef __OPENCL_CPP_VERSION__
13034unsigned int __ovld atomic_add(
volatile unsigned int *p,
unsigned int val);
13037#if defined(cl_khr_global_int32_base_atomics)
13038int __ovld atom_add(
volatile __global
int *p,
int val);
13039unsigned int __ovld atom_add(
volatile __global
unsigned int *p,
unsigned int val);
13041#if defined(cl_khr_local_int32_base_atomics)
13042int __ovld atom_add(
volatile __local
int *p,
int val);
13043unsigned int __ovld atom_add(
volatile __local
unsigned int *p,
unsigned int val);
13046#if defined(cl_khr_int64_base_atomics)
13047long __ovld atom_add(
volatile __global
long *p,
long val);
13048unsigned long __ovld atom_add(
volatile __global
unsigned long *p,
unsigned long val);
13049long __ovld atom_add(
volatile __local
long *p,
long val);
13050unsigned long __ovld atom_add(
volatile __local
unsigned long *p,
unsigned long val);
13062#ifdef __OPENCL_CPP_VERSION__
13064unsigned int __ovld atomic_sub(
volatile unsigned int *p,
unsigned int val);
13067#if defined(cl_khr_global_int32_base_atomics)
13068int __ovld atom_sub(
volatile __global
int *p,
int val);
13069unsigned int __ovld atom_sub(
volatile __global
unsigned int *p,
unsigned int val);
13071#if defined(cl_khr_local_int32_base_atomics)
13072int __ovld atom_sub(
volatile __local
int *p,
int val);
13073unsigned int __ovld atom_sub(
volatile __local
unsigned int *p,
unsigned int val);
13076#if defined(cl_khr_int64_base_atomics)
13077long __ovld atom_sub(
volatile __global
long *p,
long val);
13078unsigned long __ovld atom_sub(
volatile __global
unsigned long *p,
unsigned long val);
13079long __ovld atom_sub(
volatile __local
long *p,
long val);
13080unsigned long __ovld atom_sub(
volatile __local
unsigned long *p,
unsigned long val);
13094#ifdef __OPENCL_CPP_VERSION__
13100#if defined(cl_khr_global_int32_base_atomics)
13101int __ovld atom_xchg(
volatile __global
int *p,
int val);
13102unsigned int __ovld atom_xchg(
volatile __global
unsigned int *p,
unsigned int val);
13104#if defined(cl_khr_local_int32_base_atomics)
13105int __ovld atom_xchg(
volatile __local
int *p,
int val);
13106unsigned int __ovld atom_xchg(
volatile __local
unsigned int *p,
unsigned int val);
13109#if defined(cl_khr_int64_base_atomics)
13110long __ovld atom_xchg(
volatile __global
long *p,
long val);
13111long __ovld atom_xchg(
volatile __local
long *p,
long val);
13112unsigned long __ovld atom_xchg(
volatile __global
unsigned long *p,
unsigned long val);
13113unsigned long __ovld atom_xchg(
volatile __local
unsigned long *p,
unsigned long val);
13126#ifdef __OPENCL_CPP_VERSION__
13131#if defined(cl_khr_global_int32_base_atomics)
13132int __ovld atom_inc(
volatile __global
int *p);
13133unsigned int __ovld atom_inc(
volatile __global
unsigned int *p);
13135#if defined(cl_khr_local_int32_base_atomics)
13136int __ovld atom_inc(
volatile __local
int *p);
13137unsigned int __ovld atom_inc(
volatile __local
unsigned int *p);
13140#if defined(cl_khr_int64_base_atomics)
13141long __ovld atom_inc(
volatile __global
long *p);
13142unsigned long __ovld atom_inc(
volatile __global
unsigned long *p);
13143long __ovld atom_inc(
volatile __local
long *p);
13144unsigned long __ovld atom_inc(
volatile __local
unsigned long *p);
13157#ifdef __OPENCL_CPP_VERSION__
13162#if defined(cl_khr_global_int32_base_atomics)
13163int __ovld atom_dec(
volatile __global
int *p);
13164unsigned int __ovld atom_dec(
volatile __global
unsigned int *p);
13166#if defined(cl_khr_local_int32_base_atomics)
13167int __ovld atom_dec(
volatile __local
int *p);
13168unsigned int __ovld atom_dec(
volatile __local
unsigned int *p);
13171#if defined(cl_khr_int64_base_atomics)
13172long __ovld atom_dec(
volatile __global
long *p);
13173unsigned long __ovld atom_dec(
volatile __global
unsigned long *p);
13174long __ovld atom_dec(
volatile __local
long *p);
13175unsigned long __ovld atom_dec(
volatile __local
unsigned long *p);
13189#ifdef __OPENCL_CPP_VERSION__
13191unsigned int __ovld atomic_cmpxchg(
volatile unsigned int *p,
unsigned int cmp,
unsigned int val);
13194#if defined(cl_khr_global_int32_base_atomics)
13195int __ovld atom_cmpxchg(
volatile __global
int *p,
int cmp,
int val);
13196unsigned int __ovld atom_cmpxchg(
volatile __global
unsigned int *p,
unsigned int cmp,
unsigned int val);
13198#if defined(cl_khr_local_int32_base_atomics)
13199int __ovld atom_cmpxchg(
volatile __local
int *p,
int cmp,
int val);
13200unsigned int __ovld atom_cmpxchg(
volatile __local
unsigned int *p,
unsigned int cmp,
unsigned int val);
13203#if defined(cl_khr_int64_base_atomics)
13204long __ovld atom_cmpxchg(
volatile __global
long *p,
long cmp,
long val);
13205unsigned long __ovld atom_cmpxchg(
volatile __global
unsigned long *p,
unsigned long cmp,
unsigned long val);
13206long __ovld atom_cmpxchg(
volatile __local
long *p,
long cmp,
long val);
13207unsigned long __ovld atom_cmpxchg(
volatile __local
unsigned long *p,
unsigned long cmp,
unsigned long val);
13221#ifdef __OPENCL_CPP_VERSION__
13223unsigned int __ovld atomic_min(
volatile unsigned int *p,
unsigned int val);
13226#if defined(cl_khr_global_int32_extended_atomics)
13227int __ovld atom_min(
volatile __global
int *p,
int val);
13228unsigned int __ovld atom_min(
volatile __global
unsigned int *p,
unsigned int val);
13230#if defined(cl_khr_local_int32_extended_atomics)
13231int __ovld atom_min(
volatile __local
int *p,
int val);
13232unsigned int __ovld atom_min(
volatile __local
unsigned int *p,
unsigned int val);
13235#if defined(cl_khr_int64_extended_atomics)
13236long __ovld atom_min(
volatile __global
long *p,
long val);
13237unsigned long __ovld atom_min(
volatile __global
unsigned long *p,
unsigned long val);
13238long __ovld atom_min(
volatile __local
long *p,
long val);
13239unsigned long __ovld atom_min(
volatile __local
unsigned long *p,
unsigned long val);
13253#ifdef __OPENCL_CPP_VERSION__
13255unsigned int __ovld atomic_max(
volatile unsigned int *p,
unsigned int val);
13258#if defined(cl_khr_global_int32_extended_atomics)
13259int __ovld atom_max(
volatile __global
int *p,
int val);
13260unsigned int __ovld atom_max(
volatile __global
unsigned int *p,
unsigned int val);
13262#if defined(cl_khr_local_int32_extended_atomics)
13263int __ovld atom_max(
volatile __local
int *p,
int val);
13264unsigned int __ovld atom_max(
volatile __local
unsigned int *p,
unsigned int val);
13267#if defined(cl_khr_int64_extended_atomics)
13268long __ovld atom_max(
volatile __global
long *p,
long val);
13269unsigned long __ovld atom_max(
volatile __global
unsigned long *p,
unsigned long val);
13270long __ovld atom_max(
volatile __local
long *p,
long val);
13271unsigned long __ovld atom_max(
volatile __local
unsigned long *p,
unsigned long val);
13284#ifdef __OPENCL_CPP_VERSION__
13286unsigned int __ovld atomic_and(
volatile unsigned int *p,
unsigned int val);
13289#if defined(cl_khr_global_int32_extended_atomics)
13290int __ovld atom_and(
volatile __global
int *p,
int val);
13291unsigned int __ovld atom_and(
volatile __global
unsigned int *p,
unsigned int val);
13293#if defined(cl_khr_local_int32_extended_atomics)
13294int __ovld atom_and(
volatile __local
int *p,
int val);
13295unsigned int __ovld atom_and(
volatile __local
unsigned int *p,
unsigned int val);
13298#if defined(cl_khr_int64_extended_atomics)
13299long __ovld atom_and(
volatile __global
long *p,
long val);
13300unsigned long __ovld atom_and(
volatile __global
unsigned long *p,
unsigned long val);
13301long __ovld atom_and(
volatile __local
long *p,
long val);
13302unsigned long __ovld atom_and(
volatile __local
unsigned long *p,
unsigned long val);
13315#ifdef __OPENCL_CPP_VERSION__
13317unsigned int __ovld atomic_or(
volatile unsigned int *p,
unsigned int val);
13320#if defined(cl_khr_global_int32_extended_atomics)
13321int __ovld atom_or(
volatile __global
int *p,
int val);
13322unsigned int __ovld atom_or(
volatile __global
unsigned int *p,
unsigned int val);
13324#if defined(cl_khr_local_int32_extended_atomics)
13325int __ovld atom_or(
volatile __local
int *p,
int val);
13326unsigned int __ovld atom_or(
volatile __local
unsigned int *p,
unsigned int val);
13329#if defined(cl_khr_int64_extended_atomics)
13330long __ovld atom_or(
volatile __global
long *p,
long val);
13331unsigned long __ovld atom_or(
volatile __global
unsigned long *p,
unsigned long val);
13332long __ovld atom_or(
volatile __local
long *p,
long val);
13333unsigned long __ovld atom_or(
volatile __local
unsigned long *p,
unsigned long val);
13346#ifdef __OPENCL_CPP_VERSION__
13348unsigned int __ovld atomic_xor(
volatile unsigned int *p,
unsigned int val);
13351#if defined(cl_khr_global_int32_extended_atomics)
13352int __ovld atom_xor(
volatile __global
int *p,
int val);
13353unsigned int __ovld atom_xor(
volatile __global
unsigned int *p,
unsigned int val);
13355#if defined(cl_khr_local_int32_extended_atomics)
13356int __ovld atom_xor(
volatile __local
int *p,
int val);
13357unsigned int __ovld atom_xor(
volatile __local
unsigned int *p,
unsigned int val);
13360#if defined(cl_khr_int64_extended_atomics)
13361long __ovld atom_xor(
volatile __global
long *p,
long val);
13362unsigned long __ovld atom_xor(
volatile __global
unsigned long *p,
unsigned long val);
13363long __ovld atom_xor(
volatile __local
long *p,
long val);
13364unsigned long __ovld atom_xor(
volatile __local
unsigned long *p,
unsigned long val);
13367#if defined(cl_khr_int64_base_atomics) && defined(cl_khr_int64_extended_atomics)
13368#pragma OPENCL EXTENSION cl_khr_int64_base_atomics : disable
13369#pragma OPENCL EXTENSION cl_khr_int64_extended_atomics : disable
13374#if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0)
13377#if defined(cl_khr_int64_base_atomics) && defined(cl_khr_int64_extended_atomics)
13378#pragma OPENCL EXTENSION cl_khr_int64_base_atomics : enable
13379#pragma OPENCL EXTENSION cl_khr_int64_extended_atomics : enable
13386#if defined(cl_khr_int64_base_atomics) && defined(cl_khr_int64_extended_atomics)
13442#if defined(cl_khr_int64_base_atomics) && defined(cl_khr_int64_extended_atomics)
13491#if defined(cl_khr_int64_base_atomics) && defined(cl_khr_int64_extended_atomics)
13543#if defined(cl_khr_int64_base_atomics) && defined(cl_khr_int64_extended_atomics)
13568#if defined(cl_khr_int64_base_atomics) && defined(cl_khr_int64_extended_atomics)
13593#if defined(cl_khr_int64_base_atomics) && defined(cl_khr_int64_extended_atomics)
13639#if defined(cl_khr_int64_base_atomics) && defined(cl_khr_int64_extended_atomics)
14177#if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_1_2)
14185#ifdef cl_khr_gl_msaa_sharing
14186#pragma OPENCL EXTENSION cl_khr_gl_msaa_sharing : enable
14298#if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_1_2)
14316#if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_1_2)
14326#ifdef cl_khr_depth_images
14334#if defined(cl_khr_gl_msaa_sharing)
14349#if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0)
14350#ifdef cl_khr_mipmap_image
14376float4
__purefn __ovld read_imagef(read_only image1d_t image, sampler_t sampler,
float coord,
float gradientX,
float gradientY);
14377int4
__purefn __ovld read_imagei(read_only image1d_t image, sampler_t sampler,
float coord,
float gradientX,
float gradientY);
14378uint4
__purefn __ovld read_imageui(read_only image1d_t image, sampler_t sampler,
float coord,
float gradientX,
float gradientY);
14380float4
__purefn __ovld read_imagef(read_only image1d_array_t image_array, sampler_t sampler, float2 coord,
float gradientX,
float gradientY);
14381int4
__purefn __ovld read_imagei(read_only image1d_array_t image_array, sampler_t sampler, float2 coord,
float gradientX,
float gradientY);
14382uint4
__purefn __ovld read_imageui(read_only image1d_array_t image_array, sampler_t sampler, float2 coord,
float gradientX,
float gradientY);
14384float4
__purefn __ovld read_imagef(read_only image2d_t image, sampler_t sampler, float2 coord, float2 gradientX, float2 gradientY);
14385int4
__purefn __ovld read_imagei(read_only image2d_t image, sampler_t sampler, float2 coord, float2 gradientX, float2 gradientY);
14386uint4
__purefn __ovld read_imageui(read_only image2d_t image, sampler_t sampler, float2 coord, float2 gradientX, float2 gradientY);
14388float __purefn __ovld read_imagef(read_only image2d_depth_t image, sampler_t sampler, float2 coord, float2 gradientX, float2 gradientY);
14390float4
__purefn __ovld read_imagef(read_only image2d_array_t image_array, sampler_t sampler, float4 coord, float2 gradientX, float2 gradientY);
14391int4
__purefn __ovld read_imagei(read_only image2d_array_t image_array, sampler_t sampler, float4 coord, float2 gradientX, float2 gradientY);
14392uint4
__purefn __ovld read_imageui(read_only image2d_array_t image_array, sampler_t sampler, float4 coord, float2 gradientX, float2 gradientY);
14394float __purefn __ovld read_imagef(read_only image2d_array_depth_t image, sampler_t sampler, float4 coord, float2 gradientX, float2 gradientY);
14396float4
__purefn __ovld read_imagef(read_only image3d_t image, sampler_t sampler, float4 coord, float4 gradientX, float4 gradientY);
14397int4
__purefn __ovld read_imagei(read_only image3d_t image, sampler_t sampler, float4 coord, float4 gradientX, float4 gradientY);
14398uint4
__purefn __ovld read_imageui(read_only image3d_t image, sampler_t sampler, float4 coord, float4 gradientX, float4 gradientY);
14403#if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_1_2)
14429#ifdef cl_khr_depth_images
14442half4
__purefn __ovld read_imageh(read_only image1d_t image, sampler_t sampler,
int coord);
14443half4
__purefn __ovld read_imageh(read_only image1d_t image, sampler_t sampler,
float coord);
14444half4
__purefn __ovld read_imageh(read_only image2d_t image, sampler_t sampler, int2 coord);
14445half4
__purefn __ovld read_imageh(read_only image2d_t image, sampler_t sampler, float2 coord);
14446half4
__purefn __ovld read_imageh(read_only image3d_t image, sampler_t sampler, int4 coord);
14447half4
__purefn __ovld read_imageh(read_only image3d_t image, sampler_t sampler, float4 coord);
14448#if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_1_2)
14449half4
__purefn __ovld read_imageh(read_only image1d_array_t image, sampler_t sampler, int2 coord);
14450half4
__purefn __ovld read_imageh(read_only image1d_array_t image, sampler_t sampler, float2 coord);
14451half4
__purefn __ovld read_imageh(read_only image2d_array_t image, sampler_t sampler, int4 coord);
14452half4
__purefn __ovld read_imageh(read_only image2d_array_t image, sampler_t sampler, float4 coord);
14456half4
__purefn __ovld read_imageh(read_only image1d_t image,
int coord);
14457half4
__purefn __ovld read_imageh(read_only image2d_t image, int2 coord);
14458half4
__purefn __ovld read_imageh(read_only image3d_t image, int4 coord);
14459half4
__purefn __ovld read_imageh(read_only image1d_array_t image, int2 coord);
14460half4
__purefn __ovld read_imageh(read_only image2d_array_t image, int4 coord);
14461half4
__purefn __ovld read_imageh(read_only image1d_buffer_t image,
int coord);
14466#if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0)
14491#ifdef cl_khr_depth_images
14496#if cl_khr_gl_msaa_sharing
14509#if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0)
14510#ifdef cl_khr_mipmap_image
14535float4
__purefn __ovld read_imagef(read_write image1d_t image, sampler_t sampler,
float coord,
float gradientX,
float gradientY);
14536int4
__purefn __ovld read_imagei(read_write image1d_t image, sampler_t sampler,
float coord,
float gradientX,
float gradientY);
14537uint4
__purefn __ovld read_imageui(read_write image1d_t image, sampler_t sampler,
float coord,
float gradientX,
float gradientY);
14539float4
__purefn __ovld read_imagef(read_write image1d_array_t image_array, sampler_t sampler, float2 coord,
float gradientX,
float gradientY);
14540int4
__purefn __ovld read_imagei(read_write image1d_array_t image_array, sampler_t sampler, float2 coord,
float gradientX,
float gradientY);
14541uint4
__purefn __ovld read_imageui(read_write image1d_array_t image_array, sampler_t sampler, float2 coord,
float gradientX,
float gradientY);
14543float4
__purefn __ovld read_imagef(read_write image2d_t image, sampler_t sampler, float2 coord, float2 gradientX, float2 gradientY);
14544int4
__purefn __ovld read_imagei(read_write image2d_t image, sampler_t sampler, float2 coord, float2 gradientX, float2 gradientY);
14545uint4
__purefn __ovld read_imageui(read_write image2d_t image, sampler_t sampler, float2 coord, float2 gradientX, float2 gradientY);
14547float __purefn __ovld read_imagef(read_write image2d_depth_t image, sampler_t sampler, float2 coord, float2 gradientX, float2 gradientY);
14549float4
__purefn __ovld read_imagef(read_write image2d_array_t image_array, sampler_t sampler, float4 coord, float2 gradientX, float2 gradientY);
14550int4
__purefn __ovld read_imagei(read_write image2d_array_t image_array, sampler_t sampler, float4 coord, float2 gradientX, float2 gradientY);
14551uint4
__purefn __ovld read_imageui(read_write image2d_array_t image_array, sampler_t sampler, float4 coord, float2 gradientX, float2 gradientY);
14553float __purefn __ovld read_imagef(read_write image2d_array_depth_t image, sampler_t sampler, float4 coord, float2 gradientX, float2 gradientY);
14555float4
__purefn __ovld read_imagef(read_write image3d_t image, sampler_t sampler, float4 coord, float4 gradientX, float4 gradientY);
14556int4
__purefn __ovld read_imagei(read_write image3d_t image, sampler_t sampler, float4 coord, float4 gradientX, float4 gradientY);
14557uint4
__purefn __ovld read_imageui(read_write image3d_t image, sampler_t sampler, float4 coord, float4 gradientX, float4 gradientY);
14564half4
__purefn __ovld read_imageh(read_write image1d_t image,
int coord);
14565half4
__purefn __ovld read_imageh(read_write image2d_t image, int2 coord);
14566half4
__purefn __ovld read_imageh(read_write image3d_t image, int4 coord);
14567half4
__purefn __ovld read_imageh(read_write image1d_array_t image, int2 coord);
14568half4
__purefn __ovld read_imageh(read_write image2d_array_t image, int4 coord);
14569half4
__purefn __ovld read_imageh(read_write image1d_buffer_t image,
int coord);
14660#ifdef cl_khr_3d_image_writes
14666#ifdef cl_khr_depth_images
14672#if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0)
14673#if defined(cl_khr_mipmap_image_writes)
14674void __ovld write_imagef(write_only image1d_t image,
int coord,
int lod, float4 color);
14675void __ovld write_imagei(write_only image1d_t image,
int coord,
int lod, int4 color);
14678void __ovld write_imagef(write_only image1d_array_t image_array, int2 coord,
int lod, float4 color);
14679void __ovld write_imagei(write_only image1d_array_t image_array, int2 coord,
int lod, int4 color);
14680void __ovld write_imageui(write_only image1d_array_t image_array, int2 coord,
int lod, uint4 color);
14682void __ovld write_imagef(write_only image2d_t image, int2 coord,
int lod, float4 color);
14683void __ovld write_imagei(write_only image2d_t image, int2 coord,
int lod, int4 color);
14686void __ovld write_imagef(write_only image2d_array_t image_array, int4 coord,
int lod, float4 color);
14687void __ovld write_imagei(write_only image2d_array_t image_array, int4 coord,
int lod, int4 color);
14688void __ovld write_imageui(write_only image2d_array_t image_array, int4 coord,
int lod, uint4 color);
14690void __ovld write_imagef(write_only image2d_depth_t image, int2 coord,
int lod,
float depth);
14691void __ovld write_imagef(write_only image2d_array_depth_t image, int4 coord,
int lod,
float depth);
14693#ifdef cl_khr_3d_image_writes
14694void __ovld write_imagef(write_only image3d_t image, int4 coord,
int lod, float4 color);
14695void __ovld write_imagei(write_only image3d_t image, int4 coord,
int lod, int4 color);
14704void __ovld write_imageh(write_only image1d_t image,
int coord, half4 color);
14705void __ovld write_imageh(write_only image2d_t image, int2 coord, half4 color);
14706#ifdef cl_khr_3d_image_writes
14707void __ovld write_imageh(write_only image3d_t image, int4 coord, half4 color);
14709void __ovld write_imageh(write_only image1d_array_t image, int2 coord, half4 color);
14710void __ovld write_imageh(write_only image2d_array_t image, int4 coord, half4 color);
14711void __ovld write_imageh(write_only image1d_buffer_t image,
int coord, half4 color);
14715#if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0)
14736#ifdef cl_khr_3d_image_writes
14742#ifdef cl_khr_depth_images
14747#if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0)
14748#if defined(cl_khr_mipmap_image_writes)
14749void __ovld write_imagef(read_write image1d_t image,
int coord,
int lod, float4 color);
14750void __ovld write_imagei(read_write image1d_t image,
int coord,
int lod, int4 color);
14753void __ovld write_imagef(read_write image1d_array_t image_array, int2 coord,
int lod, float4 color);
14754void __ovld write_imagei(read_write image1d_array_t image_array, int2 coord,
int lod, int4 color);
14755void __ovld write_imageui(read_write image1d_array_t image_array, int2 coord,
int lod, uint4 color);
14757void __ovld write_imagef(read_write image2d_t image, int2 coord,
int lod, float4 color);
14758void __ovld write_imagei(read_write image2d_t image, int2 coord,
int lod, int4 color);
14761void __ovld write_imagef(read_write image2d_array_t image_array, int4 coord,
int lod, float4 color);
14762void __ovld write_imagei(read_write image2d_array_t image_array, int4 coord,
int lod, int4 color);
14763void __ovld write_imageui(read_write image2d_array_t image_array, int4 coord,
int lod, uint4 color);
14765void __ovld write_imagef(read_write image2d_depth_t image, int2 coord,
int lod,
float color);
14766void __ovld write_imagef(read_write image2d_array_depth_t image, int4 coord,
int lod,
float color);
14768#ifdef cl_khr_3d_image_writes
14769void __ovld write_imagef(read_write image3d_t image, int4 coord,
int lod, float4 color);
14770void __ovld write_imagei(read_write image3d_t image, int4 coord,
int lod, int4 color);
14779void __ovld write_imageh(read_write image1d_t image,
int coord, half4 color);
14780void __ovld write_imageh(read_write image2d_t image, int2 coord, half4 color);
14781#ifdef cl_khr_3d_image_writes
14782void __ovld write_imageh(read_write image3d_t image, int4 coord, half4 color);
14784void __ovld write_imageh(read_write image1d_array_t image, int2 coord, half4 color);
14785void __ovld write_imageh(read_write image2d_array_t image, int4 coord, half4 color);
14786void __ovld write_imageh(read_write image1d_buffer_t image,
int coord, half4 color);
14801#ifdef cl_khr_3d_image_writes
14806#ifdef cl_khr_depth_images
14810#if defined(cl_khr_gl_msaa_sharing)
14820#ifdef cl_khr_3d_image_writes
14825#ifdef cl_khr_depth_images
14829#if defined(cl_khr_gl_msaa_sharing)
14836#if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0)
14843#ifdef cl_khr_depth_images
14847#if defined(cl_khr_gl_msaa_sharing)
14861#ifdef cl_khr_depth_images
14865#if defined(cl_khr_gl_msaa_sharing)
14873#ifdef cl_khr_3d_image_writes
14877#ifdef cl_khr_depth_images
14881#if defined(cl_khr_gl_msaa_sharing)
14888#if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0)
14892#ifdef cl_khr_depth_images
14896#if defined(cl_khr_gl_msaa_sharing)
14909#ifdef cl_khr_3d_image_writes
14913#if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0)
14918#if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0)
14919#ifdef cl_khr_mipmap_image
14924int __ovld get_image_num_mip_levels(read_only image1d_t image);
14925int __ovld get_image_num_mip_levels(read_only image2d_t image);
14926int __ovld get_image_num_mip_levels(read_only image3d_t image);
14928int __ovld get_image_num_mip_levels(write_only image1d_t image);
14929int __ovld get_image_num_mip_levels(write_only image2d_t image);
14930#ifdef cl_khr_3d_image_writes
14931int __ovld get_image_num_mip_levels(write_only image3d_t image);
14934int __ovld get_image_num_mip_levels(read_write image1d_t image);
14935int __ovld get_image_num_mip_levels(read_write image2d_t image);
14936int __ovld get_image_num_mip_levels(read_write image3d_t image);
14938int __ovld get_image_num_mip_levels(read_only image1d_array_t image);
14939int __ovld get_image_num_mip_levels(read_only image2d_array_t image);
14940int __ovld get_image_num_mip_levels(read_only image2d_array_depth_t image);
14941int __ovld get_image_num_mip_levels(read_only image2d_depth_t image);
14943int __ovld get_image_num_mip_levels(write_only image1d_array_t image);
14944int __ovld get_image_num_mip_levels(write_only image2d_array_t image);
14945int __ovld get_image_num_mip_levels(write_only image2d_array_depth_t image);
14946int __ovld get_image_num_mip_levels(write_only image2d_depth_t image);
14948int __ovld get_image_num_mip_levels(read_write image1d_array_t image);
14949int __ovld get_image_num_mip_levels(read_write image2d_array_t image);
14950int __ovld get_image_num_mip_levels(read_write image2d_array_depth_t image);
14951int __ovld get_image_num_mip_levels(read_write image2d_depth_t image);
14981#ifdef cl_khr_depth_images
14985#if defined(cl_khr_gl_msaa_sharing)
14995#ifdef cl_khr_3d_image_writes
15000#ifdef cl_khr_depth_images
15004#if defined(cl_khr_gl_msaa_sharing)
15011#if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0)
15018#ifdef cl_khr_depth_images
15022#if defined(cl_khr_gl_msaa_sharing)
15053#ifdef cl_khr_depth_images
15057#if defined(cl_khr_gl_msaa_sharing)
15067#ifdef cl_khr_3d_image_writes
15072#ifdef cl_khr_depth_images
15076#if defined(cl_khr_gl_msaa_sharing)
15083#if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0)
15090#ifdef cl_khr_depth_images
15094#if defined(cl_khr_gl_msaa_sharing)
15109#ifdef cl_khr_depth_images
15113#if defined(cl_khr_gl_msaa_sharing)
15122#ifdef cl_khr_depth_images
15126#if defined(cl_khr_gl_msaa_sharing)
15133#if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0)
15136#ifdef cl_khr_depth_images
15140#if defined(cl_khr_gl_msaa_sharing)
15155#ifdef cl_khr_3d_image_writes
15158#if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0)
15168#ifdef cl_khr_depth_images
15171#if defined(cl_khr_gl_msaa_sharing)
15178#ifdef cl_khr_depth_images
15181#if defined(cl_khr_gl_msaa_sharing)
15186#if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0)
15189#ifdef cl_khr_depth_images
15192#if defined(cl_khr_gl_msaa_sharing)
15201#if defined(cl_khr_gl_msaa_sharing)
15202int __ovld get_image_num_samples(read_only image2d_msaa_t image);
15203int __ovld get_image_num_samples(read_only image2d_msaa_depth_t image);
15204int __ovld get_image_num_samples(read_only image2d_array_msaa_t image);
15205int __ovld get_image_num_samples(read_only image2d_array_msaa_depth_t image);
15207int __ovld get_image_num_samples(write_only image2d_msaa_t image);
15208int __ovld get_image_num_samples(write_only image2d_msaa_depth_t image);
15209int __ovld get_image_num_samples(write_only image2d_array_msaa_t image);
15210int __ovld get_image_num_samples(write_only image2d_array_msaa_depth_t image);
15212#if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0)
15213int __ovld get_image_num_samples(read_write image2d_msaa_t image);
15214int __ovld get_image_num_samples(read_write image2d_msaa_depth_t image);
15215int __ovld get_image_num_samples(read_write image2d_array_msaa_t image);
15216int __ovld get_image_num_samples(read_write image2d_array_msaa_depth_t image);
15222#if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0)
15323#if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0)
15329#if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0)
15362#if defined(cl_intel_subgroups) || defined(cl_khr_subgroups)
15367#if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0)
15368uint __ovld get_enqueued_num_sub_groups(
void);
15374#if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0)
15405long __ovld __conv sub_group_scan_exclusive_add(
long x);
15407float __ovld __conv sub_group_scan_exclusive_add(
float x);
15410long __ovld __conv sub_group_scan_exclusive_min(
long x);
15412float __ovld __conv sub_group_scan_exclusive_min(
float x);
15415long __ovld __conv sub_group_scan_exclusive_max(
long x);
15417float __ovld __conv sub_group_scan_exclusive_max(
float x);
15421long __ovld __conv sub_group_scan_inclusive_add(
long x);
15423float __ovld __conv sub_group_scan_inclusive_add(
float x);
15426long __ovld __conv sub_group_scan_inclusive_min(
long x);
15428float __ovld __conv sub_group_scan_inclusive_min(
float x);
15431long __ovld __conv sub_group_scan_inclusive_max(
long x);
15433float __ovld __conv sub_group_scan_inclusive_max(
float x);
15440half
__ovld __conv sub_group_scan_exclusive_add(half x);
15441half
__ovld __conv sub_group_scan_exclusive_min(half x);
15442half
__ovld __conv sub_group_scan_exclusive_max(half x);
15443half
__ovld __conv sub_group_scan_inclusive_add(half x);
15444half
__ovld __conv sub_group_scan_inclusive_min(half x);
15445half
__ovld __conv sub_group_scan_inclusive_max(half x);
15449double __ovld __conv sub_group_broadcast(
double x,
uint sub_group_local_id);
15453double __ovld __conv sub_group_scan_exclusive_add(
double x);
15454double __ovld __conv sub_group_scan_exclusive_min(
double x);
15455double __ovld __conv sub_group_scan_exclusive_max(
double x);
15456double __ovld __conv sub_group_scan_inclusive_add(
double x);
15457double __ovld __conv sub_group_scan_inclusive_min(
double x);
15458double __ovld __conv sub_group_scan_inclusive_max(
double x);
15463#if defined(cl_khr_subgroup_extended_types)
15529short __ovld __conv sub_group_reduce_add(
short value );
15534short __ovld __conv sub_group_reduce_min(
short value );
15539short __ovld __conv sub_group_reduce_max(
short value );
15542char __ovld __conv sub_group_scan_inclusive_add(
char value );
15544short __ovld __conv sub_group_scan_inclusive_add(
short value );
15547char __ovld __conv sub_group_scan_inclusive_min(
char value );
15549short __ovld __conv sub_group_scan_inclusive_min(
short value );
15552char __ovld __conv sub_group_scan_inclusive_max(
char value );
15554short __ovld __conv sub_group_scan_inclusive_max(
short value );
15557char __ovld __conv sub_group_scan_exclusive_add(
char value );
15559short __ovld __conv sub_group_scan_exclusive_add(
short value );
15562char __ovld __conv sub_group_scan_exclusive_min(
char value );
15564short __ovld __conv sub_group_scan_exclusive_min(
short value );
15567char __ovld __conv sub_group_scan_exclusive_max(
char value );
15569short __ovld __conv sub_group_scan_exclusive_max(
short value );
15572#if defined(cl_khr_fp16)
15581#if defined(cl_khr_fp64)
15592#if defined(cl_khr_subgroup_non_uniform_vote)
15593int __ovld sub_group_elect(
void);
15594int __ovld sub_group_non_uniform_all(
int predicate );
15595int __ovld sub_group_non_uniform_any(
int predicate );
15597int __ovld sub_group_non_uniform_all_equal(
char value );
15598int __ovld sub_group_non_uniform_all_equal(
uchar value );
15599int __ovld sub_group_non_uniform_all_equal(
short value );
15600int __ovld sub_group_non_uniform_all_equal(
ushort value );
15601int __ovld sub_group_non_uniform_all_equal(
int value );
15602int __ovld sub_group_non_uniform_all_equal(
uint value );
15603int __ovld sub_group_non_uniform_all_equal(
long value );
15604int __ovld sub_group_non_uniform_all_equal(
ulong value );
15605int __ovld sub_group_non_uniform_all_equal(
float value );
15607#if defined(cl_khr_fp16)
15608int __ovld sub_group_non_uniform_all_equal( half value );
15611#if defined(cl_khr_fp64)
15612int __ovld sub_group_non_uniform_all_equal(
double value );
15617#if defined(cl_khr_subgroup_ballot)
15618char __ovld sub_group_non_uniform_broadcast(
char value,
uint index );
15619char2
__ovld sub_group_non_uniform_broadcast( char2 value,
uint index );
15620char3
__ovld sub_group_non_uniform_broadcast( char3 value,
uint index );
15621char4
__ovld sub_group_non_uniform_broadcast( char4 value,
uint index );
15622char8
__ovld sub_group_non_uniform_broadcast( char8 value,
uint index );
15623char16
__ovld sub_group_non_uniform_broadcast( char16 value,
uint index );
15626uchar2
__ovld sub_group_non_uniform_broadcast( uchar2 value,
uint index );
15627uchar3
__ovld sub_group_non_uniform_broadcast( uchar3 value,
uint index );
15628uchar4
__ovld sub_group_non_uniform_broadcast( uchar4 value,
uint index );
15629uchar8
__ovld sub_group_non_uniform_broadcast( uchar8 value,
uint index );
15630uchar16
__ovld sub_group_non_uniform_broadcast( uchar16 value,
uint index );
15632short __ovld sub_group_non_uniform_broadcast(
short value,
uint index );
15633short2
__ovld sub_group_non_uniform_broadcast( short2 value,
uint index );
15634short3
__ovld sub_group_non_uniform_broadcast( short3 value,
uint index );
15635short4
__ovld sub_group_non_uniform_broadcast( short4 value,
uint index );
15636short8
__ovld sub_group_non_uniform_broadcast( short8 value,
uint index );
15637short16
__ovld sub_group_non_uniform_broadcast( short16 value,
uint index );
15640ushort2
__ovld sub_group_non_uniform_broadcast( ushort2 value,
uint index );
15641ushort3
__ovld sub_group_non_uniform_broadcast( ushort3 value,
uint index );
15642ushort4
__ovld sub_group_non_uniform_broadcast( ushort4 value,
uint index );
15643ushort8
__ovld sub_group_non_uniform_broadcast( ushort8 value,
uint index );
15644ushort16
__ovld sub_group_non_uniform_broadcast( ushort16 value,
uint index );
15646int __ovld sub_group_non_uniform_broadcast(
int value,
uint index );
15647int2
__ovld sub_group_non_uniform_broadcast( int2 value,
uint index );
15648int3
__ovld sub_group_non_uniform_broadcast( int3 value,
uint index );
15649int4
__ovld sub_group_non_uniform_broadcast( int4 value,
uint index );
15654uint2
__ovld sub_group_non_uniform_broadcast( uint2 value,
uint index );
15655uint3
__ovld sub_group_non_uniform_broadcast( uint3 value,
uint index );
15656uint4
__ovld sub_group_non_uniform_broadcast( uint4 value,
uint index );
15660long __ovld sub_group_non_uniform_broadcast(
long value,
uint index );
15661long2
__ovld sub_group_non_uniform_broadcast( long2 value,
uint index );
15662long3
__ovld sub_group_non_uniform_broadcast( long3 value,
uint index );
15663long4
__ovld sub_group_non_uniform_broadcast( long4 value,
uint index );
15664long8
__ovld sub_group_non_uniform_broadcast( long8 value,
uint index );
15665long16
__ovld sub_group_non_uniform_broadcast( long16 value,
uint index );
15668ulong2
__ovld sub_group_non_uniform_broadcast( ulong2 value,
uint index );
15669ulong3
__ovld sub_group_non_uniform_broadcast( ulong3 value,
uint index );
15670ulong4
__ovld sub_group_non_uniform_broadcast( ulong4 value,
uint index );
15671ulong8
__ovld sub_group_non_uniform_broadcast( ulong8 value,
uint index );
15672ulong16
__ovld sub_group_non_uniform_broadcast( ulong16 value,
uint index );
15674float __ovld sub_group_non_uniform_broadcast(
float value,
uint index );
15675float2
__ovld sub_group_non_uniform_broadcast( float2 value,
uint index );
15676float3
__ovld sub_group_non_uniform_broadcast( float3 value,
uint index );
15677float4
__ovld sub_group_non_uniform_broadcast( float4 value,
uint index );
15678float8
__ovld sub_group_non_uniform_broadcast( float8 value,
uint index );
15679float16
__ovld sub_group_non_uniform_broadcast( float16 value,
uint index );
15681char __ovld sub_group_broadcast_first(
char value );
15683short __ovld sub_group_broadcast_first(
short value );
15685int __ovld sub_group_broadcast_first(
int value );
15687long __ovld sub_group_broadcast_first(
long value );
15689float __ovld sub_group_broadcast_first(
float value );
15691uint4
__ovld sub_group_ballot(
int predicate );
15692int __ovld __cnfn sub_group_inverse_ballot( uint4 value );
15696uint __ovld sub_group_ballot_inclusive_scan( uint4 value );
15697uint __ovld sub_group_ballot_exclusive_scan( uint4 value );
15698uint __ovld sub_group_ballot_find_lsb( uint4 value );
15699uint __ovld sub_group_ballot_find_msb( uint4 value );
15707#if defined(cl_khr_fp16)
15708half
__ovld sub_group_non_uniform_broadcast( half value,
uint index );
15709half2
__ovld sub_group_non_uniform_broadcast( half2 value,
uint index );
15710half3
__ovld sub_group_non_uniform_broadcast( half3 value,
uint index );
15711half4
__ovld sub_group_non_uniform_broadcast( half4 value,
uint index );
15712half8
__ovld sub_group_non_uniform_broadcast( half8 value,
uint index );
15713half16
__ovld sub_group_non_uniform_broadcast( half16 value,
uint index );
15715half
__ovld sub_group_broadcast_first( half value );
15718#if defined(cl_khr_fp64)
15719double __ovld sub_group_non_uniform_broadcast(
double value,
uint index );
15720double2
__ovld sub_group_non_uniform_broadcast( double2 value,
uint index );
15721double3
__ovld sub_group_non_uniform_broadcast( double3 value,
uint index );
15722double4
__ovld sub_group_non_uniform_broadcast( double4 value,
uint index );
15723double8
__ovld sub_group_non_uniform_broadcast( double8 value,
uint index );
15724double16
__ovld sub_group_non_uniform_broadcast( double16 value,
uint index );
15726double __ovld sub_group_broadcast_first(
double value );
15731#if defined(cl_khr_subgroup_non_uniform_arithmetic)
15732char __ovld sub_group_non_uniform_reduce_add(
char value );
15734short __ovld sub_group_non_uniform_reduce_add(
short value );
15736int __ovld sub_group_non_uniform_reduce_add(
int value );
15738long __ovld sub_group_non_uniform_reduce_add(
long value );
15740float __ovld sub_group_non_uniform_reduce_add(
float value );
15742char __ovld sub_group_non_uniform_reduce_mul(
char value );
15744short __ovld sub_group_non_uniform_reduce_mul(
short value );
15746int __ovld sub_group_non_uniform_reduce_mul(
int value );
15748long __ovld sub_group_non_uniform_reduce_mul(
long value );
15750float __ovld sub_group_non_uniform_reduce_mul(
float value );
15752char __ovld sub_group_non_uniform_reduce_min(
char value );
15754short __ovld sub_group_non_uniform_reduce_min(
short value );
15756int __ovld sub_group_non_uniform_reduce_min(
int value );
15758long __ovld sub_group_non_uniform_reduce_min(
long value );
15760float __ovld sub_group_non_uniform_reduce_min(
float value );
15762char __ovld sub_group_non_uniform_reduce_max(
char value );
15764short __ovld sub_group_non_uniform_reduce_max(
short value );
15766int __ovld sub_group_non_uniform_reduce_max(
int value );
15768long __ovld sub_group_non_uniform_reduce_max(
long value );
15770float __ovld sub_group_non_uniform_reduce_max(
float value );
15772char __ovld sub_group_non_uniform_scan_inclusive_add(
char value );
15774short __ovld sub_group_non_uniform_scan_inclusive_add(
short value );
15776int __ovld sub_group_non_uniform_scan_inclusive_add(
int value );
15777uint __ovld sub_group_non_uniform_scan_inclusive_add(
uint value );
15778long __ovld sub_group_non_uniform_scan_inclusive_add(
long value );
15780float __ovld sub_group_non_uniform_scan_inclusive_add(
float value );
15782char __ovld sub_group_non_uniform_scan_inclusive_mul(
char value );
15784short __ovld sub_group_non_uniform_scan_inclusive_mul(
short value );
15786int __ovld sub_group_non_uniform_scan_inclusive_mul(
int value );
15787uint __ovld sub_group_non_uniform_scan_inclusive_mul(
uint value );
15788long __ovld sub_group_non_uniform_scan_inclusive_mul(
long value );
15790float __ovld sub_group_non_uniform_scan_inclusive_mul(
float value );
15792char __ovld sub_group_non_uniform_scan_inclusive_min(
char value );
15794short __ovld sub_group_non_uniform_scan_inclusive_min(
short value );
15796int __ovld sub_group_non_uniform_scan_inclusive_min(
int value );
15797uint __ovld sub_group_non_uniform_scan_inclusive_min(
uint value );
15798long __ovld sub_group_non_uniform_scan_inclusive_min(
long value );
15800float __ovld sub_group_non_uniform_scan_inclusive_min(
float value );
15802char __ovld sub_group_non_uniform_scan_inclusive_max(
char value );
15804short __ovld sub_group_non_uniform_scan_inclusive_max(
short value );
15806int __ovld sub_group_non_uniform_scan_inclusive_max(
int value );
15807uint __ovld sub_group_non_uniform_scan_inclusive_max(
uint value );
15808long __ovld sub_group_non_uniform_scan_inclusive_max(
long value );
15810float __ovld sub_group_non_uniform_scan_inclusive_max(
float value );
15812char __ovld sub_group_non_uniform_scan_exclusive_add(
char value );
15814short __ovld sub_group_non_uniform_scan_exclusive_add(
short value );
15816int __ovld sub_group_non_uniform_scan_exclusive_add(
int value );
15817uint __ovld sub_group_non_uniform_scan_exclusive_add(
uint value );
15818long __ovld sub_group_non_uniform_scan_exclusive_add(
long value );
15820float __ovld sub_group_non_uniform_scan_exclusive_add(
float value );
15822char __ovld sub_group_non_uniform_scan_exclusive_mul(
char value );
15824short __ovld sub_group_non_uniform_scan_exclusive_mul(
short value );
15826int __ovld sub_group_non_uniform_scan_exclusive_mul(
int value );
15827uint __ovld sub_group_non_uniform_scan_exclusive_mul(
uint value );
15828long __ovld sub_group_non_uniform_scan_exclusive_mul(
long value );
15830float __ovld sub_group_non_uniform_scan_exclusive_mul(
float value );
15832char __ovld sub_group_non_uniform_scan_exclusive_min(
char value );
15834short __ovld sub_group_non_uniform_scan_exclusive_min(
short value );
15836int __ovld sub_group_non_uniform_scan_exclusive_min(
int value );
15837uint __ovld sub_group_non_uniform_scan_exclusive_min(
uint value );
15838long __ovld sub_group_non_uniform_scan_exclusive_min(
long value );
15840float __ovld sub_group_non_uniform_scan_exclusive_min(
float value );
15842char __ovld sub_group_non_uniform_scan_exclusive_max(
char value );
15844short __ovld sub_group_non_uniform_scan_exclusive_max(
short value );
15846int __ovld sub_group_non_uniform_scan_exclusive_max(
int value );
15847uint __ovld sub_group_non_uniform_scan_exclusive_max(
uint value );
15848long __ovld sub_group_non_uniform_scan_exclusive_max(
long value );
15850float __ovld sub_group_non_uniform_scan_exclusive_max(
float value );
15852char __ovld sub_group_non_uniform_reduce_and(
char value );
15854short __ovld sub_group_non_uniform_reduce_and(
short value );
15856int __ovld sub_group_non_uniform_reduce_and(
int value );
15858long __ovld sub_group_non_uniform_reduce_and(
long value );
15861char __ovld sub_group_non_uniform_reduce_or(
char value );
15863short __ovld sub_group_non_uniform_reduce_or(
short value );
15865int __ovld sub_group_non_uniform_reduce_or(
int value );
15867long __ovld sub_group_non_uniform_reduce_or(
long value );
15870char __ovld sub_group_non_uniform_reduce_xor(
char value );
15872short __ovld sub_group_non_uniform_reduce_xor(
short value );
15874int __ovld sub_group_non_uniform_reduce_xor(
int value );
15876long __ovld sub_group_non_uniform_reduce_xor(
long value );
15879char __ovld sub_group_non_uniform_scan_inclusive_and(
char value );
15881short __ovld sub_group_non_uniform_scan_inclusive_and(
short value );
15883int __ovld sub_group_non_uniform_scan_inclusive_and(
int value );
15884uint __ovld sub_group_non_uniform_scan_inclusive_and(
uint value );
15885long __ovld sub_group_non_uniform_scan_inclusive_and(
long value );
15888char __ovld sub_group_non_uniform_scan_inclusive_or(
char value );
15890short __ovld sub_group_non_uniform_scan_inclusive_or(
short value );
15892int __ovld sub_group_non_uniform_scan_inclusive_or(
int value );
15893uint __ovld sub_group_non_uniform_scan_inclusive_or(
uint value );
15894long __ovld sub_group_non_uniform_scan_inclusive_or(
long value );
15897char __ovld sub_group_non_uniform_scan_inclusive_xor(
char value );
15899short __ovld sub_group_non_uniform_scan_inclusive_xor(
short value );
15901int __ovld sub_group_non_uniform_scan_inclusive_xor(
int value );
15902uint __ovld sub_group_non_uniform_scan_inclusive_xor(
uint value );
15903long __ovld sub_group_non_uniform_scan_inclusive_xor(
long value );
15906char __ovld sub_group_non_uniform_scan_exclusive_and(
char value );
15908short __ovld sub_group_non_uniform_scan_exclusive_and(
short value );
15910int __ovld sub_group_non_uniform_scan_exclusive_and(
int value );
15911uint __ovld sub_group_non_uniform_scan_exclusive_and(
uint value );
15912long __ovld sub_group_non_uniform_scan_exclusive_and(
long value );
15915char __ovld sub_group_non_uniform_scan_exclusive_or(
char value );
15917short __ovld sub_group_non_uniform_scan_exclusive_or(
short value );
15919int __ovld sub_group_non_uniform_scan_exclusive_or(
int value );
15920uint __ovld sub_group_non_uniform_scan_exclusive_or(
uint value );
15921long __ovld sub_group_non_uniform_scan_exclusive_or(
long value );
15924char __ovld sub_group_non_uniform_scan_exclusive_xor(
char value );
15926short __ovld sub_group_non_uniform_scan_exclusive_xor(
short value );
15928int __ovld sub_group_non_uniform_scan_exclusive_xor(
int value );
15929uint __ovld sub_group_non_uniform_scan_exclusive_xor(
uint value );
15930long __ovld sub_group_non_uniform_scan_exclusive_xor(
long value );
15933int __ovld sub_group_non_uniform_reduce_logical_and(
int predicate );
15934int __ovld sub_group_non_uniform_reduce_logical_or(
int predicate );
15935int __ovld sub_group_non_uniform_reduce_logical_xor(
int predicate );
15937int __ovld sub_group_non_uniform_scan_inclusive_logical_and(
int predicate );
15938int __ovld sub_group_non_uniform_scan_inclusive_logical_or(
int predicate );
15939int __ovld sub_group_non_uniform_scan_inclusive_logical_xor(
int predicate );
15941int __ovld sub_group_non_uniform_scan_exclusive_logical_and(
int predicate );
15942int __ovld sub_group_non_uniform_scan_exclusive_logical_or(
int predicate );
15943int __ovld sub_group_non_uniform_scan_exclusive_logical_xor(
int predicate );
15945#if defined(cl_khr_fp16)
15946half
__ovld sub_group_non_uniform_reduce_add( half value );
15947half
__ovld sub_group_non_uniform_reduce_mul( half value );
15948half
__ovld sub_group_non_uniform_reduce_min( half value );
15949half
__ovld sub_group_non_uniform_reduce_max( half value );
15950half
__ovld sub_group_non_uniform_scan_inclusive_add( half value );
15951half
__ovld sub_group_non_uniform_scan_inclusive_mul( half value );
15952half
__ovld sub_group_non_uniform_scan_inclusive_min( half value );
15953half
__ovld sub_group_non_uniform_scan_inclusive_max( half value );
15954half
__ovld sub_group_non_uniform_scan_exclusive_add( half value );
15955half
__ovld sub_group_non_uniform_scan_exclusive_mul( half value );
15956half
__ovld sub_group_non_uniform_scan_exclusive_min( half value );
15957half
__ovld sub_group_non_uniform_scan_exclusive_max( half value );
15960#if defined(cl_khr_fp64)
15961double __ovld sub_group_non_uniform_reduce_add(
double value );
15962double __ovld sub_group_non_uniform_reduce_mul(
double value );
15963double __ovld sub_group_non_uniform_reduce_min(
double value );
15964double __ovld sub_group_non_uniform_reduce_max(
double value );
15965double __ovld sub_group_non_uniform_scan_inclusive_add(
double value );
15966double __ovld sub_group_non_uniform_scan_inclusive_mul(
double value );
15967double __ovld sub_group_non_uniform_scan_inclusive_min(
double value );
15968double __ovld sub_group_non_uniform_scan_inclusive_max(
double value );
15969double __ovld sub_group_non_uniform_scan_exclusive_add(
double value );
15970double __ovld sub_group_non_uniform_scan_exclusive_mul(
double value );
15971double __ovld sub_group_non_uniform_scan_exclusive_min(
double value );
15972double __ovld sub_group_non_uniform_scan_exclusive_max(
double value );
15977#if defined(cl_khr_subgroup_shuffle)
15978char __ovld sub_group_shuffle(
char value,
uint index );
15980short __ovld sub_group_shuffle(
short value,
uint index );
15982int __ovld sub_group_shuffle(
int value,
uint index );
15984long __ovld sub_group_shuffle(
long value,
uint index );
15986float __ovld sub_group_shuffle(
float value,
uint index );
15988char __ovld sub_group_shuffle_xor(
char value,
uint mask );
15990short __ovld sub_group_shuffle_xor(
short value,
uint mask );
15992int __ovld sub_group_shuffle_xor(
int value,
uint mask );
15994long __ovld sub_group_shuffle_xor(
long value,
uint mask );
15996float __ovld sub_group_shuffle_xor(
float value,
uint mask );
15998#if defined(cl_khr_fp16)
15999half
__ovld sub_group_shuffle( half value,
uint index );
16000half
__ovld sub_group_shuffle_xor( half value,
uint mask );
16003#if defined(cl_khr_fp64)
16004double __ovld sub_group_shuffle(
double value,
uint index );
16005double __ovld sub_group_shuffle_xor(
double value,
uint mask );
16010#if defined(cl_khr_subgroup_shuffle_relative)
16011char __ovld sub_group_shuffle_up(
char value,
uint delta );
16013short __ovld sub_group_shuffle_up(
short value,
uint delta );
16015int __ovld sub_group_shuffle_up(
int value,
uint delta );
16017long __ovld sub_group_shuffle_up(
long value,
uint delta );
16019float __ovld sub_group_shuffle_up(
float value,
uint delta );
16021char __ovld sub_group_shuffle_down(
char value,
uint delta );
16023short __ovld sub_group_shuffle_down(
short value,
uint delta );
16025int __ovld sub_group_shuffle_down(
int value,
uint delta );
16027long __ovld sub_group_shuffle_down(
long value,
uint delta );
16029float __ovld sub_group_shuffle_down(
float value,
uint delta );
16031#if defined(cl_khr_fp16)
16032half
__ovld sub_group_shuffle_up( half value,
uint delta );
16033half
__ovld sub_group_shuffle_down( half value,
uint delta );
16036#if defined(cl_khr_fp64)
16037double __ovld sub_group_shuffle_up(
double value,
uint delta );
16038double __ovld sub_group_shuffle_down(
double value,
uint delta );
16043#if defined(cl_khr_subgroup_clustered_reduce)
16044char __ovld sub_group_clustered_reduce_add(
char value,
uint clustersize );
16046short __ovld sub_group_clustered_reduce_add(
short value,
uint clustersize );
16048int __ovld sub_group_clustered_reduce_add(
int value,
uint clustersize );
16050long __ovld sub_group_clustered_reduce_add(
long value,
uint clustersize );
16052float __ovld sub_group_clustered_reduce_add(
float value,
uint clustersize );
16054char __ovld sub_group_clustered_reduce_mul(
char value,
uint clustersize );
16056short __ovld sub_group_clustered_reduce_mul(
short value,
uint clustersize );
16058int __ovld sub_group_clustered_reduce_mul(
int value,
uint clustersize );
16060long __ovld sub_group_clustered_reduce_mul(
long value,
uint clustersize );
16062float __ovld sub_group_clustered_reduce_mul(
float value,
uint clustersize );
16064char __ovld sub_group_clustered_reduce_min(
char value,
uint clustersize );
16066short __ovld sub_group_clustered_reduce_min(
short value,
uint clustersize );
16068int __ovld sub_group_clustered_reduce_min(
int value,
uint clustersize );
16070long __ovld sub_group_clustered_reduce_min(
long value,
uint clustersize );
16072float __ovld sub_group_clustered_reduce_min(
float value,
uint clustersize );
16074char __ovld sub_group_clustered_reduce_max(
char value,
uint clustersize );
16076short __ovld sub_group_clustered_reduce_max(
short value,
uint clustersize );
16078int __ovld sub_group_clustered_reduce_max(
int value,
uint clustersize );
16080long __ovld sub_group_clustered_reduce_max(
long value,
uint clustersize );
16082float __ovld sub_group_clustered_reduce_max(
float value,
uint clustersize );
16084char __ovld sub_group_clustered_reduce_and(
char value,
uint clustersize );
16086short __ovld sub_group_clustered_reduce_and(
short value,
uint clustersize );
16088int __ovld sub_group_clustered_reduce_and(
int value,
uint clustersize );
16090long __ovld sub_group_clustered_reduce_and(
long value,
uint clustersize );
16093char __ovld sub_group_clustered_reduce_or(
char value,
uint clustersize );
16095short __ovld sub_group_clustered_reduce_or(
short value,
uint clustersize );
16097int __ovld sub_group_clustered_reduce_or(
int value,
uint clustersize );
16099long __ovld sub_group_clustered_reduce_or(
long value,
uint clustersize );
16102char __ovld sub_group_clustered_reduce_xor(
char value,
uint clustersize );
16104short __ovld sub_group_clustered_reduce_xor(
short value,
uint clustersize );
16106int __ovld sub_group_clustered_reduce_xor(
int value,
uint clustersize );
16108long __ovld sub_group_clustered_reduce_xor(
long value,
uint clustersize );
16111int __ovld sub_group_clustered_reduce_logical_and(
int predicate,
uint clustersize );
16112int __ovld sub_group_clustered_reduce_logical_or(
int predicate,
uint clustersize );
16113int __ovld sub_group_clustered_reduce_logical_xor(
int predicate,
uint clustersize );
16115#if defined(cl_khr_fp16)
16116half
__ovld sub_group_clustered_reduce_add( half value,
uint clustersize );
16117half
__ovld sub_group_clustered_reduce_mul( half value,
uint clustersize );
16118half
__ovld sub_group_clustered_reduce_min( half value,
uint clustersize );
16119half
__ovld sub_group_clustered_reduce_max( half value,
uint clustersize );
16122#if defined(cl_khr_fp64)
16123double __ovld sub_group_clustered_reduce_add(
double value,
uint clustersize );
16124double __ovld sub_group_clustered_reduce_mul(
double value,
uint clustersize );
16125double __ovld sub_group_clustered_reduce_min(
double value,
uint clustersize );
16126double __ovld sub_group_clustered_reduce_max(
double value,
uint clustersize );
16131#if defined(cl_intel_subgroups)
16157float __ovld __conv intel_sub_group_shuffle_down(
float cur,
float next,
uint c );
16158float2
__ovld __conv intel_sub_group_shuffle_down( float2 cur, float2 next,
uint c );
16159float3
__ovld __conv intel_sub_group_shuffle_down( float3 cur, float3 next,
uint c );
16160float4
__ovld __conv intel_sub_group_shuffle_down( float4 cur, float4 next,
uint c );
16161float8
__ovld __conv intel_sub_group_shuffle_down( float8 cur, float8 next,
uint c );
16162float16
__ovld __conv intel_sub_group_shuffle_down( float16 cur, float16 next,
uint c );
16172uint2
__ovld __conv intel_sub_group_shuffle_down( uint2 cur, uint2 next,
uint c );
16173uint3
__ovld __conv intel_sub_group_shuffle_down( uint3 cur, uint3 next,
uint c );
16174uint4
__ovld __conv intel_sub_group_shuffle_down( uint4 cur, uint4 next,
uint c );
16181float __ovld __conv intel_sub_group_shuffle_up(
float prev,
float cur,
uint c );
16182float2
__ovld __conv intel_sub_group_shuffle_up( float2 prev, float2 cur,
uint c );
16183float3
__ovld __conv intel_sub_group_shuffle_up( float3 prev, float3 cur,
uint c );
16184float4
__ovld __conv intel_sub_group_shuffle_up( float4 prev, float4 cur,
uint c );
16185float8
__ovld __conv intel_sub_group_shuffle_up( float8 prev, float8 cur,
uint c );
16186float16
__ovld __conv intel_sub_group_shuffle_up( float16 prev, float16 cur,
uint c );
16196uint2
__ovld __conv intel_sub_group_shuffle_up( uint2 prev, uint2 cur,
uint c );
16197uint3
__ovld __conv intel_sub_group_shuffle_up( uint3 prev, uint3 cur,
uint c );
16198uint4
__ovld __conv intel_sub_group_shuffle_up( uint4 prev, uint4 cur,
uint c );
16229uint __ovld __conv intel_sub_group_block_read( read_only image2d_t image, int2 coord );
16230uint2
__ovld __conv intel_sub_group_block_read2( read_only image2d_t image, int2 coord );
16231uint4
__ovld __conv intel_sub_group_block_read4( read_only image2d_t image, int2 coord );
16232uint8 __ovld __conv intel_sub_group_block_read8( read_only image2d_t image, int2 coord );
16234#if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0)
16235uint __ovld __conv intel_sub_group_block_read(read_write image2d_t image, int2 coord);
16236uint2
__ovld __conv intel_sub_group_block_read2(read_write image2d_t image, int2 coord);
16237uint4
__ovld __conv intel_sub_group_block_read4(read_write image2d_t image, int2 coord);
16238uint8 __ovld __conv intel_sub_group_block_read8(read_write image2d_t image, int2 coord);
16246void __ovld __conv intel_sub_group_block_write(write_only image2d_t image, int2 coord,
uint data);
16247void __ovld __conv intel_sub_group_block_write2(write_only image2d_t image, int2 coord, uint2 data);
16248void __ovld __conv intel_sub_group_block_write4(write_only image2d_t image, int2 coord, uint4 data);
16249void __ovld __conv intel_sub_group_block_write8(write_only image2d_t image, int2 coord,
uint8 data);
16251#if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0)
16252void __ovld __conv intel_sub_group_block_write(read_write image2d_t image, int2 coord,
uint data);
16253void __ovld __conv intel_sub_group_block_write2(read_write image2d_t image, int2 coord, uint2 data);
16254void __ovld __conv intel_sub_group_block_write4(read_write image2d_t image, int2 coord, uint4 data);
16255void __ovld __conv intel_sub_group_block_write8(read_write image2d_t image, int2 coord,
uint8 data);
16259void __ovld __conv intel_sub_group_block_write2( __global
uint* p, uint2 data );
16260void __ovld __conv intel_sub_group_block_write4( __global
uint* p, uint4 data );
16270#if defined(cl_khr_fp64)
16272double __ovld __conv intel_sub_group_shuffle_down(
double prev,
double cur,
uint c );
16273double __ovld __conv intel_sub_group_shuffle_up(
double prev,
double cur,
uint c );
16279#if defined(cl_intel_subgroups_short)
16280short __ovld __conv intel_sub_group_broadcast(
short x,
uint sub_group_local_id );
16281short2
__ovld __conv intel_sub_group_broadcast( short2 x,
uint sub_group_local_id );
16282short3
__ovld __conv intel_sub_group_broadcast( short3 x,
uint sub_group_local_id );
16283short4
__ovld __conv intel_sub_group_broadcast( short4 x,
uint sub_group_local_id );
16284short8
__ovld __conv intel_sub_group_broadcast( short8 x,
uint sub_group_local_id );
16287ushort2
__ovld __conv intel_sub_group_broadcast( ushort2 x,
uint sub_group_local_id );
16288ushort3
__ovld __conv intel_sub_group_broadcast( ushort3 x,
uint sub_group_local_id );
16289ushort4
__ovld __conv intel_sub_group_broadcast( ushort4 x,
uint sub_group_local_id );
16290ushort8
__ovld __conv intel_sub_group_broadcast( ushort8 x,
uint sub_group_local_id );
16306short __ovld __conv intel_sub_group_shuffle_down(
short cur,
short next,
uint c );
16307short2
__ovld __conv intel_sub_group_shuffle_down( short2 cur, short2 next,
uint c );
16308short3
__ovld __conv intel_sub_group_shuffle_down( short3 cur, short3 next,
uint c );
16309short4
__ovld __conv intel_sub_group_shuffle_down( short4 cur, short4 next,
uint c );
16310short8
__ovld __conv intel_sub_group_shuffle_down( short8 cur, short8 next,
uint c );
16311short16
__ovld __conv intel_sub_group_shuffle_down( short16 cur, short16 next,
uint c );
16314ushort2
__ovld __conv intel_sub_group_shuffle_down( ushort2 cur, ushort2 next,
uint c );
16315ushort3
__ovld __conv intel_sub_group_shuffle_down( ushort3 cur, ushort3 next,
uint c );
16316ushort4
__ovld __conv intel_sub_group_shuffle_down( ushort4 cur, ushort4 next,
uint c );
16317ushort8
__ovld __conv intel_sub_group_shuffle_down( ushort8 cur, ushort8 next,
uint c );
16318ushort16
__ovld __conv intel_sub_group_shuffle_down( ushort16 cur, ushort16 next,
uint c );
16320short __ovld __conv intel_sub_group_shuffle_up(
short cur,
short next,
uint c );
16321short2
__ovld __conv intel_sub_group_shuffle_up( short2 cur, short2 next,
uint c );
16322short3
__ovld __conv intel_sub_group_shuffle_up( short3 cur, short3 next,
uint c );
16323short4
__ovld __conv intel_sub_group_shuffle_up( short4 cur, short4 next,
uint c );
16324short8
__ovld __conv intel_sub_group_shuffle_up( short8 cur, short8 next,
uint c );
16325short16
__ovld __conv intel_sub_group_shuffle_up( short16 cur, short16 next,
uint c );
16328ushort2
__ovld __conv intel_sub_group_shuffle_up( ushort2 cur, ushort2 next,
uint c );
16329ushort3
__ovld __conv intel_sub_group_shuffle_up( ushort3 cur, ushort3 next,
uint c );
16330ushort4
__ovld __conv intel_sub_group_shuffle_up( ushort4 cur, ushort4 next,
uint c );
16331ushort8
__ovld __conv intel_sub_group_shuffle_up( ushort8 cur, ushort8 next,
uint c );
16332ushort16
__ovld __conv intel_sub_group_shuffle_up( ushort16 cur, ushort16 next,
uint c );
16348short __ovld __conv intel_sub_group_reduce_add(
short x );
16350short __ovld __conv intel_sub_group_reduce_min(
short x );
16352short __ovld __conv intel_sub_group_reduce_max(
short x );
16355short __ovld __conv intel_sub_group_scan_exclusive_add(
short x );
16357short __ovld __conv intel_sub_group_scan_exclusive_min(
short x );
16359short __ovld __conv intel_sub_group_scan_exclusive_max(
short x );
16362short __ovld __conv intel_sub_group_scan_inclusive_add(
short x );
16364short __ovld __conv intel_sub_group_scan_inclusive_min(
short x );
16366short __ovld __conv intel_sub_group_scan_inclusive_max(
short x );
16369uint __ovld __conv intel_sub_group_block_read_ui( read_only image2d_t image, int2 byte_coord );
16370uint2
__ovld __conv intel_sub_group_block_read_ui2( read_only image2d_t image, int2 byte_coord );
16371uint4
__ovld __conv intel_sub_group_block_read_ui4( read_only image2d_t image, int2 byte_coord );
16372uint8 __ovld __conv intel_sub_group_block_read_ui8( read_only image2d_t image, int2 byte_coord );
16374#if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0)
16375uint __ovld __conv intel_sub_group_block_read_ui( read_write image2d_t image, int2 byte_coord );
16376uint2
__ovld __conv intel_sub_group_block_read_ui2( read_write image2d_t image, int2 byte_coord );
16377uint4
__ovld __conv intel_sub_group_block_read_ui4( read_write image2d_t image, int2 byte_coord );
16378uint8 __ovld __conv intel_sub_group_block_read_ui8( read_write image2d_t image, int2 byte_coord );
16382uint2
__ovld __conv intel_sub_group_block_read_ui2(
const __global
uint* p );
16383uint4
__ovld __conv intel_sub_group_block_read_ui4(
const __global
uint* p );
16386void __ovld __conv intel_sub_group_block_write_ui( read_only image2d_t image, int2 byte_coord,
uint data );
16387void __ovld __conv intel_sub_group_block_write_ui2( read_only image2d_t image, int2 byte_coord, uint2 data );
16388void __ovld __conv intel_sub_group_block_write_ui4( read_only image2d_t image, int2 byte_coord, uint4 data );
16389void __ovld __conv intel_sub_group_block_write_ui8( read_only image2d_t image, int2 byte_coord,
uint8 data );
16391#if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0)
16392void __ovld __conv intel_sub_group_block_write_ui( read_write image2d_t image, int2 byte_coord,
uint data );
16393void __ovld __conv intel_sub_group_block_write_ui2( read_write image2d_t image, int2 byte_coord, uint2 data );
16394void __ovld __conv intel_sub_group_block_write_ui4( read_write image2d_t image, int2 byte_coord, uint4 data );
16395void __ovld __conv intel_sub_group_block_write_ui8( read_write image2d_t image, int2 byte_coord,
uint8 data );
16399void __ovld __conv intel_sub_group_block_write_ui2( __global
uint* p, uint2 data );
16400void __ovld __conv intel_sub_group_block_write_ui4( __global
uint* p, uint4 data );
16403ushort __ovld __conv intel_sub_group_block_read_us( read_only image2d_t image, int2 coord );
16404ushort2
__ovld __conv intel_sub_group_block_read_us2( read_only image2d_t image, int2 coord );
16405ushort4
__ovld __conv intel_sub_group_block_read_us4( read_only image2d_t image, int2 coord );
16406ushort8
__ovld __conv intel_sub_group_block_read_us8( read_only image2d_t image, int2 coord );
16408#if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0)
16409ushort __ovld __conv intel_sub_group_block_read_us(read_write image2d_t image, int2 coord);
16410ushort2
__ovld __conv intel_sub_group_block_read_us2(read_write image2d_t image, int2 coord);
16411ushort4
__ovld __conv intel_sub_group_block_read_us4(read_write image2d_t image, int2 coord);
16412ushort8
__ovld __conv intel_sub_group_block_read_us8(read_write image2d_t image, int2 coord);
16420void __ovld __conv intel_sub_group_block_write_us(write_only image2d_t image, int2 coord,
ushort data);
16421void __ovld __conv intel_sub_group_block_write_us2(write_only image2d_t image, int2 coord, ushort2 data);
16422void __ovld __conv intel_sub_group_block_write_us4(write_only image2d_t image, int2 coord, ushort4 data);
16423void __ovld __conv intel_sub_group_block_write_us8(write_only image2d_t image, int2 coord, ushort8 data);
16425#if defined(__OPENCL_CPP_VERSION__) || (__OPENCL_C_VERSION__ >= CL_VERSION_2_0)
16426void __ovld __conv intel_sub_group_block_write_us(read_write image2d_t image, int2 coord,
ushort data);
16427void __ovld __conv intel_sub_group_block_write_us2(read_write image2d_t image, int2 coord, ushort2 data);
16428void __ovld __conv intel_sub_group_block_write_us4(read_write image2d_t image, int2 coord, ushort4 data);
16429void __ovld __conv intel_sub_group_block_write_us8(read_write image2d_t image, int2 coord, ushort8 data);
16433void __ovld __conv intel_sub_group_block_write_us2( __global
ushort* p, ushort2 data );
16434void __ovld __conv intel_sub_group_block_write_us4( __global
ushort* p, ushort4 data );
16435void __ovld __conv intel_sub_group_block_write_us8( __global
ushort* p, ushort8 data );
16438#ifdef cl_intel_device_side_avc_motion_estimation
16439#pragma OPENCL EXTENSION cl_intel_device_side_avc_motion_estimation : begin
16443intel_sub_group_avc_mce_get_default_inter_base_multi_reference_penalty(
16445ulong __ovld intel_sub_group_avc_mce_get_default_inter_shape_penalty(
16447uchar __ovld intel_sub_group_avc_mce_get_default_inter_direction_penalty(
16449uint __ovld intel_sub_group_avc_mce_get_default_intra_luma_shape_penalty(
16452intel_sub_group_avc_mce_get_default_inter_motion_vector_cost_table(
16454uchar __ovld intel_sub_group_avc_mce_get_default_intra_luma_mode_penalty(
16457uint2
__ovld intel_sub_group_avc_mce_get_default_high_penalty_cost_table();
16458uint2
__ovld intel_sub_group_avc_mce_get_default_medium_penalty_cost_table();
16459uint2
__ovld intel_sub_group_avc_mce_get_default_low_penalty_cost_table();
16460uint __ovld intel_sub_group_avc_mce_get_default_non_dc_luma_intra_penalty();
16462intel_sub_group_avc_mce_get_default_intra_chroma_mode_base_penalty();
16464intel_sub_group_avc_mce_payload_t
__ovld
16465intel_sub_group_avc_mce_set_inter_base_multi_reference_penalty(
16466 uchar reference_base_penalty, intel_sub_group_avc_mce_payload_t payload);
16467intel_sub_group_avc_mce_payload_t
__ovld
16468intel_sub_group_avc_mce_set_inter_shape_penalty(
16469 ulong packed_shape_penalty, intel_sub_group_avc_mce_payload_t payload);
16470intel_sub_group_avc_mce_payload_t
__ovld
16471intel_sub_group_avc_mce_set_inter_direction_penalty(
16472 uchar direction_cost, intel_sub_group_avc_mce_payload_t payload);
16473intel_sub_group_avc_mce_payload_t
__ovld
16474intel_sub_group_avc_mce_set_motion_vector_cost_function(
16475 ulong packed_cost_center_delta, uint2 packed_cost_table,
16476 uchar cost_precision, intel_sub_group_avc_mce_payload_t payload);
16477intel_sub_group_avc_mce_payload_t
__ovld
16478intel_sub_group_avc_mce_set_ac_only_haar(
16479 intel_sub_group_avc_mce_payload_t payload);
16480intel_sub_group_avc_mce_payload_t
__ovld
16481intel_sub_group_avc_mce_set_source_interlaced_field_polarity(
16482 uchar src_field_polarity, intel_sub_group_avc_mce_payload_t payload);
16483intel_sub_group_avc_mce_payload_t
__ovld
16484intel_sub_group_avc_mce_set_single_reference_interlaced_field_polarity(
16485 uchar ref_field_polarity, intel_sub_group_avc_mce_payload_t payload);
16486intel_sub_group_avc_mce_payload_t
__ovld
16487intel_sub_group_avc_mce_set_dual_reference_interlaced_field_polarities(
16488 uchar fwd_ref_field_polarity,
uchar bwd_ref_field_polarity,
16489 intel_sub_group_avc_mce_payload_t payload);
16491ulong __ovld intel_sub_group_avc_mce_get_motion_vectors(
16492 intel_sub_group_avc_mce_result_t result);
16493ushort __ovld intel_sub_group_avc_mce_get_inter_distortions(
16494 intel_sub_group_avc_mce_result_t result);
16495ushort __ovld intel_sub_group_avc_mce_get_best_inter_distortion(
16496 intel_sub_group_avc_mce_result_t result);
16497uchar __ovld intel_sub_group_avc_mce_get_inter_major_shape(
16498 intel_sub_group_avc_mce_result_t result);
16499uchar __ovld intel_sub_group_avc_mce_get_inter_minor_shapes(
16500 intel_sub_group_avc_mce_result_t result);
16501uchar __ovld intel_sub_group_avc_mce_get_inter_directions(
16502 intel_sub_group_avc_mce_result_t result);
16503uchar __ovld intel_sub_group_avc_mce_get_inter_motion_vector_count(
16504 intel_sub_group_avc_mce_result_t result);
16505uint __ovld intel_sub_group_avc_mce_get_inter_reference_ids(
16506 intel_sub_group_avc_mce_result_t result);
16508intel_sub_group_avc_mce_get_inter_reference_interlaced_field_polarities(
16509 uint packed_reference_ids,
uint packed_reference_parameter_field_polarities,
16510 intel_sub_group_avc_mce_result_t result);
16513intel_sub_group_avc_ime_payload_t
__ovld
16514intel_sub_group_avc_ime_initialize(
16515 ushort2 src_coord,
uchar partition_mask,
uchar sad_adjustment);
16516intel_sub_group_avc_ime_payload_t
__ovld
16517intel_sub_group_avc_ime_set_single_reference(
16518 short2 ref_offset,
uchar search_window_config,
16519 intel_sub_group_avc_ime_payload_t payload);
16520intel_sub_group_avc_ime_payload_t
__ovld
16521intel_sub_group_avc_ime_set_dual_reference(
16522 short2 fwd_ref_offset, short2 bwd_ref_offset,
uchar search_window_config,
16523 intel_sub_group_avc_ime_payload_t payload);
16524intel_sub_group_avc_ime_payload_t
__ovld
16525intel_sub_group_avc_ime_set_max_motion_vector_count(
16526 uchar max_motion_vector_count, intel_sub_group_avc_ime_payload_t payload);
16527intel_sub_group_avc_ime_payload_t
__ovld
16528intel_sub_group_avc_ime_set_unidirectional_mix_disable(
16529 intel_sub_group_avc_ime_payload_t payload);
16530intel_sub_group_avc_ime_payload_t
__ovld
16531intel_sub_group_avc_ime_set_early_search_termination_threshold(
16532 uchar threshold, intel_sub_group_avc_ime_payload_t payload);
16533intel_sub_group_avc_ime_payload_t
__ovld
16534intel_sub_group_avc_ime_set_weighted_sad(
16535 uint packed_sad_weights, intel_sub_group_avc_ime_payload_t payload);
16537__attribute__((deprecated(
"If you use the latest Intel driver, please use "
16538 "intel_sub_group_avc_ime_ref_window_size instead",
16539 "intel_sub_group_avc_ime_ref_window_size")))
16541intel_sub_group_ime_ref_window_size(
uchar search_window_config,
char dual_ref);
16542ushort2
__ovld intel_sub_group_avc_ime_ref_window_size(
16543 uchar search_window_config,
char dual_ref);
16544short2
__ovld intel_sub_group_avc_ime_adjust_ref_offset(
16545 short2 ref_offset, ushort2 src_coord, ushort2 ref_window_size,
16546 ushort2 image_size);
16548intel_sub_group_avc_ime_result_t
__ovld
16549intel_sub_group_avc_ime_evaluate_with_single_reference(
16550 read_only image2d_t src_image, read_only image2d_t ref_image,
16551 sampler_t vme_media_sampler, intel_sub_group_avc_ime_payload_t payload);
16552intel_sub_group_avc_ime_result_t
__ovld
16553intel_sub_group_avc_ime_evaluate_with_dual_reference(
16554 read_only image2d_t src_image, read_only image2d_t fwd_ref_image,
16555 read_only image2d_t bwd_ref_image, sampler_t vme_media_sampler,
16556 intel_sub_group_avc_ime_payload_t payload);
16557intel_sub_group_avc_ime_result_single_reference_streamout_t
__ovld
16558intel_sub_group_avc_ime_evaluate_with_single_reference_streamout(
16559 read_only image2d_t src_image, read_only image2d_t ref_image,
16560 sampler_t vme_media_sampler, intel_sub_group_avc_ime_payload_t payload);
16561intel_sub_group_avc_ime_result_dual_reference_streamout_t
__ovld
16562intel_sub_group_avc_ime_evaluate_with_dual_reference_streamout(
16563 read_only image2d_t src_image, read_only image2d_t fwd_ref_image,
16564 read_only image2d_t bwd_ref_image, sampler_t vme_media_sampler,
16565 intel_sub_group_avc_ime_payload_t payload);
16566intel_sub_group_avc_ime_result_t
__ovld
16567intel_sub_group_avc_ime_evaluate_with_single_reference_streamin(
16568 read_only image2d_t src_image, read_only image2d_t ref_image,
16569 sampler_t vme_media_sampler, intel_sub_group_avc_ime_payload_t payload,
16570 intel_sub_group_avc_ime_single_reference_streamin_t streamin_components);
16571intel_sub_group_avc_ime_result_t
__ovld
16572intel_sub_group_avc_ime_evaluate_with_dual_reference_streamin(
16573 read_only image2d_t src_image, read_only image2d_t fwd_ref_image,
16574 read_only image2d_t bwd_ref_image, sampler_t vme_media_sampler,
16575 intel_sub_group_avc_ime_payload_t payload,
16576 intel_sub_group_avc_ime_dual_reference_streamin_t streamin_components);
16577intel_sub_group_avc_ime_result_single_reference_streamout_t
__ovld
16578intel_sub_group_avc_ime_evaluate_with_single_reference_streaminout(
16579 read_only image2d_t src_image, read_only image2d_t ref_image,
16580 sampler_t vme_media_sampler, intel_sub_group_avc_ime_payload_t payload,
16581 intel_sub_group_avc_ime_single_reference_streamin_t streamin_components);
16582intel_sub_group_avc_ime_result_dual_reference_streamout_t
__ovld
16583intel_sub_group_avc_ime_evaluate_with_dual_reference_streaminout(
16584 read_only image2d_t src_image, read_only image2d_t fwd_ref_image,
16585 read_only image2d_t bwd_ref_image, sampler_t vme_media_sampler,
16586 intel_sub_group_avc_ime_payload_t payload,
16587 intel_sub_group_avc_ime_dual_reference_streamin_t streamin_components);
16589intel_sub_group_avc_ime_single_reference_streamin_t
__ovld
16590intel_sub_group_avc_ime_get_single_reference_streamin(
16591 intel_sub_group_avc_ime_result_single_reference_streamout_t result);
16592intel_sub_group_avc_ime_dual_reference_streamin_t
__ovld
16593intel_sub_group_avc_ime_get_dual_reference_streamin(
16594 intel_sub_group_avc_ime_result_dual_reference_streamout_t result);
16595intel_sub_group_avc_ime_result_t
__ovld
16596intel_sub_group_avc_ime_strip_single_reference_streamout(
16597 intel_sub_group_avc_ime_result_single_reference_streamout_t result);
16598intel_sub_group_avc_ime_result_t
__ovld
16599intel_sub_group_avc_ime_strip_dual_reference_streamout(
16600 intel_sub_group_avc_ime_result_dual_reference_streamout_t result);
16602uint __ovld intel_sub_group_avc_ime_get_streamout_major_shape_motion_vectors(
16603 intel_sub_group_avc_ime_result_single_reference_streamout_t result,
16604 uchar major_shape);
16605ushort __ovld intel_sub_group_avc_ime_get_streamout_major_shape_distortions(
16606 intel_sub_group_avc_ime_result_single_reference_streamout_t result,
16607 uchar major_shape);
16608uchar __ovld intel_sub_group_avc_ime_get_streamout_major_shape_reference_ids(
16609 intel_sub_group_avc_ime_result_single_reference_streamout_t result,
16610 uchar major_shape);
16611uint __ovld intel_sub_group_avc_ime_get_streamout_major_shape_motion_vectors(
16612 intel_sub_group_avc_ime_result_dual_reference_streamout_t result,
16614ushort __ovld intel_sub_group_avc_ime_get_streamout_major_shape_distortions(
16615 intel_sub_group_avc_ime_result_dual_reference_streamout_t result,
16617uchar __ovld intel_sub_group_avc_ime_get_streamout_major_shape_reference_ids(
16618 intel_sub_group_avc_ime_result_dual_reference_streamout_t result,
16621uchar __ovld intel_sub_group_avc_ime_get_border_reached(
16622 uchar image_select, intel_sub_group_avc_ime_result_t result);
16623uchar __ovld intel_sub_group_avc_ime_get_truncated_search_indication(
16624 intel_sub_group_avc_ime_result_t result);
16626intel_sub_group_avc_ime_get_unidirectional_early_search_termination(
16627 intel_sub_group_avc_ime_result_t result);
16628uint __ovld intel_sub_group_avc_ime_get_weighting_pattern_minimum_motion_vector(
16629 intel_sub_group_avc_ime_result_t result);
16630ushort __ovld intel_sub_group_avc_ime_get_weighting_pattern_minimum_distortion(
16631 intel_sub_group_avc_ime_result_t result);
16634intel_sub_group_avc_ref_payload_t
__ovld
16635intel_sub_group_avc_fme_initialize(
16636 ushort2 src_coord,
ulong motion_vectors,
uchar major_shapes,
16638 uchar sad_adjustment);
16639intel_sub_group_avc_ref_payload_t
__ovld
16640intel_sub_group_avc_bme_initialize(
16641 ushort2 src_coord,
ulong motion_vectors,
uchar major_shapes,
16643 uchar bidirectional_weight,
uchar sad_adjustment);
16645intel_sub_group_avc_ref_payload_t
__ovld
16646intel_sub_group_avc_ref_set_bidirectional_mix_disable(
16647 intel_sub_group_avc_ref_payload_t payload);
16648intel_sub_group_avc_ref_payload_t
__ovld
16649intel_sub_group_avc_ref_set_bilinear_filter_enable(
16650 intel_sub_group_avc_ref_payload_t payload);
16652intel_sub_group_avc_ref_result_t
__ovld
16653intel_sub_group_avc_ref_evaluate_with_single_reference(
16654 read_only image2d_t src_image, read_only image2d_t ref_image,
16655 sampler_t vme_media_sampler, intel_sub_group_avc_ref_payload_t payload);
16656intel_sub_group_avc_ref_result_t
__ovld
16657intel_sub_group_avc_ref_evaluate_with_dual_reference(
16658 read_only image2d_t src_image, read_only image2d_t fwd_ref_image,
16659 read_only image2d_t bwd_ref_image, sampler_t vme_media_sampler,
16660 intel_sub_group_avc_ref_payload_t payload);
16661intel_sub_group_avc_ref_result_t
__ovld
16662intel_sub_group_avc_ref_evaluate_with_multi_reference(
16663 read_only image2d_t src_image,
uint packed_reference_ids,
16664 sampler_t vme_media_sampler, intel_sub_group_avc_ref_payload_t payload);
16665intel_sub_group_avc_ref_result_t
__ovld
16666intel_sub_group_avc_ref_evaluate_with_multi_reference(
16667 read_only image2d_t src_image,
uint packed_reference_ids,
16668 uchar packed_reference_field_polarities, sampler_t vme_media_sampler,
16669 intel_sub_group_avc_ref_payload_t payload);
16672intel_sub_group_avc_sic_payload_t
__ovld
16673intel_sub_group_avc_sic_initialize(
16674 ushort2 src_coord);
16675intel_sub_group_avc_sic_payload_t
__ovld
16676intel_sub_group_avc_sic_configure_skc(
16677 uint skip_block_partition_type,
uint skip_motion_vector_mask,
16678 ulong motion_vectors,
uchar bidirectional_weight,
uchar skip_sad_adjustment,
16679 intel_sub_group_avc_sic_payload_t payload);
16680intel_sub_group_avc_sic_payload_t
__ovld
16681intel_sub_group_avc_sic_configure_ipe(
16682 uchar luma_intra_partition_mask,
uchar intra_neighbour_availabilty,
16683 uchar left_edge_luma_pixels,
uchar upper_left_corner_luma_pixel,
16684 uchar upper_edge_luma_pixels,
uchar upper_right_edge_luma_pixels,
16685 uchar intra_sad_adjustment, intel_sub_group_avc_sic_payload_t payload);
16686intel_sub_group_avc_sic_payload_t
__ovld
16687intel_sub_group_avc_sic_configure_ipe(
16688 uchar luma_intra_partition_mask,
uchar intra_neighbour_availabilty,
16689 uchar left_edge_luma_pixels,
uchar upper_left_corner_luma_pixel,
16690 uchar upper_edge_luma_pixels,
uchar upper_right_edge_luma_pixels,
16691 ushort left_edge_chroma_pixels,
ushort upper_left_corner_chroma_pixel,
16692 ushort upper_edge_chroma_pixels,
uchar intra_sad_adjustment,
16693 intel_sub_group_avc_sic_payload_t payload);
16695intel_sub_group_avc_sic_get_motion_vector_mask(
16696 uint skip_block_partition_type,
uchar direction);
16698intel_sub_group_avc_sic_payload_t
__ovld
16699intel_sub_group_avc_sic_set_intra_luma_shape_penalty(
16700 uint packed_shape_cost, intel_sub_group_avc_sic_payload_t payload);
16701intel_sub_group_avc_sic_payload_t
__ovld
16702intel_sub_group_avc_sic_set_intra_luma_mode_cost_function(
16703 uchar luma_mode_penalty,
uint luma_packed_neighbor_modes,
16704 uint luma_packed_non_dc_penalty, intel_sub_group_avc_sic_payload_t payload);
16705intel_sub_group_avc_sic_payload_t
__ovld
16706intel_sub_group_avc_sic_set_intra_chroma_mode_cost_function(
16707 uchar chroma_mode_penalty, intel_sub_group_avc_sic_payload_t payload);
16709intel_sub_group_avc_sic_payload_t
__ovld
16710intel_sub_group_avc_sic_set_skc_bilinear_filter_enable(
16711 intel_sub_group_avc_sic_payload_t payload);
16712intel_sub_group_avc_sic_payload_t
__ovld
16713intel_sub_group_avc_sic_set_skc_forward_transform_enable(
16714 ulong packed_sad_coefficients, intel_sub_group_avc_sic_payload_t payload);
16715intel_sub_group_avc_sic_payload_t
__ovld
16716intel_sub_group_avc_sic_set_block_based_raw_skip_sad(
16717 uchar block_based_skip_type,
16718 intel_sub_group_avc_sic_payload_t payload);
16720intel_sub_group_avc_sic_result_t
__ovld
16721intel_sub_group_avc_sic_evaluate_ipe(
16722 read_only image2d_t src_image, sampler_t vme_media_sampler,
16723 intel_sub_group_avc_sic_payload_t payload);
16724intel_sub_group_avc_sic_result_t
__ovld
16725intel_sub_group_avc_sic_evaluate_with_single_reference(
16726 read_only image2d_t src_image, read_only image2d_t ref_image,
16727 sampler_t vme_media_sampler, intel_sub_group_avc_sic_payload_t payload);
16728intel_sub_group_avc_sic_result_t
__ovld
16729intel_sub_group_avc_sic_evaluate_with_dual_reference(
16730 read_only image2d_t src_image, read_only image2d_t fwd_ref_image,
16731 read_only image2d_t bwd_ref_image, sampler_t vme_media_sampler,
16732 intel_sub_group_avc_sic_payload_t payload);
16733intel_sub_group_avc_sic_result_t
__ovld
16734intel_sub_group_avc_sic_evaluate_with_multi_reference(
16735 read_only image2d_t src_image,
uint packed_reference_ids,
16736 sampler_t vme_media_sampler, intel_sub_group_avc_sic_payload_t payload);
16737intel_sub_group_avc_sic_result_t
__ovld
16738intel_sub_group_avc_sic_evaluate_with_multi_reference(
16739 read_only image2d_t src_image,
uint packed_reference_ids,
16740 uchar packed_reference_field_polarities, sampler_t vme_media_sampler,
16741 intel_sub_group_avc_sic_payload_t payload);
16743uchar __ovld intel_sub_group_avc_sic_get_ipe_luma_shape(
16744 intel_sub_group_avc_sic_result_t result);
16745ushort __ovld intel_sub_group_avc_sic_get_best_ipe_luma_distortion(
16746 intel_sub_group_avc_sic_result_t result);
16747ushort __ovld intel_sub_group_avc_sic_get_best_ipe_chroma_distortion(
16748 intel_sub_group_avc_sic_result_t result);
16749ulong __ovld intel_sub_group_avc_sic_get_packed_ipe_luma_modes(
16750 intel_sub_group_avc_sic_result_t result);
16751uchar __ovld intel_sub_group_avc_sic_get_ipe_chroma_mode(
16752 intel_sub_group_avc_sic_result_t result);
16753uint __ovld intel_sub_group_avc_sic_get_packed_skc_luma_count_threshold(
16754 intel_sub_group_avc_sic_result_t result);
16755ulong __ovld intel_sub_group_avc_sic_get_packed_skc_luma_sum_threshold(
16756 intel_sub_group_avc_sic_result_t result);
16757ushort __ovld intel_sub_group_avc_sic_get_inter_raw_sads(
16758 intel_sub_group_avc_sic_result_t result);
16761intel_sub_group_avc_ime_payload_t
__ovld
16762intel_sub_group_avc_ime_set_inter_base_multi_reference_penalty(
16763 uchar reference_base_penalty, intel_sub_group_avc_ime_payload_t payload);
16764intel_sub_group_avc_ref_payload_t
__ovld
16765intel_sub_group_avc_ref_set_inter_base_multi_reference_penalty(
16766 uchar reference_base_penalty, intel_sub_group_avc_ref_payload_t payload);
16767intel_sub_group_avc_sic_payload_t
__ovld
16768intel_sub_group_avc_sic_set_inter_base_multi_reference_penalty(
16769 uchar reference_base_penalty, intel_sub_group_avc_sic_payload_t payload);
16771intel_sub_group_avc_ime_payload_t
__ovld
16772intel_sub_group_avc_ime_set_inter_shape_penalty(
16773 ulong packed_shape_cost, intel_sub_group_avc_ime_payload_t payload);
16774intel_sub_group_avc_ref_payload_t
__ovld
16775intel_sub_group_avc_ref_set_inter_shape_penalty(
16776 ulong packed_shape_cost, intel_sub_group_avc_ref_payload_t payload);
16777intel_sub_group_avc_sic_payload_t
__ovld
16778intel_sub_group_avc_sic_set_inter_shape_penalty(
16779 ulong packed_shape_cost, intel_sub_group_avc_sic_payload_t payload);
16781intel_sub_group_avc_ime_payload_t
__ovld
16782intel_sub_group_avc_ime_set_inter_direction_penalty(
16783 uchar direction_cost, intel_sub_group_avc_ime_payload_t payload);
16784intel_sub_group_avc_ref_payload_t
__ovld
16785intel_sub_group_avc_ref_set_inter_direction_penalty(
16786 uchar direction_cost, intel_sub_group_avc_ref_payload_t payload);
16787intel_sub_group_avc_sic_payload_t
__ovld
16788intel_sub_group_avc_sic_set_inter_direction_penalty(
16789 uchar direction_cost, intel_sub_group_avc_sic_payload_t payload);
16791intel_sub_group_avc_ime_payload_t
__ovld
16792intel_sub_group_avc_ime_set_motion_vector_cost_function(
16793 ulong packed_cost_center_delta, uint2 packed_cost_table,
16794 uchar cost_precision, intel_sub_group_avc_ime_payload_t payload);
16795intel_sub_group_avc_ref_payload_t
__ovld
16796intel_sub_group_avc_ref_set_motion_vector_cost_function(
16797 ulong packed_cost_center_delta, uint2 packed_cost_table,
16798 uchar cost_precision, intel_sub_group_avc_ref_payload_t payload);
16799intel_sub_group_avc_sic_payload_t
__ovld
16800intel_sub_group_avc_sic_set_motion_vector_cost_function(
16801 ulong packed_cost_center_delta, uint2 packed_cost_table,
16802 uchar cost_precision, intel_sub_group_avc_sic_payload_t payload);
16804intel_sub_group_avc_ime_payload_t
__ovld
16805intel_sub_group_avc_ime_set_source_interlaced_field_polarity(
16806 uchar src_field_polarity, intel_sub_group_avc_ime_payload_t payload);
16807intel_sub_group_avc_ref_payload_t
__ovld
16808intel_sub_group_avc_ref_set_source_interlaced_field_polarity(
16809 uchar src_field_polarity, intel_sub_group_avc_ref_payload_t payload);
16810intel_sub_group_avc_sic_payload_t
__ovld
16811intel_sub_group_avc_sic_set_source_interlaced_field_polarity(
16812 uchar src_field_polarity, intel_sub_group_avc_sic_payload_t payload);
16814intel_sub_group_avc_ime_payload_t
__ovld
16815intel_sub_group_avc_ime_set_single_reference_interlaced_field_polarity(
16816 uchar ref_field_polarity, intel_sub_group_avc_ime_payload_t payload);
16817intel_sub_group_avc_ref_payload_t
__ovld
16818intel_sub_group_avc_ref_set_single_reference_interlaced_field_polarity(
16819 uchar ref_field_polarity, intel_sub_group_avc_ref_payload_t payload);
16820intel_sub_group_avc_sic_payload_t
__ovld
16821intel_sub_group_avc_sic_set_single_reference_interlaced_field_polarity(
16822 uchar ref_field_polarity, intel_sub_group_avc_sic_payload_t payload);
16823intel_sub_group_avc_ime_payload_t
__ovld
16824intel_sub_group_avc_ime_set_dual_reference_interlaced_field_polarities(
16825 uchar fwd_ref_field_polarity,
uchar bwd_ref_field_polarity,
16826 intel_sub_group_avc_ime_payload_t payload);
16827intel_sub_group_avc_ref_payload_t
__ovld
16828intel_sub_group_avc_ref_set_dual_reference_interlaced_field_polarities(
16829 uchar fwd_ref_field_polarity,
uchar bwd_ref_field_polarity,
16830 intel_sub_group_avc_ref_payload_t payload);
16831intel_sub_group_avc_sic_payload_t
__ovld
16832intel_sub_group_avc_sic_set_dual_reference_interlaced_field_polarities(
16833 uchar fwd_ref_field_polarity,
uchar bwd_ref_field_polarity,
16834 intel_sub_group_avc_sic_payload_t payload);
16836intel_sub_group_avc_ime_payload_t
__ovld
16837intel_sub_group_avc_ime_set_ac_only_haar(
16838 intel_sub_group_avc_ime_payload_t payload);
16839intel_sub_group_avc_ref_payload_t
__ovld
16840intel_sub_group_avc_ref_set_ac_only_haar(
16841 intel_sub_group_avc_ref_payload_t payload);
16842intel_sub_group_avc_sic_payload_t
__ovld
16843intel_sub_group_avc_sic_set_ac_only_haar(
16844 intel_sub_group_avc_sic_payload_t payload);
16846ulong __ovld intel_sub_group_avc_ime_get_motion_vectors(
16847 intel_sub_group_avc_ime_result_t result);
16848ulong __ovld intel_sub_group_avc_ref_get_motion_vectors(
16849 intel_sub_group_avc_ref_result_t result);
16851ushort __ovld intel_sub_group_avc_ime_get_inter_distortions(
16852 intel_sub_group_avc_ime_result_t result);
16853ushort __ovld intel_sub_group_avc_ref_get_inter_distortions(
16854 intel_sub_group_avc_ref_result_t result);
16855ushort __ovld intel_sub_group_avc_sic_get_inter_distortions(
16856 intel_sub_group_avc_sic_result_t result);
16858ushort __ovld intel_sub_group_avc_ime_get_best_inter_distortion(
16859 intel_sub_group_avc_ime_result_t result);
16860ushort __ovld intel_sub_group_avc_ref_get_best_inter_distortion(
16861 intel_sub_group_avc_ref_result_t result);
16863uchar __ovld intel_sub_group_avc_ime_get_inter_major_shape(
16864 intel_sub_group_avc_ime_result_t result);
16865uchar __ovld intel_sub_group_avc_ref_get_inter_major_shape(
16866 intel_sub_group_avc_ref_result_t result);
16867uchar __ovld intel_sub_group_avc_ime_get_inter_minor_shapes(
16868 intel_sub_group_avc_ime_result_t result);
16869uchar __ovld intel_sub_group_avc_ref_get_inter_minor_shapes(
16870 intel_sub_group_avc_ref_result_t result);
16872uchar __ovld intel_sub_group_avc_ime_get_inter_directions(
16873 intel_sub_group_avc_ime_result_t result);
16874uchar __ovld intel_sub_group_avc_ref_get_inter_directions(
16875 intel_sub_group_avc_ref_result_t result);
16877uchar __ovld intel_sub_group_avc_ime_get_inter_motion_vector_count(
16878 intel_sub_group_avc_ime_result_t result);
16879uchar __ovld intel_sub_group_avc_ref_get_inter_motion_vector_count(
16880 intel_sub_group_avc_ref_result_t result);
16882uint __ovld intel_sub_group_avc_ime_get_inter_reference_ids(
16883 intel_sub_group_avc_ime_result_t result);
16884uint __ovld intel_sub_group_avc_ref_get_inter_reference_ids(
16885 intel_sub_group_avc_ref_result_t result);
16888intel_sub_group_avc_ime_get_inter_reference_interlaced_field_polarities(
16889 uint packed_reference_ids,
uint packed_reference_parameter_field_polarities,
16890 intel_sub_group_avc_ime_result_t result);
16892intel_sub_group_avc_ref_get_inter_reference_interlaced_field_polarities(
16893 uint packed_reference_ids,
uint packed_reference_parameter_field_polarities,
16894 intel_sub_group_avc_ref_result_t result);
16897intel_sub_group_avc_mce_payload_t
__ovld
16898intel_sub_group_avc_ime_convert_to_mce_payload(
16899 intel_sub_group_avc_ime_payload_t payload);
16900intel_sub_group_avc_ime_payload_t
__ovld
16901intel_sub_group_avc_mce_convert_to_ime_payload(
16902 intel_sub_group_avc_mce_payload_t payload);
16903intel_sub_group_avc_mce_payload_t
__ovld
16904intel_sub_group_avc_ref_convert_to_mce_payload(
16905 intel_sub_group_avc_ref_payload_t payload);
16906intel_sub_group_avc_ref_payload_t
__ovld
16907intel_sub_group_avc_mce_convert_to_ref_payload(
16908 intel_sub_group_avc_mce_payload_t payload);
16909intel_sub_group_avc_mce_payload_t
__ovld
16910intel_sub_group_avc_sic_convert_to_mce_payload(
16911 intel_sub_group_avc_sic_payload_t payload);
16912intel_sub_group_avc_sic_payload_t
__ovld
16913intel_sub_group_avc_mce_convert_to_sic_payload(
16914 intel_sub_group_avc_mce_payload_t payload);
16916intel_sub_group_avc_mce_result_t
__ovld
16917intel_sub_group_avc_ime_convert_to_mce_result(
16918 intel_sub_group_avc_ime_result_t result);
16919intel_sub_group_avc_ime_result_t
__ovld
16920intel_sub_group_avc_mce_convert_to_ime_result(
16921 intel_sub_group_avc_mce_result_t result);
16922intel_sub_group_avc_mce_result_t
__ovld
16923intel_sub_group_avc_ref_convert_to_mce_result(
16924 intel_sub_group_avc_ref_result_t result);
16925intel_sub_group_avc_ref_result_t
__ovld
16926intel_sub_group_avc_mce_convert_to_ref_result(
16927 intel_sub_group_avc_mce_result_t result);
16928intel_sub_group_avc_mce_result_t
__ovld
16929intel_sub_group_avc_sic_convert_to_mce_result(
16930 intel_sub_group_avc_sic_result_t result);
16931intel_sub_group_avc_sic_result_t
__ovld
16932intel_sub_group_avc_mce_convert_to_sic_result(
16933 intel_sub_group_avc_mce_result_t result);
16934#pragma OPENCL EXTENSION cl_intel_device_side_avc_motion_estimation : end
16937#ifdef cl_amd_media_ops
16939uint2
__ovld amd_bitalign(uint2 a, uint2
b, uint2
c);
16940uint3
__ovld amd_bitalign(uint3 a, uint3
b, uint3
c);
16941uint4
__ovld amd_bitalign(uint4 a, uint4
b, uint4
c);
16946uint2
__ovld amd_bytealign(uint2 a, uint2
b, uint2
c);
16947uint3
__ovld amd_bytealign(uint3 a, uint3
b, uint3
c);
16948uint4
__ovld amd_bytealign(uint4 a, uint4
b, uint4
c);
16953uint2
__ovld amd_lerp(uint2 a, uint2
b, uint2
c);
16954uint3
__ovld amd_lerp(uint3 a, uint3
b, uint3
c);
16955uint4
__ovld amd_lerp(uint4 a, uint4
b, uint4
c);
16964uint2
__ovld amd_sadhi(uint2 a, uint2
b, uint2
c);
16965uint3
__ovld amd_sadhi(uint3 a, uint3
b, uint3
c);
16966uint4
__ovld amd_sadhi(uint4 a, uint4
b, uint4
c);
16971uint2
__ovld amd_sad(uint2 a, uint2
b, uint2
c);
16972uint3
__ovld amd_sad(uint3 a, uint3
b, uint3
c);
16973uint4
__ovld amd_sad(uint4 a, uint4
b, uint4
c);
16978float2
__ovld amd_unpack0(uint2 a);
16979float3
__ovld amd_unpack0(uint3 a);
16980float4
__ovld amd_unpack0(uint4 a);
16985float2
__ovld amd_unpack1(uint2 a);
16986float3
__ovld amd_unpack1(uint3 a);
16987float4
__ovld amd_unpack1(uint4 a);
16992float2
__ovld amd_unpack2(uint2 a);
16993float3
__ovld amd_unpack2(uint3 a);
16994float4
__ovld amd_unpack2(uint4 a);
16999float2
__ovld amd_unpack3(uint2 a);
17000float3
__ovld amd_unpack3(uint3 a);
17001float4
__ovld amd_unpack3(uint4 a);
17006#ifdef cl_amd_media_ops2
17008int2
__ovld amd_bfe(int2 src0, uint2 src1, uint2 src2);
17009int3
__ovld amd_bfe(int3 src0, uint3 src1, uint3 src2);
17010int4
__ovld amd_bfe(int4 src0, uint4 src1, uint4 src2);
17015uint2
__ovld amd_bfe(uint2 src0, uint2 src1, uint2 src2);
17016uint3
__ovld amd_bfe(uint3 src0, uint3 src1, uint3 src2);
17017uint4
__ovld amd_bfe(uint4 src0, uint4 src1, uint4 src2);
17022uint2
__ovld amd_bfm(uint2 src0, uint2 src1);
17023uint3
__ovld amd_bfm(uint3 src0, uint3 src1);
17024uint4
__ovld amd_bfm(uint4 src0, uint4 src1);
17028float __ovld amd_max3(
float src0,
float src1,
float src2);
17029float2
__ovld amd_max3(float2 src0, float2 src1, float2 src2);
17030float3
__ovld amd_max3(float3 src0, float3 src1, float3 src2);
17031float4
__ovld amd_max3(float4 src0, float4 src1, float4 src2);
17032float8
__ovld amd_max3(float8 src0, float8 src1, float8 src2);
17033float16
__ovld amd_max3(float16 src0, float16 src1, float16 src2);
17035int __ovld amd_max3(
int src0,
int src1,
int src2);
17036int2
__ovld amd_max3(int2 src0, int2 src1, int2 src2);
17037int3
__ovld amd_max3(int3 src0, int3 src1, int3 src2);
17038int4
__ovld amd_max3(int4 src0, int4 src1, int4 src2);
17043uint2
__ovld amd_max3(uint2 src0, uint2 src1, uint2 src2);
17044uint3
__ovld amd_max3(uint3 src0, uint3 src1, uint3 src2);
17045uint4
__ovld amd_max3(uint4 src0, uint4 src1, uint4 src2);
17049float __ovld amd_median3(
float src0,
float src1,
float src2);
17050float2
__ovld amd_median3(float2 src0, float2 src1, float2 src2);
17051float3
__ovld amd_median3(float3 src0, float3 src1, float3 src2);
17052float4
__ovld amd_median3(float4 src0, float4 src1, float4 src2);
17053float8
__ovld amd_median3(float8 src0, float8 src1, float8 src2);
17054float16
__ovld amd_median3(float16 src0, float16 src1, float16 src2);
17056int __ovld amd_median3(
int src0,
int src1,
int src2);
17057int2
__ovld amd_median3(int2 src0, int2 src1, int2 src2);
17058int3
__ovld amd_median3(int3 src0, int3 src1, int3 src2);
17059int4
__ovld amd_median3(int4 src0, int4 src1, int4 src2);
17064uint2
__ovld amd_median3(uint2 src0, uint2 src1, uint2 src2);
17065uint3
__ovld amd_median3(uint3 src0, uint3 src1, uint3 src2);
17066uint4
__ovld amd_median3(uint4 src0, uint4 src1, uint4 src2);
17070float __ovld amd_min3(
float src0,
float src1,
float src);
17071float2
__ovld amd_min3(float2 src0, float2 src1, float2 src);
17072float3
__ovld amd_min3(float3 src0, float3 src1, float3 src);
17073float4
__ovld amd_min3(float4 src0, float4 src1, float4 src);
17074float8
__ovld amd_min3(float8 src0, float8 src1, float8 src);
17075float16
__ovld amd_min3(float16 src0, float16 src1, float16 src);
17077int __ovld amd_min3(
int src0,
int src1,
int src2);
17078int2
__ovld amd_min3(int2 src0, int2 src1, int2 src2);
17079int3
__ovld amd_min3(int3 src0, int3 src1, int3 src2);
17080int4
__ovld amd_min3(int4 src0, int4 src1, int4 src2);
17085uint2
__ovld amd_min3(uint2 src0, uint2 src1, uint2 src2);
17086uint3
__ovld amd_min3(uint3 src0, uint3 src1, uint3 src2);
17087uint4
__ovld amd_min3(uint4 src0, uint4 src1, uint4 src2);
17092ulong2
__ovld amd_mqsad(ulong2 src0, uint2 src1, ulong2 src2);
17093ulong3
__ovld amd_mqsad(ulong3 src0, uint3 src1, ulong3 src2);
17094ulong4
__ovld amd_mqsad(ulong4 src0, uint4 src1, ulong4 src2);
17095ulong8
__ovld amd_mqsad(ulong8 src0,
uint8 src1, ulong8 src2);
17096ulong16
__ovld amd_mqsad(ulong16 src0,
uint16 src1, ulong16 src2);
17099ulong2
__ovld amd_qsad(ulong2 src0, uint2 src1, ulong2 src2);
17100ulong3
__ovld amd_qsad(ulong3 src0, uint3 src1, ulong3 src2);
17101ulong4
__ovld amd_qsad(ulong4 src0, uint4 src1, ulong4 src2);
17102ulong8
__ovld amd_qsad(ulong8 src0,
uint8 src1, ulong8 src2);
17103ulong16
__ovld amd_qsad(ulong16 src0,
uint16 src1, ulong16 src2);
17106uint2
__ovld amd_msad(uint2 src0, uint2 src1, uint2 src2);
17107uint3
__ovld amd_msad(uint3 src0, uint3 src1, uint3 src2);
17108uint4
__ovld amd_msad(uint4 src0, uint4 src1, uint4 src2);
17113uint2
__ovld amd_sadd(uint2 src0, uint2 src1, uint2 src2);
17114uint3
__ovld amd_sadd(uint3 src0, uint3 src1, uint3 src2);
17115uint4
__ovld amd_sadd(uint4 src0, uint4 src1, uint4 src2);
17120uint2
__ovld amd_sadw(uint2 src0, uint2 src1, uint2 src2);
17121uint3
__ovld amd_sadw(uint3 src0, uint3 src1, uint3 src2);
17122uint4
__ovld amd_sadw(uint4 src0, uint4 src1, uint4 src2);
17127#if defined(cl_arm_integer_dot_product_int8)
17128#pragma OPENCL EXTENSION cl_arm_integer_dot_product_int8 : begin
17130int __ovld arm_dot(char4 a, char4
b);
17131#pragma OPENCL EXTENSION cl_arm_integer_dot_product_int8 : end
17134#if defined(cl_arm_integer_dot_product_accumulate_int8)
17135#pragma OPENCL EXTENSION cl_arm_integer_dot_product_accumulate_int8 : begin
17137int __ovld arm_dot_acc(char4 a, char4
b,
int c);
17138#pragma OPENCL EXTENSION cl_arm_integer_dot_product_accumulate_int8 : end
17141#if defined(cl_arm_integer_dot_product_accumulate_int16)
17142#pragma OPENCL EXTENSION cl_arm_integer_dot_product_accumulate_int16 : begin
17144int __ovld arm_dot_acc(short2 a, short2
b,
int c);
17145#pragma OPENCL EXTENSION cl_arm_integer_dot_product_accumulate_int16 : end
17148#if defined(cl_arm_integer_dot_product_accumulate_saturate_int8)
17149#pragma OPENCL EXTENSION cl_arm_integer_dot_product_accumulate_saturate_int8 : begin
17151int __ovld arm_dot_acc_sat(char4 a, char4
b,
int c);
17152#pragma OPENCL EXTENSION cl_arm_integer_dot_product_accumulate_saturate_int8 : end
17156#pragma OPENCL EXTENSION all : disable
_Float16 __2f16 __attribute__((ext_vector_type(2)))
Zeroes the upper 128 bits (bits 255:128) of all YMM registers.
__device__ __2f16 float c
__INTPTR_TYPE__ intptr_t
A signed integer type with the property that any valid pointer to void can be converted to this type,...
__UINTPTR_TYPE__ uintptr_t
An unsigned integer type with the property that any valid pointer to void can be converted to this ty...
unsigned char uchar
An unsigned 8-bit integer.
__PTRDIFF_TYPE__ ptrdiff_t
A signed integer type that is the result of subtracting two pointers.
unsigned long ulong
An unsigned 64-bit integer.
unsigned int uint
An unsigned 32-bit integer.
unsigned short ushort
An unsigned 16-bit integer.
int4 __ovld __cnfn convert_int4_rte(char4)
uint8 __ovld __cnfn convert_uint8_rte(char8)
long __ovld __cnfn convert_long_rtp(char)
long2 __ovld __cnfn convert_long2_sat_rtp(char2)
float8 __ovld vloada_half8(size_t offset, const __constant half *p)
void __ovld vstorea_half3_rtz(float3 data, size_t offset, half *p)
void __ovld vstore_half_rtp(float data, size_t offset, half *p)
char __ovld __cnfn bitselect(char a, char b, char c)
Each bit of the result is the corresponding bit of a if the corresponding bit of c is 0.
char2 __ovld __cnfn convert_char2_rtp(char2)
short8 __ovld __cnfn convert_short8_sat_rte(char8)
uchar8 __ovld __cnfn convert_uchar8_rtp(char8)
ulong16 __ovld __cnfn convert_ulong16_sat(char16)
float __ovld vloada_half(size_t offset, const __constant half *p)
For n = 1, 2, 4, 8 and 16 read sizeof (halfn) bytes of data from address (p + (offset * n)).
uchar __ovld __cnfn convert_uchar(char)
ulong8 __ovld __cnfn convert_ulong8_rte(char8)
void __ovld vstorea_half8_rte(float8 data, size_t offset, half *p)
int16 __ovld __cnfn convert_int16_sat_rtn(char16)
int3 __ovld __cnfn convert_int3_rtn(char3)
float __ovld __cnfn native_powr(float x, float y)
Compute x to the power y, where x is >= 0.
short4 __ovld __cnfn convert_short4_rtp(char4)
void __ovld vstore2(char2 data, size_t offset, char *p)
char __ovld __cnfn mul_hi(char x, char y)
Computes x * y and returns the high half of the product of x and y.
void __ovld vstorea_half_rtp(float data, size_t offset, half *p)
ulong2 __ovld __cnfn convert_ulong2_rtn(char2)
ushort8 __ovld __cnfn convert_ushort8_rtn(char8)
void __ovld vstorea_half2_rtz(float2 data, size_t offset, half *p)
uint16 __ovld __cnfn convert_uint16_sat_rtp(char16)
float __ovld __cnfn acospi(float x)
Compute acos (x) / PI.
float4 __ovld __cnfn cross(float4 p0, float4 p1)
Returns the cross product of p0.xyz and p1.xyz.
char __ovld __cnfn mad_sat(char a, char b, char c)
Returns a * b + c and saturates the result.
float16 __ovld vload_half16(size_t offset, const __constant half *p)
char __ovld __cnfn sub_sat(char x, char y)
Returns x - y and saturates the result.
int3 __ovld __cnfn convert_int3_rtp(char3)
char3 __ovld __cnfn convert_char3_sat(char3)
char4 __ovld __cnfn convert_char4_sat(char4)
long __ovld __cnfn convert_long_rtz(char)
ushort8 __ovld __cnfn convert_ushort8_sat_rtn(char8)
uint __ovld __cnfn convert_uint_sat_rtn(char)
uint16 __ovld __cnfn convert_uint16_sat_rtn(char16)
uchar8 __ovld __cnfn convert_uchar8(char8)
float __ovld __cnfn half_sin(float x)
Compute sine.
uchar2 __ovld __cnfn convert_uchar2_sat(char2)
void __ovld vstore_half2_rtz(float2 data, size_t offset, half *p)
float __ovld __cnfn radians(float degrees)
Converts degrees to radians, i.e.
int3 __ovld __cnfn convert_int3(char3)
short __ovld __cnfn convert_short_sat_rtn(char)
size_t __ovld __cnfn get_global_size(uint dimindx)
Returns the number of global work-items specified for dimension identified by dimindx.
uchar2 __ovld __cnfn convert_uchar2_rte(char2)
uchar16 __ovld __cnfn convert_uchar16_sat_rtn(char16)
ulong4 __ovld __cnfn convert_ulong4_rtp(char4)
ushort3 __ovld __cnfn convert_ushort3_rtz(char3)
int __ovld __cnfn get_image_depth(read_only image3d_t image)
Return the image depth in pixels.
int16 __ovld __cnfn convert_int16_sat(char16)
void __ovld vstore_half16_rte(float16 data, size_t offset, half *p)
char4 __ovld __cnfn convert_char4_rte(char4)
int2 __ovld __cnfn convert_int2_sat_rtz(char2)
float __ovld __cnfn half_cos(float x)
Compute cosine.
void __ovld set_user_event_status(clk_event_t e, int state)
void __ovld mem_fence(cl_mem_fence_flags flags)
Orders loads and stores of a work-item executing a kernel.
float __ovld __cnfn convert_float_rte(char)
int __ovld __cnfn islessequal(float x, float y)
Returns the component-wise compare of x <= y.
ulong __ovld __cnfn convert_ulong_rtz(char)
float2 __ovld __cnfn convert_float2_rtp(char2)
short4 __ovld __cnfn convert_short4_sat_rtn(char4)
short2 __ovld __cnfn convert_short2_rtz(char2)
void __ovld write_imageui(write_only image2d_t image, int2 coord, uint4 color)
char8 __ovld __cnfn convert_char8_sat_rte(char8)
float __ovld __cnfn maxmag(float x, float y)
Returns x if | x | > | y |, y if | y | > | x |, otherwise fmax(x, y).
ushort8 __ovld __cnfn convert_ushort8_sat_rtp(char8)
int3 __ovld __cnfn convert_int3_rtz(char3)
float __ovld __cnfn native_log(float x)
Compute natural logarithm over an implementationdefined range.
ushort8 __ovld __cnfn convert_ushort8_sat_rtz(char8)
int __ovld __cnfn isnotequal(float x, float y)
Returns the component-wise compare of x != y.
char8 __ovld __cnfn convert_char8_sat_rtn(char8)
int2 __ovld __cnfn convert_int2_sat(char2)
float __ovld __cnfn atan2pi(float y, float x)
Compute atan2 (y, x) / PI.
float __ovld __cnfn normalize(float p)
Returns a vector in the same direction as p but with a length of 1.
float __ovld __cnfn distance(float p0, float p1)
Returns the distance between p0 and p1.
void __ovld vstore_half4_rtp(float4 data, size_t offset, half *p)
int __ovld atomic_fetch_max_explicit(volatile atomic_int *object, int operand, memory_order order)
void __ovld vstore_half8(float8 data, size_t offset, half *p)
ushort3 __ovld __cnfn convert_ushort3_rtn(char3)
float4 __ovld __cnfn convert_float4(char4)
ulong8 __ovld __cnfn convert_ulong8_rtp(char8)
size_t __ovld __cnfn get_local_id(uint dimindx)
Returns the unique local work-item ID i.e.
uint3 __ovld __cnfn convert_uint3_rtn(char3)
ushort3 __ovld __cnfn convert_ushort3_sat_rtn(char3)
long2 __ovld __cnfn convert_long2_sat(char2)
ushort3 __ovld __cnfn convert_ushort3_rte(char3)
ulong16 __ovld __cnfn convert_ulong16_sat_rtp(char16)
int __ovld atomic_or(volatile __global int *p, int val)
Read the 32-bit value (referred to as old) stored at location pointed by p.
void __ovld vstore8(char8 data, size_t offset, char *p)
float2 __ovld vload_half2(size_t offset, const __constant half *p)
Read sizeof (halfn) bytes of data from address (p + (offset * n)).
char8 __ovld __cnfn convert_char8(char8)
int printf(__constant const char *st,...) __attribute__((format(printf
char __ovld __cnfn convert_char_sat(char)
ulong3 __ovld __cnfn convert_ulong3_sat_rtn(char3)
uchar __ovld __cnfn abs_diff(char x, char y)
Returns | x - y | without modulo overflow.
ushort __ovld __cnfn convert_ushort_rtn(char)
uint4 __ovld __cnfn convert_uint4_rtz(char4)
float16 __ovld __cnfn convert_float16_rtn(char16)
short3 __ovld __cnfn convert_short3_rtp(char3)
int __ovld __cnfn convert_int_sat_rtz(char)
float __ovld __cnfn sign(float x)
Returns 1.0 if x > 0, -0.0 if x = -0.0, +0.0 if x = +0.0, or -1.0 if x < 0.
int16 __ovld __cnfn convert_int16(char16)
float __ovld __cnfn native_sin(float x)
Compute sine over an implementation-defined range.
uint __ovld __cnfn convert_uint_rtz(char)
ushort8 __ovld __cnfn convert_ushort8_rte(char8)
long3 __ovld __cnfn convert_long3_sat_rtz(char3)
short16 __ovld __cnfn convert_short16_sat_rte(char16)
ulong8 __ovld __cnfn convert_ulong8_sat_rtn(char8)
ushort3 __ovld __cnfn convert_ushort3_sat(char3)
int8 __ovld __cnfn convert_int8_sat(char8)
void __ovld vstorea_half16(float16 data, size_t offset, half *p)
float3 __ovld __cnfn convert_float3_rtp(char3)
int16 __ovld __cnfn convert_int16_rtp(char16)
float __ovld __cnfn half_recip(float x)
Compute reciprocal.
void __ovld vstore_half3_rtp(float3 data, size_t offset, half *p)
char2 __ovld __cnfn shuffle(char2 x, uchar2 mask)
The shuffle and shuffle2 built-in functions construct a permutation of elements from one or two input...
void __ovld vstore_half3_rtn(float3 data, size_t offset, half *p)
ulong4 __ovld __cnfn convert_ulong4_sat_rtn(char4)
uchar2 __ovld __cnfn convert_uchar2_sat_rtp(char2)
char4 __ovld vload4(size_t offset, const __constant char *p)
void __ovld vstore16(char16 data, size_t offset, char *p)
uchar __ovld __cnfn abs(char x)
Returns | x |.
void __ovld vstorea_half_rte(float data, size_t offset, half *p)
ulong2 __ovld __cnfn convert_ulong2_sat_rtz(char2)
int4 __ovld __cnfn convert_int4_sat_rtz(char4)
ushort8 __ovld __cnfn convert_ushort8_sat(char8)
int __ovld atomic_xchg(volatile __global int *p, int val)
Swaps the old value stored at location p with new value given by val.
uint3 __ovld __cnfn convert_uint3_sat(char3)
void __ovld vstorea_half4_rte(float4 data, size_t offset, half *p)
size_t __ovld __cnfn get_num_groups(uint dimindx)
Returns the number of work-groups that will execute a kernel for dimension identified by dimindx.
void __ovld write_mem_fence(cl_mem_fence_flags flags)
Write memory barrier that orders only stores.
int __ovld atomic_sub(volatile __global int *p, int val)
Read the 32-bit value (referred to as old) stored at location pointed by p.
ulong4 __ovld __cnfn convert_ulong4_sat(char4)
float __ovld __cnfn nan(uint nancode)
Returns a quiet NaN.
int16 __ovld __cnfn convert_int16_sat_rtp(char16)
char16 __ovld __cnfn convert_char16_sat_rtz(char16)
uint __ovld __cnfn convert_uint_sat(char)
ushort4 __ovld __cnfn convert_ushort4_sat_rtn(char4)
void __ovld vstore_half3_rtz(float3 data, size_t offset, half *p)
float3 __ovld __cnfn convert_float3_rtn(char3)
int __ovld __cnfn isgreater(float x, float y)
Returns the component-wise compare of x > y.
long16 __ovld __cnfn convert_long16(char16)
short16 __ovld __cnfn convert_short16_rtn(char16)
float __ovld __cnfn atanpi(float x)
Compute atan (x) / PI.
char __ovld __cnfn rotate(char v, char i)
For each element in v, the bits are shifted left by the number of bits given by the corresponding ele...
short2 __ovld __cnfn convert_short2_rtp(char2)
uchar8 __ovld __cnfn convert_uchar8_rtz(char8)
float __ovld __cnfn native_recip(float x)
Compute reciprocal over an implementation-defined range.
int __ovld atomic_add(volatile __global int *p, int val)
Read the 32-bit value (referred to as old) stored at location pointed by p.
int __ovld __cnfn convert_int_rtz(char)
char16 __ovld __cnfn convert_char16_rtz(char16)
ushort16 __ovld __cnfn convert_ushort16_rte(char16)
int2 __ovld __cnfn convert_int2_sat_rtp(char2)
float __ovld __cnfn native_rsqrt(float x)
Compute inverse square root over an implementationdefined range.
void __ovld __conv barrier(cl_mem_fence_flags flags)
All work-items in a work-group executing the kernel on a processor must execute this function before ...
char __ovld __cnfn convert_char_sat_rtn(char)
short2 __ovld __cnfn convert_short2(char2)
short2 __ovld __cnfn convert_short2_sat_rtp(char2)
int __ovld __cnfn convert_int_rtn(char)
ushort __ovld __cnfn convert_ushort_sat_rtz(char)
long4 __ovld __cnfn convert_long4(char4)
short16 __ovld __cnfn convert_short16_sat(char16)
uchar3 __ovld __cnfn convert_uchar3_rtn(char3)
short8 __ovld __cnfn convert_short8(char8)
float __ovld __cnfn length(float p)
Return the length of vector p, i.e., sqrt(p.x2 + p.y 2 + ...)
ulong2 __ovld __cnfn convert_ulong2_sat(char2)
float __ovld __cnfn rootn(float x, int y)
Compute x to the power 1/y.
ulong3 __ovld __cnfn convert_ulong3_sat_rte(char3)
void __ovld vstore_half2_rte(float2 data, size_t offset, half *p)
short4 __ovld __cnfn convert_short4_sat_rte(char4)
float __ovld __cnfn sinpi(float x)
Compute sin (PI * x).
ulong8 __ovld __cnfn convert_ulong8_sat(char8)
char2 __ovld __cnfn convert_char2_sat_rtp(char2)
uint __ovld __cnfn convert_uint_sat_rte(char)
uint8 __ovld __cnfn convert_uint8_sat_rte(char8)
float __ovld __cnfn native_exp10(float x)
Compute the base- 10 exponential of x over an implementation-defined range.
int16 __ovld __cnfn convert_int16_rte(char16)
char16 __ovld __cnfn convert_char16_sat_rtn(char16)
ulong __ovld __cnfn convert_ulong_sat_rte(char)
float __ovld __cnfn convert_float_rtp(char)
ulong2 __ovld __cnfn convert_ulong2_sat_rtp(char2)
uint3 __ovld __cnfn convert_uint3_rtp(char3)
float16 __ovld __cnfn convert_float16_rtp(char16)
short4 __ovld __cnfn convert_short4_sat_rtz(char4)
int3 __ovld __cnfn convert_int3_sat_rtz(char3)
ushort3 __ovld __cnfn convert_ushort3_sat_rte(char3)
ulong __ovld __cnfn convert_ulong_sat(char)
long3 __ovld __cnfn convert_long3_sat(char3)
ulong4 __ovld __cnfn convert_ulong4_sat_rtz(char4)
long8 __ovld __cnfn convert_long8_sat_rte(char8)
int4 __ovld __cnfn convert_int4(char4)
ushort8 __ovld __cnfn convert_ushort8_rtz(char8)
short __ovld __cnfn convert_short_sat_rtp(char)
ulong4 __ovld __cnfn convert_ulong4_rtn(char4)
void __ovld vstorea_half4(float4 data, size_t offset, half *p)
long16 __ovld __cnfn convert_long16_rtn(char16)
uint __ovld __cnfn convert_uint_rtn(char)
short2 __ovld __cnfn convert_short2_rte(char2)
void __ovld vstore_half4_rte(float4 data, size_t offset, half *p)
float __ovld __cnfn half_powr(float x, float y)
Compute x to the power y, where x is >= 0.
ulong3 __ovld __cnfn convert_ulong3_rtp(char3)
char __ovld __cnfn clz(char x)
Returns the number of leading 0-bits in x, starting at the most significant bit position.
ulong16 __ovld __cnfn convert_ulong16_rtz(char16)
int2 __ovld __cnfn convert_int2_rte(char2)
void __ovld vstorea_half16_rtz(float16 data, size_t offset, half *p)
float8 __ovld __cnfn convert_float8_rte(char8)
uchar3 __ovld __cnfn convert_uchar3(char3)
char2 __ovld __cnfn shuffle2(char2 x, char2 y, uchar2 mask)
float __ovld __cnfn convert_float_rtz(char)
char4 __ovld __cnfn convert_char4_sat_rte(char4)
float __ovld __cnfn exp10(float)
Exponential base 10 function.
char __ovld __cnfn convert_char(char)
ushort16 __ovld __cnfn convert_ushort16_sat_rte(char16)
void __ovld vstorea_half8_rtp(float8 data, size_t offset, half *p)
queue_t __ovld get_default_queue(void)
int __ovld __cnfn isinf(float)
Test for infinity value (+ve or -ve) .
int __ovld atomic_fetch_max(volatile atomic_int *object, int operand)
ushort3 __ovld __cnfn convert_ushort3_sat_rtz(char3)
short __ovld __cnfn convert_short_rtp(char)
void __ovld wait_group_events(int num_events, event_t *event_list)
Wait for events that identify the async_work_group_copy operations to complete.
uchar __ovld __cnfn convert_uchar_rte(char)
void __ovld release_event(clk_event_t)
float8 __ovld vload_half8(size_t offset, const __constant half *p)
float3 __ovld __cnfn convert_float3_rtz(char3)
long __ovld __cnfn convert_long_rte(char)
float2 __ovld vloada_half2(size_t offset, const __constant half *p)
short8 __ovld __cnfn convert_short8_rtz(char8)
size_t __ovld get_global_linear_id(void)
char __ovld __cnfn convert_char_sat_rtz(char)
int __ovld __cnfn convert_int_rtp(char)
long3 __ovld __cnfn convert_long3_sat_rtp(char3)
uchar __ovld __cnfn convert_uchar_rtp(char)
void __ovld __conv work_group_barrier(cl_mem_fence_flags flags, memory_scope scope)
ulong4 __ovld __cnfn convert_ulong4(char4)
uint4 __ovld __cnfn convert_uint4_sat(char4)
ulong2 __ovld __cnfn convert_ulong2(char2)
long2 __ovld __cnfn convert_long2_rtn(char2)
int __ovld __cnfn isequal(float x, float y)
intn isequal (floatn x, floatn y) Returns the component-wise compare of x == y.
long16 __ovld __cnfn convert_long16_rtp(char16)
void __ovld vstorea_half8(float8 data, size_t offset, half *p)
int __ovld atomic_and(volatile __global int *p, int val)
Read the 32-bit value (referred to as old) stored at location pointed by p.
ushort16 __ovld __cnfn convert_ushort16_sat_rtn(char16)
long3 __ovld __cnfn convert_long3_sat_rtn(char3)
uint2 __ovld __cnfn convert_uint2_rtp(char2)
uint3 __ovld __cnfn convert_uint3(char3)
size_t __ovld __cnfn get_global_id(uint dimindx)
Returns the unique global work-item ID value for dimension identified by dimindx.
ushort4 __ovld __cnfn convert_ushort4_sat(char4)
short __ovld __cnfn convert_short_rtz(char)
uint8 __ovld __cnfn convert_uint8_sat_rtn(char8)
uchar __ovld __cnfn convert_uchar_sat(char)
float8 __ovld __cnfn convert_float8_rtn(char8)
short4 __ovld __cnfn convert_short4_sat(char4)
float4 __ovld __cnfn convert_float4_rte(char4)
uchar4 __ovld __cnfn convert_uchar4_rtz(char4)
char4 __ovld __cnfn convert_char4_rtp(char4)
uchar16 __ovld __cnfn convert_uchar16_sat(char16)
long8 __ovld __cnfn convert_long8_sat_rtp(char8)
short3 __ovld __cnfn convert_short3_rte(char3)
uint3 __ovld __cnfn convert_uint3_sat_rtz(char3)
float __ovld __cnfn native_cos(float x)
Compute cosine over an implementation-defined range.
void __ovld capture_event_profiling_info(clk_event_t, clk_profiling_info, __global void *value)
char3 __ovld __cnfn convert_char3_sat_rtp(char3)
int __ovld __cnfn isless(float x, float y)
Returns the component-wise compare of x < y.
float __ovld __cnfn half_log10(float x)
Compute a base 10 logarithm.
ushort16 __ovld __cnfn convert_ushort16(char16)
float __ovld __cnfn half_exp2(float x)
Compute the base- 2 exponential of x.
float __ovld __cnfn native_exp2(float x)
Compute the base- 2 exponential of x over an implementation-defined range.
long4 __ovld __cnfn convert_long4_sat_rtp(char4)
uint8 __ovld __cnfn convert_uint8_rtn(char8)
size_t __ovld __cnfn get_global_offset(uint dimindx)
get_global_offset returns the offset values specified in global_work_offset argument to clEnqueueNDRa...
int __ovld __conv work_group_scan_exclusive_min(int x)
void __ovld vstore_half16_rtz(float16 data, size_t offset, half *p)
float8 __ovld __cnfn convert_float8(char8)
void __ovld vstorea_half4_rtn(float4 data, size_t offset, half *p)
int __ovld __cnfn any(char x)
Returns 1 if the most significant bit in any component of x is set; otherwise returns 0.
float16 __ovld __cnfn convert_float16(char16)
char8 __ovld __cnfn convert_char8_rtp(char8)
short3 __ovld __cnfn convert_short3_rtz(char3)
char16 __ovld __cnfn convert_char16_sat_rte(char16)
long16 __ovld __cnfn convert_long16_rte(char16)
uchar3 __ovld __cnfn convert_uchar3_sat(char3)
uchar16 __ovld __cnfn convert_uchar16_sat_rte(char16)
float __ovld __cnfn tanpi(float x)
Compute tan (PI * x).
long8 __ovld __cnfn convert_long8_rtz(char8)
ushort16 __ovld __cnfn convert_ushort16_rtn(char16)
ulong2 __ovld __cnfn convert_ulong2_sat_rtn(char2)
float __ovld __cnfn fast_distance(float p0, float p1)
Returns fast_length(p0 - p1).
float __ovld __cnfn half_log2(float x)
Compute a base 2 logarithm.
char4 __ovld __cnfn convert_char4(char4)
int2 __ovld __cnfn convert_int2_rtz(char2)
short16 __ovld __cnfn convert_short16_sat_rtn(char16)
ulong __ovld __cnfn convert_ulong_rtn(char)
ulong16 __ovld __cnfn convert_ulong16_rtp(char16)
void __ovld vstorea_half8_rtn(float8 data, size_t offset, half *p)
float __ovld __cnfn minmag(float x, float y)
Returns x if | x | < | y |, y if | y | < | x |, otherwise fmin(x, y).
char3 __ovld __cnfn convert_char3_sat_rtn(char3)
short __ovld __cnfn convert_short_rte(char)
short3 __ovld __cnfn convert_short3_sat(char3)
long8 __ovld __cnfn convert_long8_sat(char8)
uint __ovld __cnfn convert_uint_sat_rtp(char)
char2 __ovld __cnfn convert_char2_sat_rte(char2)
char4 __ovld __cnfn convert_char4_sat_rtp(char4)
long8 __ovld __cnfn convert_long8_rtp(char8)
uint __ovld __cnfn convert_uint_rtp(char)
ulong __ovld __cnfn convert_ulong(char)
short4 __ovld __cnfn convert_short4_rtz(char4)
int __ovld atomic_xor(volatile __global int *p, int val)
Read the 32-bit value (referred to as old) stored at location pointed by p.
uchar3 __ovld __cnfn convert_uchar3_sat_rtn(char3)
int __ovld __conv work_group_scan_exclusive_add(int x)
ulong8 __ovld __cnfn convert_ulong8_rtn(char8)
float __ovld __cnfn mad(float a, float b, float c)
mad approximates a * b + c.
size_t __ovld get_local_linear_id(void)
short2 __ovld __cnfn convert_short2_sat(char2)
char3 __ovld __cnfn convert_char3_rtz(char3)
uint2 __ovld __cnfn convert_uint2_sat_rtz(char2)
int __ovld __conv work_group_scan_inclusive_max(int x)
uchar4 __ovld __cnfn convert_uchar4_sat_rte(char4)
int8 __ovld __cnfn convert_int8(char8)
ulong16 __ovld __cnfn convert_ulong16_rte(char16)
char16 __ovld __cnfn convert_char16_rtp(char16)
int16 __ovld __cnfn convert_int16_sat_rte(char16)
long16 __ovld __cnfn convert_long16_sat(char16)
uchar __ovld __cnfn convert_uchar_rtz(char)
char3 __ovld __cnfn convert_char3_rtp(char3)
char __ovld __cnfn clamp(char x, char minval, char maxval)
Returns min(max(x, minval), maxval).
int8 __ovld __cnfn convert_int8_sat_rtp(char8)
ulong2 __ovld __cnfn convert_ulong2_rte(char2)
char __ovld __cnfn convert_char_rtz(char)
int __ovld __conv work_group_scan_inclusive_min(int x)
short16 __ovld __cnfn convert_short16_sat_rtp(char16)
float4 __ovld __cnfn convert_float4_rtz(char4)
uint4 __ovld __cnfn convert_uint4_rtn(char4)
float __ovld __cnfn convert_float_rtn(char)
float __ovld __cnfn rsqrt(float)
Compute inverse square root.
char __ovld __cnfn mad_hi(char a, char b, char c)
Returns mul_hi(a, b) + c.
char __ovld __cnfn min(char x, char y)
Returns y if y < x, otherwise it returns x.
float2 __ovld __cnfn convert_float2_rte(char2)
void __ovld read_mem_fence(cl_mem_fence_flags flags)
Read memory barrier that orders only loads.
float __ovld __cnfn step(float edge, float x)
Returns 0.0 if x < edge, otherwise it returns 1.0.
ushort4 __ovld __cnfn convert_ushort4_rtp(char4)
int4 __purefn __ovld read_imagei(read_only image2d_t image, sampler_t sampler, int2 coord)
char3 __ovld __cnfn convert_char3_rtn(char3)
char3 __ovld __cnfn convert_char3_sat_rte(char3)
int __ovld atomic_max(volatile __global int *p, int val)
Read the 32-bit value (referred to as old) stored at location pointed by p.
int __ovld __cnfn convert_int_sat_rte(char)
short8 __ovld __cnfn convert_short8_sat_rtz(char8)
uchar8 __ovld __cnfn convert_uchar8_sat_rtp(char8)
uchar2 __ovld __cnfn convert_uchar2(char2)
uint4 __ovld __cnfn convert_uint4_rtp(char4)
ushort4 __ovld __cnfn convert_ushort4_rtz(char4)
ushort __ovld __cnfn convert_ushort_sat(char)
void __ovld vstore3(char3 data, size_t offset, char *p)
int3 __ovld __cnfn convert_int3_sat_rtp(char3)
uint8 __ovld __cnfn convert_uint8_sat_rtp(char8)
float __ovld __cnfn half_divide(float x, float y)
Compute x / y.
ulong8 __ovld __cnfn convert_ulong8_rtz(char8)
char4 __ovld __cnfn convert_char4_sat_rtn(char4)
short __ovld __cnfn convert_short_sat_rtz(char)
ulong3 __ovld __cnfn convert_ulong3_sat_rtp(char3)
uchar3 __ovld __cnfn convert_uchar3_sat_rte(char3)
ulong16 __ovld __cnfn convert_ulong16_rtn(char16)
char2 __ovld __cnfn convert_char2_rte(char2)
uchar4 __ovld __cnfn convert_uchar4_sat_rtn(char4)
float __ovld modf(float x, float *iptr)
Decompose a floating-point number.
char4 __ovld __cnfn convert_char4_sat_rtz(char4)
short3 __ovld __cnfn convert_short3_sat_rtp(char3)
ushort2 __ovld __cnfn convert_ushort2_sat(char2)
float8 __ovld __cnfn convert_float8_rtz(char8)
void __ovld retain_event(clk_event_t)
short3 __ovld __cnfn convert_short3_sat_rte(char3)
char8 __ovld __cnfn convert_char8_sat_rtz(char8)
uchar2 __ovld __cnfn convert_uchar2_rtp(char2)
int __ovld __conv work_group_any(int predicate)
ushort16 __ovld __cnfn convert_ushort16_sat_rtz(char16)
uint4 __ovld __cnfn convert_uint4_sat_rte(char4)
float __ovld lgamma_r(float x, int *signp)
short16 __ovld __cnfn convert_short16_sat_rtz(char16)
uchar3 __ovld __cnfn convert_uchar3_rtp(char3)
ushort4 __ovld __cnfn convert_ushort4_sat_rtz(char4)
int float4 __purefn __ovld read_imagef(read_only image2d_t image, sampler_t sampler, int2 coord)
Use the coordinate (coord.xy) to do an element lookup in the 2D image object specified by image.
void __ovld vstore_half8_rte(float8 data, size_t offset, half *p)
char __ovld __cnfn popcount(char x)
uint3 __ovld __cnfn convert_uint3_rtz(char3)
void __ovld vstore_half4(float4 data, size_t offset, half *p)
uint8 __ovld __cnfn convert_uint8_sat(char8)
uchar2 __ovld __cnfn convert_uchar2_sat_rtn(char2)
int __ovld __conv work_group_scan_exclusive_max(int x)
float3 __ovld vload_half3(size_t offset, const __constant half *p)
float __ovld __cnfn fast_normalize(float p)
Returns a vector in the same direction as p but with a length of 1.
ushort2 __ovld __cnfn convert_ushort2_rtz(char2)
int __ovld __cnfn isfinite(float)
Test for finite value.
float __ovld __cnfn native_tan(float x)
Compute tangent over an implementation-defined range.
float __ovld __cnfn half_tan(float x)
Compute tangent.
float3 __ovld __cnfn convert_float3(char3)
float __ovld __cnfn half_rsqrt(float x)
Compute inverse square root.
int4 __ovld __cnfn convert_int4_sat_rte(char4)
char8 __ovld __cnfn convert_char8_rtz(char8)
short4 __ovld __cnfn convert_short4_sat_rtp(char4)
float __ovld __cnfn native_exp(float x)
Compute the base- e exponential of x over an implementation-defined range.
float __ovld __cnfn pown(float x, int y)
Compute x to the power y, where y is an integer.
int2 __ovld __cnfn convert_int2_rtp(char2)
long4 __ovld __cnfn convert_long4_sat_rtn(char4)
int16 __ovld __cnfn convert_int16_sat_rtz(char16)
void __ovld write_imagef(write_only image2d_t image, int2 coord, float4 color)
Write color value to location specified by coordinate (coord.x, coord.y) in the 2D image object speci...
uchar4 __ovld __cnfn convert_uchar4_sat(char4)
ushort __ovld __cnfn convert_ushort_rtz(char)
short8 __ovld __cnfn convert_short8_rtp(char8)
long4 __ovld __cnfn convert_long4_rtn(char4)
void __ovld vstore4(char4 data, size_t offset, char *p)
int4 __ovld __cnfn convert_int4_sat_rtn(char4)
char __ovld __cnfn max(char x, char y)
Returns y if x < y, otherwise it returns x.
long __ovld __cnfn convert_long(char)
short8 __ovld __cnfn convert_short8_rte(char8)
void __ovld vstore_half3(float3 data, size_t offset, half *p)
char16 __ovld __cnfn convert_char16_rte(char16)
int3 __ovld __cnfn convert_int3_sat_rte(char3)
int __ovld enqueue_marker(queue_t, uint, const clk_event_t *, clk_event_t *)
ushort2 __ovld __cnfn convert_ushort2_sat_rtz(char2)
short4 __ovld __cnfn convert_short4_rtn(char4)
float2 __ovld __cnfn convert_float2(char2)
long2 __ovld __cnfn convert_long2_rtz(char2)
char __ovld __cnfn convert_char_sat_rtp(char)
int __ovld __conv work_group_broadcast(int a, size_t local_id)
uint16 __ovld __cnfn convert_uint16_rtz(char16)
short3 __ovld __cnfn convert_short3_sat_rtn(char3)
uchar16 __ovld __cnfn convert_uchar16(char16)
uint3 __ovld __cnfn convert_uint3_rte(char3)
uint16 __ovld __cnfn convert_uint16_sat_rte(char16)
long3 __ovld __cnfn convert_long3_rtp(char3)
int __ovld __cnfn isnormal(float)
Test for a normal value.
ushort2 __ovld __cnfn convert_ushort2_rtn(char2)
char8 __ovld __cnfn convert_char8_sat(char8)
uint16 __ovld __cnfn convert_uint16_rtn(char16)
long8 __ovld __cnfn convert_long8_sat_rtn(char8)
uchar8 __ovld __cnfn convert_uchar8_sat_rtn(char8)
uchar8 __ovld __cnfn convert_uchar8_rte(char8)
uint4 __ovld __cnfn convert_uint4_sat_rtz(char4)
float __ovld __cnfn native_sqrt(float x)
Compute square root over an implementation-defined range.
int16 __ovld __cnfn convert_int16_rtn(char16)
int4 __ovld __cnfn convert_int4_rtz(char4)
void __ovld vstorea_half4_rtz(float4 data, size_t offset, half *p)
event_t __ovld async_work_group_strided_copy(__local char *dst, const __global char *src, size_t num_elements, size_t src_stride, event_t event)
Perform an async gather of num_elements gentype elements from src to dst.
void __ovld vstorea_half4_rtp(float4 data, size_t offset, half *p)
uint2 __ovld __cnfn convert_uint2_rte(char2)
ulong16 __ovld __cnfn convert_ulong16(char16)
int __ovld atomic_dec(volatile __global int *p)
Read the 32-bit value (referred to as old) stored at location pointed by p.
char __ovld __cnfn convert_char_rtp(char)
uchar8 __ovld __cnfn convert_uchar8_sat_rtz(char8)
ulong3 __ovld __cnfn convert_ulong3(char3)
char3 __ovld __cnfn convert_char3(char3)
int __ovld __cnfn get_image_height(read_only image2d_t image)
Return the image height in pixels.
long __ovld __cnfn convert_long_sat_rtz(char)
void __ovld vstorea_half16_rtp(float16 data, size_t offset, half *p)
long2 __ovld __cnfn convert_long2_sat_rtz(char2)
ulong4 __ovld __cnfn convert_ulong4_sat_rte(char4)
char2 __ovld __cnfn convert_char2_rtn(char2)
short2 __ovld __cnfn convert_short2_sat_rtz(char2)
short8 __ovld __cnfn convert_short8_sat_rtn(char8)
uint2 __ovld __cnfn convert_uint2_sat_rtn(char2)
uchar3 __ovld __cnfn convert_uchar3_rtz(char3)
float __ovld __cnfn native_divide(float x, float y)
Compute x / y over an implementation-defined range.
void __ovld atomic_work_item_fence(cl_mem_fence_flags flags, memory_order order, memory_scope scope)
uint3 __ovld __cnfn convert_uint3_sat_rtn(char3)
float4 __ovld vloada_half4(size_t offset, const __constant half *p)
uchar4 __ovld __cnfn convert_uchar4_rtn(char4)
uint4 __ovld __cnfn convert_uint4_sat_rtn(char4)
int8 __ovld __cnfn convert_int8_sat_rte(char8)
ulong3 __ovld __cnfn convert_ulong3_sat(char3)
ushort3 __ovld __cnfn convert_ushort3_rtp(char3)
float3 __ovld __cnfn convert_float3_rte(char3)
uchar __ovld __cnfn convert_uchar_rtn(char)
long4 __ovld __cnfn convert_long4_sat_rte(char4)
int3 __ovld __cnfn convert_int3_sat_rtn(char3)
long __ovld __cnfn convert_long_rtn(char)
uchar8 __ovld __cnfn convert_uchar8_sat_rte(char8)
long2 __ovld __cnfn convert_long2(char2)
float __ovld fract(float x, float *iptr)
Returns fmin(x - floor (x), 0x1.fffffep-1f ).
ulong16 __ovld __cnfn convert_ulong16_sat_rte(char16)
long __ovld __cnfn convert_long_sat(char)
short __ovld __cnfn convert_short_sat_rte(char)
ndrange_t __ovld ndrange_2D(const size_t[2])
ndrange_t __ovld ndrange_1D(size_t)
ulong16 __ovld __cnfn convert_ulong16_sat_rtz(char16)
ushort __ovld __cnfn convert_ushort_sat_rte(char)
short2 __ovld __cnfn convert_short2_sat_rte(char2)
size_t __ovld __cnfn get_group_id(uint dimindx)
get_group_id returns the work-group ID which is a number from 0 .
uint8 __ovld __cnfn convert_uint8(char8)
float __ovld __cnfn half_sqrt(float x)
Compute square root.
uint __ovld __cnfn get_work_dim(void)
Returns the number of dimensions in use.
long2 __ovld __cnfn convert_long2_sat_rtn(char2)
int2 __ovld __cnfn convert_int2_rtn(char2)
char __ovld __cnfn rhadd(char x, char y)
Returns (x + y + 1) >> 1.
long8 __ovld __cnfn convert_long8_rte(char8)
char16 __ovld __cnfn convert_char16_sat_rtp(char16)
uchar __ovld __cnfn convert_uchar_sat_rte(char)
uchar4 __ovld __cnfn convert_uchar4(char4)
uchar8 __ovld __cnfn convert_uchar8_rtn(char8)
int __ovld __cnfn isgreaterequal(float x, float y)
Returns the component-wise compare of x >= y.
void __ovld vstorea_half_rtz(float data, size_t offset, half *p)
float __ovld __cnfn half_exp(float x)
Compute the base- e exponential of x.
int __ovld __conv work_group_reduce_min(int x)
ushort8 __ovld __cnfn convert_ushort8_rtp(char8)
float4 __ovld __cnfn convert_float4_rtp(char4)
void __ovld vstorea_half3_rte(float3 data, size_t offset, half *p)
uint2 __ovld __cnfn convert_uint2_sat_rtp(char2)
long8 __ovld __cnfn convert_long8_rtn(char8)
int __ovld __cnfn all(char x)
Returns 1 if the most significant bit in all components of x is set; otherwise returns 0.
int2 __ovld __cnfn get_image_dim(read_only image2d_t image)
Return the 2D image width and height as an int2 type.
char2 __ovld __cnfn convert_char2_rtz(char2)
ulong4 __ovld __cnfn convert_ulong4_rtz(char4)
ushort3 __ovld __cnfn convert_ushort3_sat_rtp(char3)
int __ovld __cnfn isunordered(float x, float y)
Test if arguments are unordered.
long16 __ovld __cnfn convert_long16_sat_rtp(char16)
uchar __ovld __cnfn convert_uchar_sat_rtn(char)
ushort4 __ovld __cnfn convert_ushort4_sat_rtp(char4)
uchar __ovld __cnfn convert_uchar_sat_rtz(char)
long4 __ovld __cnfn convert_long4_rtp(char4)
ushort3 __ovld __cnfn convert_ushort3(char3)
long2 __ovld __cnfn convert_long2_rtp(char2)
char4 __ovld __cnfn convert_char4_rtz(char4)
uchar4 __ovld __cnfn convert_uchar4_rtp(char4)
int __ovld __cnfn convert_int_sat_rtn(char)
uchar16 __ovld __cnfn convert_uchar16_rtz(char16)
int __ovld atomic_fetch_min_explicit(volatile atomic_int *object, int operand, memory_order order)
char2 __ovld __cnfn convert_char2(char2)
void __ovld vstorea_half2(float2 data, size_t offset, half *p)
char __ovld __cnfn select(char a, char b, char c)
For each component of a vector type, result[i] = if MSB of c[i] is set ? b[i] : a[i].
long4 __ovld __cnfn convert_long4_rtz(char4)
char __ovld __cnfn convert_char_rte(char)
ushort __ovld __cnfn convert_ushort(char)
uint8 __ovld __cnfn convert_uint8_rtp(char8)
long16 __ovld __cnfn convert_long16_rtz(char16)
int __ovld __cnfn mul24(int x, int y)
Multiply two 24-bit integer values x and y.
ushort8 __ovld __cnfn convert_ushort8_sat_rte(char8)
short16 __ovld __cnfn convert_short16_rtp(char16)
char2 __ovld vload2(size_t offset, const __constant char *p)
Use generic type gentype to indicate the built-in data types char, uchar, short, ushort,...
long4 __ovld __cnfn convert_long4_sat(char4)
long4 __ovld __cnfn convert_long4_rte(char4)
event_t __ovld async_work_group_copy(__local char *dst, const __global char *src, size_t num_elements, event_t event)
Builtin functions to_global, to_local, and to_private need to be declared as Clang builtin functions ...
float __ovld __cnfn powr(float x, float y)
Compute x to the power y, where x is >= 0.
char8 __ovld __cnfn convert_char8_rtn(char8)
short3 __ovld __cnfn convert_short3(char3)
int8 __ovld __cnfn convert_int8_sat_rtn(char8)
char3 __ovld __cnfn convert_char3_sat_rtz(char3)
ulong8 __ovld __cnfn convert_ulong8(char8)
uchar3 __ovld __cnfn convert_uchar3_sat_rtz(char3)
bool __ovld is_valid_event(clk_event_t event)
void __ovld vstore_half2(float2 data, size_t offset, half *p)
The floatn value given by data is converted to a halfn value using the appropriate rounding mode.
void __ovld vstorea_half2_rtp(float2 data, size_t offset, half *p)
int __ovld __conv work_group_scan_inclusive_add(int x)
long3 __ovld __cnfn convert_long3_rte(char3)
char8 __ovld __cnfn convert_char8_sat_rtp(char8)
char __ovld __cnfn convert_char_rtn(char)
long3 __ovld __cnfn convert_long3_sat_rte(char3)
char __ovld __cnfn convert_char_sat_rte(char)
void __ovld vstorea_half_rtn(float data, size_t offset, half *p)
void __ovld vstore_half8_rtp(float8 data, size_t offset, half *p)
ulong16 __ovld __cnfn convert_ulong16_sat_rtn(char16)
uint2 __ovld __cnfn convert_uint2_rtz(char2)
long __ovld __cnfn convert_long_sat_rte(char)
int2 __ovld __cnfn convert_int2(char2)
int __ovld __cnfn isnan(float)
Test for a NaN.
void __ovld vstore_half8_rtn(float8 data, size_t offset, half *p)
short3 __ovld __cnfn convert_short3_rtn(char3)
int2 __ovld __cnfn convert_int2_sat_rtn(char2)
short __ovld __cnfn convert_short_rtn(char)
ulong2 __ovld __cnfn convert_ulong2_rtz(char2)
uint2 __ovld __cnfn convert_uint2_sat(char2)
int4 __ovld __cnfn convert_int4_sat_rtp(char4)
uchar16 __ovld __cnfn convert_uchar16_sat_rtp(char16)
short3 __ovld __cnfn convert_short3_sat_rtz(char3)
float __ovld __cnfn native_log10(float x)
Compute a base 10 logarithm over an implementationdefined range.
uint2 __ovld __cnfn convert_uint2_rtn(char2)
int __ovld __cnfn convert_int_rte(char)
int8 __ovld __cnfn convert_int8_rte(char8)
uchar __ovld __cnfn convert_uchar_sat_rtp(char)
ulong3 __ovld __cnfn convert_ulong3_sat_rtz(char3)
void __ovld vstorea_half(float data, size_t offset, half *p)
The floatn value given by data is converted to a halfn value using the appropriate rounding mode.
ushort2 __ovld __cnfn convert_ushort2_sat_rtp(char2)
uchar2 __ovld __cnfn convert_uchar2_rtz(char2)
int __ovld __cnfn convert_int(char)
void __ovld prefetch(const __global char *p, size_t num_elements)
Prefetch num_elements * sizeof(gentype) bytes into the global cache.
ushort16 __ovld __cnfn convert_ushort16_rtp(char16)
ulong4 __ovld __cnfn convert_ulong4_sat_rtp(char4)
int4 __ovld __cnfn convert_int4_rtp(char4)
void __ovld vstorea_half8_rtz(float8 data, size_t offset, half *p)
float __ovld __cnfn half_exp10(float x)
Compute the base- 10 exponential of x.
ndrange_t __ovld ndrange_3D(const size_t[3])
uint4 __purefn __ovld read_imageui(read_only image2d_t image, sampler_t sampler, int2 coord)
float __ovld __cnfn native_log2(float x)
Compute a base 2 logarithm over an implementationdefined range.
ulong __ovld __cnfn convert_ulong_sat_rtp(char)
short2 __ovld __cnfn convert_short2_rtn(char2)
float __ovld sincos(float x, float *cosval)
Compute sine and cosine of x.
int __ovld __cnfn get_image_channel_data_type(read_only image1d_t image)
Return the channel data type.
void __ovld vstore_half_rtz(float data, size_t offset, half *p)
void __ovld vstorea_half16_rtn(float16 data, size_t offset, half *p)
int16 __ovld __cnfn convert_int16_rtz(char16)
ulong __ovld __cnfn convert_ulong_sat_rtz(char)
float __ovld __cnfn half_log(float x)
Compute natural logarithm.
long8 __ovld __cnfn convert_long8(char8)
uchar3 __ovld __cnfn convert_uchar3_rte(char3)
int __ovld __cnfn islessgreater(float x, float y)
Returns the component-wise compare of (x < y) || (x > y) .
long __ovld __cnfn convert_long_sat_rtn(char)
uchar2 __ovld __cnfn convert_uchar2_sat_rte(char2)
ushort16 __ovld __cnfn convert_ushort16_sat_rtp(char16)
ushort16 __ovld __cnfn convert_ushort16_rtz(char16)
ushort2 __ovld __cnfn convert_ushort2_sat_rtn(char2)
char8 __ovld vload8(size_t offset, const __constant char *p)
int8 __ovld __cnfn convert_int8_sat_rtz(char8)
long16 __ovld __cnfn convert_long16_sat_rte(char16)
uchar16 __ovld __cnfn convert_uchar16_rtp(char16)
size_t __ovld get_enqueued_local_size(uint dimindx)
uchar2 __ovld __cnfn convert_uchar2_rtn(char2)
int __ovld __cnfn signbit(float)
Test for sign bit.
short16 __ovld __cnfn convert_short16_rte(char16)
void __ovld vstore_half_rtn(float data, size_t offset, half *p)
ulong8 __ovld __cnfn convert_ulong8_sat_rtp(char8)
float __ovld vload_half(size_t offset, const __constant half *p)
Read sizeof (half) bytes of data from address (p + offset).
long8 __ovld __cnfn convert_long8_sat_rtz(char8)
int __ovld __cnfn get_image_width(read_only image1d_t image)
Return the image width in pixels.
short __ovld __cnfn upsample(char hi, uchar lo)
result[i] = ((short)hi[i] << 8) | lo[i] result[i] = ((ushort)hi[i] << 8) | lo[i]
short8 __ovld __cnfn convert_short8_sat(char8)
void __ovld vstore_half2_rtp(float2 data, size_t offset, half *p)
float2 __ovld __cnfn convert_float2_rtn(char2)
void __ovld vstore_half16(float16 data, size_t offset, half *p)
ulong3 __ovld __cnfn convert_ulong3_rtn(char3)
char4 __ovld __cnfn convert_char4_rtn(char4)
void __ovld vstorea_half3(float3 data, size_t offset, half *p)
int3 __ovld __cnfn convert_int3_rte(char3)
int2 __ovld __cnfn convert_int2_sat_rte(char2)
bool __ovld is_valid_reserve_id(reserve_id_t reserve_id)
long4 __ovld __cnfn convert_long4_sat_rtz(char4)
ulong __ovld __cnfn convert_ulong_rte(char)
float16 __ovld __cnfn convert_float16_rtz(char16)
void __ovld vstore_half16_rtn(float16 data, size_t offset, half *p)
ulong8 __ovld __cnfn convert_ulong8_sat_rtz(char8)
uint __ovld __cnfn convert_uint_rte(char)
uchar4 __ovld __cnfn convert_uchar4_sat_rtz(char4)
int __ovld __conv work_group_reduce_max(int x)
long3 __ovld __cnfn convert_long3(char3)
short8 __ovld __cnfn convert_short8_sat_rtp(char8)
uint16 __ovld __cnfn convert_uint16(char16)
float16 __ovld vloada_half16(size_t offset, const __constant half *p)
short16 __ovld __cnfn convert_short16(char16)
void __ovld vstore_half3_rte(float3 data, size_t offset, half *p)
long __ovld __cnfn convert_long_sat_rtp(char)
char16 __ovld vload16(size_t offset, const __constant char *p)
long3 __ovld __cnfn convert_long3_rtz(char3)
void __ovld vstorea_half2_rte(float2 data, size_t offset, half *p)
char16 __ovld __cnfn convert_char16_sat(char16)
short4 __ovld __cnfn convert_short4_rte(char4)
float __ovld __cnfn asinpi(float x)
Compute asin (x) / PI.
float __ovld __cnfn convert_float(char)
int4 __ovld __cnfn convert_int4_sat(char4)
long16 __ovld __cnfn convert_long16_sat_rtz(char16)
uchar16 __ovld __cnfn convert_uchar16_rte(char16)
int8 __ovld __cnfn convert_int8_rtp(char8)
int __ovld atomic_min(volatile __global int *p, int val)
Read the 32-bit value (referred to as old) stored at location pointed by p.
size_t __ovld __cnfn get_image_array_size(read_only image1d_array_t image_array)
Return the image array size.
char3 __ovld vload3(size_t offset, const __constant char *p)
int __ovld atomic_cmpxchg(volatile __global int *p, int cmp, int val)
Read the 32-bit value (referred to as old) stored at location pointed by p.
uint16 __ovld __cnfn convert_uint16_rtp(char16)
char __ovld __cnfn hadd(char x, char y)
Returns (x + y) >> 1.
ushort __ovld __cnfn convert_ushort_rte(char)
long2 __ovld __cnfn convert_long2_sat_rte(char2)
long16 __ovld __cnfn convert_long16_sat_rtn(char16)
void __ovld vstore_half(float data, size_t offset, half *p)
The float value given by data is first converted to a half value using the appropriate rounding mode.
ulong2 __ovld __cnfn convert_ulong2_sat_rte(char2)
uchar16 __ovld __cnfn convert_uchar16_sat_rtz(char16)
uchar4 __ovld __cnfn convert_uchar4_sat_rtp(char4)
ulong4 __ovld __cnfn convert_ulong4_rte(char4)
int __ovld __cnfn convert_int_sat_rtp(char)
ulong __ovld __cnfn convert_ulong_rtp(char)
ushort2 __ovld __cnfn convert_ushort2_rtp(char2)
int __ovld atomic_fetch_min(volatile atomic_int *object, int operand)
uint16 __ovld __cnfn convert_uint16_sat(char16)
uchar8 __ovld __cnfn convert_uchar8_sat(char8)
ushort2 __ovld __cnfn convert_ushort2_rte(char2)
void __ovld vstore_half16_rtp(float16 data, size_t offset, half *p)
char16 __ovld __cnfn convert_char16(char16)
float __ovld __cnfn dot(float p0, float p1)
Compute dot product.
float16 __ovld __cnfn convert_float16_rte(char16)
char2 __ovld __cnfn convert_char2_sat_rtz(char2)
uint __ovld __cnfn convert_uint(char)
void __ovld vstore_half2_rtn(float2 data, size_t offset, half *p)
int8 __ovld __cnfn convert_int8_rtn(char8)
int4 __ovld __cnfn convert_int4_rtn(char4)
int __ovld __cnfn get_image_channel_order(read_only image1d_t image)
Return the image channel order.
float8 __ovld __cnfn convert_float8_rtp(char8)
float4 __ovld __cnfn convert_float4_rtn(char4)
ushort4 __ovld __cnfn convert_ushort4_rte(char4)
void __ovld vstore_half4_rtz(float4 data, size_t offset, half *p)
uint3 __ovld __cnfn convert_uint3_sat_rtp(char3)
uint4 __ovld __cnfn convert_uint4(char4)
ushort2 __ovld __cnfn convert_ushort2_sat_rte(char2)
int __ovld atomic_inc(volatile __global int *p)
Read the 32-bit value (referred to as old) stored at location pointed by p.
void __ovld vstorea_half16_rte(float16 data, size_t offset, half *p)
short __ovld __cnfn convert_short_sat(char)
uint2 __ovld __cnfn convert_uint2_sat_rte(char2)
float __ovld __cnfn fast_length(float p)
Returns the length of vector p computed as: half_sqrt(p.x2 + p.y2 + ...)
ushort __ovld __cnfn convert_ushort_sat_rtn(char)
char __ovld __cnfn add_sat(char x, char y)
Returns x + y and saturates the result.
uint16 __ovld __cnfn convert_uint16_sat_rtz(char16)
ushort4 __ovld __cnfn convert_ushort4_rtn(char4)
uint4 __ovld __cnfn convert_uint4_sat_rtp(char4)
char __ovld ctz(char x)
Returns the count of trailing 0-bits in x.
clk_event_t __ovld create_user_event(void)
uchar4 __ovld __cnfn convert_uchar4_rte(char4)
ushort2 __ovld __cnfn convert_ushort2(char2)
uint __ovld __cnfn convert_uint_sat_rtz(char)
uchar2 __ovld __cnfn convert_uchar2_sat_rtz(char2)
uint8 __ovld __cnfn convert_uint8_rtz(char8)
ushort4 __ovld __cnfn convert_ushort4(char4)
char16 __ovld __cnfn convert_char16_rtn(char16)
ulong8 __ovld __cnfn convert_ulong8_sat_rte(char8)
int __ovld __cnfn isordered(float x, float y)
Test if arguments are ordered.
void __ovld vstore_half8_rtz(float8 data, size_t offset, half *p)
uint3 __ovld __cnfn convert_uint3_sat_rte(char3)
uint2 __ovld __cnfn convert_uint2(char2)
uint8 __ovld __cnfn convert_uint8_sat_rtz(char8)
uint16 __ovld __cnfn convert_uint16_rte(char16)
short2 __ovld __cnfn convert_short2_sat_rtn(char2)
float __ovld __cnfn degrees(float radians)
Converts radians to degrees, i.e.
char8 __ovld __cnfn convert_char8_rte(char8)
float __ovld __cnfn cospi(float x)
Compute cos (PI * x).
float2 __ovld __cnfn convert_float2_rtz(char2)
float4 __ovld vload_half4(size_t offset, const __constant half *p)
char3 __ovld __cnfn convert_char3_rte(char3)
int __ovld __cnfn mad24(int x, int y, int z)
Multiply two 24-bit integer values x and y and add the 32-bit integer result to the 32-bit integer z.
int __ovld __cnfn convert_int_sat(char)
char2 __ovld __cnfn convert_char2_sat_rtn(char2)
ushort __ovld __cnfn convert_ushort_rtp(char)
void __ovld vstorea_half3_rtn(float3 data, size_t offset, half *p)
void __ovld vstorea_half2_rtn(float2 data, size_t offset, half *p)
int __ovld __conv work_group_all(int predicate)
Return the number of samples associated with image.
ulong3 __ovld __cnfn convert_ulong3_rte(char3)
ulong2 __ovld __cnfn convert_ulong2_rtp(char2)
ushort16 __ovld __cnfn convert_ushort16_sat(char16)
short __ovld __cnfn convert_short(char)
short8 __ovld __cnfn convert_short8_rtn(char8)
long3 __ovld __cnfn convert_long3_rtn(char3)
void __ovld vstorea_half3_rtp(float3 data, size_t offset, half *p)
char2 __ovld __cnfn convert_char2_sat(char2)
ushort4 __ovld __cnfn convert_ushort4_sat_rte(char4)
void __ovld vstore_half4_rtn(float4 data, size_t offset, half *p)
uchar3 __ovld __cnfn convert_uchar3_sat_rtp(char3)
int __ovld __conv work_group_reduce_add(int x)
float __ovld __cnfn smoothstep(float edge0, float edge1, float x)
Returns 0.0 if x <= edge0 and 1.0 if x >= edge1 and performs smooth Hermite interpolation between 0 a...
short4 __ovld __cnfn convert_short4(char4)
ulong3 __ovld __cnfn convert_ulong3_rtz(char3)
uchar16 __ovld __cnfn convert_uchar16_rtn(char16)
size_t __ovld __cnfn get_local_size(uint dimindx)
Returns the number of local work-items specified in dimension identified by dimindx.
float __ovld __cnfn mix(float x, float y, float a)
Returns the linear blend of x & y implemented as: x + (y - x) * a a must be a value in the range 0....
ulong __ovld __cnfn convert_ulong_sat_rtn(char)
short16 __ovld __cnfn convert_short16_rtz(char16)
long2 __ovld __cnfn convert_long2_rte(char2)
void __ovld write_imagei(write_only image2d_t image, int2 coord, int4 color)
float3 __ovld vloada_half3(size_t offset, const __constant half *p)
uint4 __ovld __cnfn convert_uint4_rte(char4)
ushort8 __ovld __cnfn convert_ushort8(char8)
int8 __ovld __cnfn convert_int8_rtz(char8)
ushort __ovld __cnfn convert_ushort_sat_rtp(char)
int3 __ovld __cnfn convert_int3_sat(char3)
cl_mem_fence_flags __ovld get_fence(const void *ptr)
void __ovld vstore_half_rte(float data, size_t offset, half *p)
#define atomic_fetch_xor(object, operand)
#define atomic_store(object, desired)
#define atomic_compare_exchange_weak(object, expected, desired)
#define atomic_compare_exchange_weak_explicit
#define atomic_compare_exchange_strong(object, expected, desired)
#define atomic_exchange(object, desired)
#define atomic_fetch_or(object, operand)
#define atomic_flag_clear(object)
#define atomic_fetch_and_explicit
#define atomic_fetch_sub(object, operand)
#define atomic_fetch_sub_explicit
#define atomic_flag_test_and_set_explicit(object, order)
#define atomic_fetch_xor_explicit
#define atomic_store_explicit
#define atomic_flag_test_and_set(object)
#define atomic_fetch_or_explicit
#define atomic_load_explicit
#define atomic_flag_clear_explicit(object, order)
#define atomic_exchange_explicit
#define atomic_load(object)
#define atomic_fetch_and(object, operand)
#define atomic_compare_exchange_strong_explicit
#define atomic_fetch_add_explicit
#define atomic_fetch_add(object, operand)
#define copysign(__x, __y)
#define remquo(__x, __y, __z)
#define nextafter(__x, __y)
#define remainder(__x, __y)
#define fma(__x, __y, __z)