forked from OSchip/llvm-project
				
			
		
			
				
	
	
		
			59 lines
		
	
	
		
			2.2 KiB
		
	
	
	
		
			C
		
	
	
	
			
		
		
	
	
			59 lines
		
	
	
		
			2.2 KiB
		
	
	
	
		
			C
		
	
	
	
#define _CLC_VLOAD_DECL(SUFFIX, MEM_TYPE, VEC_TYPE, WIDTH, ADDR_SPACE) \
 | 
						|
  _CLC_OVERLOAD _CLC_DECL VEC_TYPE vload##SUFFIX##WIDTH(size_t offset, const ADDR_SPACE MEM_TYPE *x);
 | 
						|
 | 
						|
#define _CLC_VECTOR_VLOAD_DECL(SUFFIX, MEM_TYPE, PRIM_TYPE, ADDR_SPACE) \
 | 
						|
  _CLC_VLOAD_DECL(SUFFIX, MEM_TYPE, PRIM_TYPE##2, 2, ADDR_SPACE) \
 | 
						|
  _CLC_VLOAD_DECL(SUFFIX, MEM_TYPE, PRIM_TYPE##3, 3, ADDR_SPACE) \
 | 
						|
  _CLC_VLOAD_DECL(SUFFIX, MEM_TYPE, PRIM_TYPE##4, 4, ADDR_SPACE) \
 | 
						|
  _CLC_VLOAD_DECL(SUFFIX, MEM_TYPE, PRIM_TYPE##8, 8, ADDR_SPACE) \
 | 
						|
  _CLC_VLOAD_DECL(SUFFIX, MEM_TYPE, PRIM_TYPE##16, 16, ADDR_SPACE)
 | 
						|
 | 
						|
#define _CLC_VECTOR_VLOAD_PRIM3(SUFFIX, MEM_TYPE, PRIM_TYPE) \
 | 
						|
  _CLC_VECTOR_VLOAD_DECL(SUFFIX, MEM_TYPE, PRIM_TYPE, __private) \
 | 
						|
  _CLC_VECTOR_VLOAD_DECL(SUFFIX, MEM_TYPE, PRIM_TYPE, __local) \
 | 
						|
  _CLC_VECTOR_VLOAD_DECL(SUFFIX, MEM_TYPE, PRIM_TYPE, __constant) \
 | 
						|
  _CLC_VECTOR_VLOAD_DECL(SUFFIX, MEM_TYPE, PRIM_TYPE, __global)
 | 
						|
 | 
						|
#define _CLC_VECTOR_VLOAD_PRIM1(PRIM_TYPE) \
 | 
						|
  _CLC_VECTOR_VLOAD_PRIM3(, PRIM_TYPE, PRIM_TYPE)
 | 
						|
 | 
						|
// Declare vector load prototypes
 | 
						|
_CLC_VECTOR_VLOAD_PRIM1(char)
 | 
						|
_CLC_VECTOR_VLOAD_PRIM1(uchar)
 | 
						|
_CLC_VECTOR_VLOAD_PRIM1(short)
 | 
						|
_CLC_VECTOR_VLOAD_PRIM1(ushort)
 | 
						|
_CLC_VECTOR_VLOAD_PRIM1(int)
 | 
						|
_CLC_VECTOR_VLOAD_PRIM1(uint)
 | 
						|
_CLC_VECTOR_VLOAD_PRIM1(long)
 | 
						|
_CLC_VECTOR_VLOAD_PRIM1(ulong)
 | 
						|
_CLC_VECTOR_VLOAD_PRIM1(float)
 | 
						|
_CLC_VECTOR_VLOAD_PRIM3(_half, half, float)
 | 
						|
// Use suffix to declare aligned vloada_halfN
 | 
						|
_CLC_VECTOR_VLOAD_PRIM3(a_half, half, float)
 | 
						|
 | 
						|
#ifdef cl_khr_fp64
 | 
						|
#pragma OPENCL EXTENSION cl_khr_fp64: enable
 | 
						|
  _CLC_VECTOR_VLOAD_PRIM1(double)
 | 
						|
#endif
 | 
						|
#ifdef cl_khr_fp16
 | 
						|
#pragma OPENCL EXTENSION cl_khr_fp16: enable
 | 
						|
  _CLC_VECTOR_VLOAD_PRIM1(half)
 | 
						|
#endif
 | 
						|
 | 
						|
// Scalar vload_half also needs to be declared
 | 
						|
_CLC_VLOAD_DECL(_half, half, float, , __constant)
 | 
						|
_CLC_VLOAD_DECL(_half, half, float, , __global)
 | 
						|
_CLC_VLOAD_DECL(_half, half, float, , __local)
 | 
						|
_CLC_VLOAD_DECL(_half, half, float, , __private)
 | 
						|
 | 
						|
// Scalar vloada_half is not part of the specs but CTS expects it
 | 
						|
_CLC_VLOAD_DECL(a_half, half, float, , __constant)
 | 
						|
_CLC_VLOAD_DECL(a_half, half, float, , __global)
 | 
						|
_CLC_VLOAD_DECL(a_half, half, float, , __local)
 | 
						|
_CLC_VLOAD_DECL(a_half, half, float, , __private)
 | 
						|
 | 
						|
#undef _CLC_VLOAD_DECL
 | 
						|
#undef _CLC_VECTOR_VLOAD_DECL
 | 
						|
#undef _CLC_VECTOR_VLOAD_PRIM3
 | 
						|
#undef _CLC_VECTOR_VLOAD_PRIM1
 |