|  |  | @@ -53,6 +53,18 @@ | 
			
		
	
		
		
			
				
					
					|  |  |  |  |  |  |  |  | 
			
		
	
		
		
			
				
					
					|  |  |  | #define noconvert |  |  |  | #define noconvert | 
			
		
	
		
		
			
				
					
					|  |  |  |  |  |  |  |  | 
			
		
	
		
		
			
				
					
					|  |  |  |  |  |  |  | #if cn != 3 | 
			
		
	
		
		
			
				
					
					|  |  |  |  |  |  |  | #define loadpix(addr)  *(__global const T*)(addr) | 
			
		
	
		
		
			
				
					
					|  |  |  |  |  |  |  | #define storepix(val, addr)  *(__global T*)(addr) = val | 
			
		
	
		
		
			
				
					
					|  |  |  |  |  |  |  | #define TSIZE ((int)sizeof(T)) | 
			
		
	
		
		
			
				
					
					|  |  |  |  |  |  |  | #define convertScalar(a) (a) | 
			
		
	
		
		
			
				
					
					|  |  |  |  |  |  |  | #else | 
			
		
	
		
		
			
				
					
					|  |  |  |  |  |  |  | #define loadpix(addr)  vload3(0, (__global const T1*)(addr)) | 
			
		
	
		
		
			
				
					
					|  |  |  |  |  |  |  | #define storepix(val, addr) vstore3(val, 0, (__global T1*)(addr)) | 
			
		
	
		
		
			
				
					
					|  |  |  |  |  |  |  | #define TSIZE ((int)sizeof(T1)*3) | 
			
		
	
		
		
			
				
					
					|  |  |  |  |  |  |  | #define convertScalar(a) (T)(a.x, a.y, a.z) | 
			
		
	
		
		
			
				
					
					|  |  |  |  |  |  |  | #endif | 
			
		
	
		
		
			
				
					
					|  |  |  |  |  |  |  |  | 
			
		
	
		
		
			
				
					
					|  |  |  | enum |  |  |  | enum | 
			
		
	
		
		
			
				
					
					|  |  |  | { |  |  |  | { | 
			
		
	
		
		
			
				
					
					|  |  |  |     INTER_BITS = 5, |  |  |  |     INTER_BITS = 5, | 
			
		
	
	
		
		
			
				
					
					|  |  | @@ -70,7 +82,7 @@ enum | 
			
		
	
		
		
			
				
					
					|  |  |  | #define EXTRAPOLATE(v2, v) \ |  |  |  | #define EXTRAPOLATE(v2, v) \ | 
			
		
	
		
		
			
				
					
					|  |  |  |     { \ |  |  |  |     { \ | 
			
		
	
		
		
			
				
					
					|  |  |  |         v2 = max(min(v2, (int2)(src_cols - 1, src_rows - 1)), (int2)(0)); \ |  |  |  |         v2 = max(min(v2, (int2)(src_cols - 1, src_rows - 1)), (int2)(0)); \ | 
			
		
	
		
		
			
				
					
					|  |  |  |         v = convertToWT(*((__global const T*)(srcptr + mad24(v2.y, src_step, v2.x * (int)sizeof(T) + src_offset)))); \ |  |  |  |         v = convertToWT(loadpix((__global const T*)(srcptr + mad24(v2.y, src_step, v2.x * TSIZE + src_offset)))); \ | 
			
				
				
			
		
	
		
		
	
		
		
			
				
					
					|  |  |  |     } |  |  |  |     } | 
			
		
	
		
		
			
				
					
					|  |  |  | #elif defined BORDER_WRAP |  |  |  | #elif defined BORDER_WRAP | 
			
		
	
		
		
			
				
					
					|  |  |  | #define EXTRAPOLATE(v2, v) \ |  |  |  | #define EXTRAPOLATE(v2, v) \ | 
			
		
	
	
		
		
			
				
					
					|  |  | @@ -84,7 +96,7 @@ enum | 
			
		
	
		
		
			
				
					
					|  |  |  |             v2.y -= ((v2.y - src_rows + 1) / src_rows) * src_rows; \ |  |  |  |             v2.y -= ((v2.y - src_rows + 1) / src_rows) * src_rows; \ | 
			
		
	
		
		
			
				
					
					|  |  |  |         if( v2.y >= src_rows ) \ |  |  |  |         if( v2.y >= src_rows ) \ | 
			
		
	
		
		
			
				
					
					|  |  |  |             v2.y %= src_rows; \ |  |  |  |             v2.y %= src_rows; \ | 
			
		
	
		
		
			
				
					
					|  |  |  |         v = convertToWT(*((__global const T*)(srcptr + mad24(v2.y, src_step, v2.x * (int)sizeof(T) + src_offset)))); \ |  |  |  |         v = convertToWT(loadpix((__global const T*)(srcptr + mad24(v2.y, src_step, v2.x * TSIZE + src_offset)))); \ | 
			
				
				
			
		
	
		
		
	
		
		
			
				
					
					|  |  |  |     } |  |  |  |     } | 
			
		
	
		
		
			
				
					
					|  |  |  | #elif defined(BORDER_REFLECT) || defined(BORDER_REFLECT_101) |  |  |  | #elif defined(BORDER_REFLECT) || defined(BORDER_REFLECT_101) | 
			
		
	
		
		
			
				
					
					|  |  |  | #ifdef BORDER_REFLECT |  |  |  | #ifdef BORDER_REFLECT | 
			
		
	
	
		
		
			
				
					
					|  |  | @@ -118,7 +130,7 @@ enum | 
			
		
	
		
		
			
				
					
					|  |  |  |                     v2.y = src_rows - 1 - (v2.y - src_rows) - delta; \ |  |  |  |                     v2.y = src_rows - 1 - (v2.y - src_rows) - delta; \ | 
			
		
	
		
		
			
				
					
					|  |  |  |             } \ |  |  |  |             } \ | 
			
		
	
		
		
			
				
					
					|  |  |  |             while (v2.y >= src_rows || v2.y < 0); \ |  |  |  |             while (v2.y >= src_rows || v2.y < 0); \ | 
			
		
	
		
		
			
				
					
					|  |  |  |         v = convertToWT(*((__global const T*)(srcptr + mad24(v2.y, src_step, v2.x * (int)sizeof(T) + src_offset)))); \ |  |  |  |         v = convertToWT(loadpix((__global const T*)(srcptr + mad24(v2.y, src_step, v2.x * TSIZE + src_offset)))); \ | 
			
				
				
			
		
	
		
		
	
		
		
			
				
					
					|  |  |  |     } |  |  |  |     } | 
			
		
	
		
		
			
				
					
					|  |  |  | #else |  |  |  | #else | 
			
		
	
		
		
			
				
					
					|  |  |  | #error No extrapolation method |  |  |  | #error No extrapolation method | 
			
		
	
	
		
		
			
				
					
					|  |  | @@ -132,16 +144,18 @@ __kernel void remap_2_32FC1(__global const uchar * srcptr, int src_step, int src | 
			
		
	
		
		
			
				
					
					|  |  |  |                             __global uchar * dstptr, int dst_step, int dst_offset, int dst_rows, int dst_cols, |  |  |  |                             __global uchar * dstptr, int dst_step, int dst_offset, int dst_rows, int dst_cols, | 
			
		
	
		
		
			
				
					
					|  |  |  |                             __global const uchar * map1ptr, int map1_step, int map1_offset, |  |  |  |                             __global const uchar * map1ptr, int map1_step, int map1_offset, | 
			
		
	
		
		
			
				
					
					|  |  |  |                             __global const uchar * map2ptr, int map2_step, int map2_offset, |  |  |  |                             __global const uchar * map2ptr, int map2_step, int map2_offset, | 
			
		
	
		
		
			
				
					
					|  |  |  |                             T scalar) |  |  |  |                             ST nVal) | 
			
				
				
			
		
	
		
		
	
		
		
			
				
					
					|  |  |  | { |  |  |  | { | 
			
		
	
		
		
			
				
					
					|  |  |  |     int x = get_global_id(0); |  |  |  |     int x = get_global_id(0); | 
			
		
	
		
		
			
				
					
					|  |  |  |     int y = get_global_id(1); |  |  |  |     int y = get_global_id(1); | 
			
		
	
		
		
			
				
					
					|  |  |  |  |  |  |  |  | 
			
		
	
		
		
			
				
					
					|  |  |  |  |  |  |  |     T scalar = convertScalar(nVal); | 
			
		
	
		
		
			
				
					
					|  |  |  |  |  |  |  |  | 
			
		
	
		
		
			
				
					
					|  |  |  |     if (x < dst_cols && y < dst_rows) |  |  |  |     if (x < dst_cols && y < dst_rows) | 
			
		
	
		
		
			
				
					
					|  |  |  |     { |  |  |  |     { | 
			
		
	
		
		
			
				
					
					|  |  |  |         int map1_index = mad24(y, map1_step, x * (int)sizeof(float) + map1_offset); |  |  |  |         int map1_index = mad24(y, map1_step, x * (int)sizeof(float) + map1_offset); | 
			
		
	
		
		
			
				
					
					|  |  |  |         int map2_index = mad24(y, map2_step, x * (int)sizeof(float) + map2_offset); |  |  |  |         int map2_index = mad24(y, map2_step, x * (int)sizeof(float) + map2_offset); | 
			
		
	
		
		
			
				
					
					|  |  |  |         int dst_index = mad24(y, dst_step, x * (int)sizeof(T) + dst_offset); |  |  |  |         int dst_index = mad24(y, dst_step, x * TSIZE + dst_offset); | 
			
				
				
			
		
	
		
		
	
		
		
			
				
					
					|  |  |  |  |  |  |  |  | 
			
		
	
		
		
			
				
					
					|  |  |  |         __global const float * map1 = (__global const float *)(map1ptr + map1_index); |  |  |  |         __global const float * map1 = (__global const float *)(map1ptr + map1_index); | 
			
		
	
		
		
			
				
					
					|  |  |  |         __global const float * map2 = (__global const float *)(map2ptr + map2_index); |  |  |  |         __global const float * map2 = (__global const float *)(map2ptr + map2_index); | 
			
		
	
	
		
		
			
				
					
					|  |  | @@ -155,12 +169,14 @@ __kernel void remap_2_32FC1(__global const uchar * srcptr, int src_step, int src | 
			
		
	
		
		
			
				
					
					|  |  |  | #ifndef BORDER_CONSTANT |  |  |  | #ifndef BORDER_CONSTANT | 
			
		
	
		
		
			
				
					
					|  |  |  |             int2 gxy = (int2)(gx, gy); |  |  |  |             int2 gxy = (int2)(gx, gy); | 
			
		
	
		
		
			
				
					
					|  |  |  | #endif |  |  |  | #endif | 
			
		
	
		
		
			
				
					
					|  |  |  |             EXTRAPOLATE(gxy, dst[0]) |  |  |  |             T v; | 
			
				
				
			
		
	
		
		
	
		
		
			
				
					
					|  |  |  |  |  |  |  |             EXTRAPOLATE(gxy, v) | 
			
		
	
		
		
			
				
					
					|  |  |  |  |  |  |  |             storepix(v, dst); | 
			
		
	
		
		
			
				
					
					|  |  |  |         } |  |  |  |         } | 
			
		
	
		
		
			
				
					
					|  |  |  |         else |  |  |  |         else | 
			
		
	
		
		
			
				
					
					|  |  |  |         { |  |  |  |         { | 
			
		
	
		
		
			
				
					
					|  |  |  |             int src_index = mad24(gy, src_step, gx * (int)sizeof(T) + src_offset); |  |  |  |             int src_index = mad24(gy, src_step, gx * TSIZE + src_offset); | 
			
				
				
			
		
	
		
		
			
				
					
					|  |  |  |             dst[0] = *((__global const T*)(srcptr + src_index)); |  |  |  |             storepix(loadpix((__global const T*)(srcptr + src_index)), dst); | 
			
				
				
			
		
	
		
		
	
		
		
	
		
		
			
				
					
					|  |  |  |         } |  |  |  |         } | 
			
		
	
		
		
			
				
					
					|  |  |  |     } |  |  |  |     } | 
			
		
	
		
		
			
				
					
					|  |  |  | } |  |  |  | } | 
			
		
	
	
		
		
			
				
					
					|  |  | @@ -168,14 +184,16 @@ __kernel void remap_2_32FC1(__global const uchar * srcptr, int src_step, int src | 
			
		
	
		
		
			
				
					
					|  |  |  | __kernel void remap_32FC2(__global const uchar * srcptr, int src_step, int src_offset, int src_rows, int src_cols, |  |  |  | __kernel void remap_32FC2(__global const uchar * srcptr, int src_step, int src_offset, int src_rows, int src_cols, | 
			
		
	
		
		
			
				
					
					|  |  |  |                           __global uchar * dstptr, int dst_step, int dst_offset, int dst_rows, int dst_cols, |  |  |  |                           __global uchar * dstptr, int dst_step, int dst_offset, int dst_rows, int dst_cols, | 
			
		
	
		
		
			
				
					
					|  |  |  |                           __global const uchar * mapptr, int map_step, int map_offset, |  |  |  |                           __global const uchar * mapptr, int map_step, int map_offset, | 
			
		
	
		
		
			
				
					
					|  |  |  |                           T scalar) |  |  |  |                           ST nVal) | 
			
				
				
			
		
	
		
		
	
		
		
			
				
					
					|  |  |  | { |  |  |  | { | 
			
		
	
		
		
			
				
					
					|  |  |  |     int x = get_global_id(0); |  |  |  |     int x = get_global_id(0); | 
			
		
	
		
		
			
				
					
					|  |  |  |     int y = get_global_id(1); |  |  |  |     int y = get_global_id(1); | 
			
		
	
		
		
			
				
					
					|  |  |  |  |  |  |  |  | 
			
		
	
		
		
			
				
					
					|  |  |  |  |  |  |  |     T scalar = convertScalar(nVal); | 
			
		
	
		
		
			
				
					
					|  |  |  |  |  |  |  |  | 
			
		
	
		
		
			
				
					
					|  |  |  |     if (x < dst_cols && y < dst_rows) |  |  |  |     if (x < dst_cols && y < dst_rows) | 
			
		
	
		
		
			
				
					
					|  |  |  |     { |  |  |  |     { | 
			
		
	
		
		
			
				
					
					|  |  |  |         int dst_index = mad24(y, dst_step, x * (int)sizeof(T) + dst_offset); |  |  |  |         int dst_index = mad24(y, dst_step, x * TSIZE + dst_offset); | 
			
				
				
			
		
	
		
		
	
		
		
			
				
					
					|  |  |  |         int map_index = mad24(y, map_step, x * (int)sizeof(float2) + map_offset); |  |  |  |         int map_index = mad24(y, map_step, x * (int)sizeof(float2) + map_offset); | 
			
		
	
		
		
			
				
					
					|  |  |  |  |  |  |  |  | 
			
		
	
		
		
			
				
					
					|  |  |  |         __global const float2 * map = (__global const float2 *)(mapptr + map_index); |  |  |  |         __global const float2 * map = (__global const float2 *)(mapptr + map_index); | 
			
		
	
	
		
		
			
				
					
					|  |  | @@ -185,11 +203,15 @@ __kernel void remap_32FC2(__global const uchar * srcptr, int src_step, int src_o | 
			
		
	
		
		
			
				
					
					|  |  |  |         int gx = gxy.x, gy = gxy.y; |  |  |  |         int gx = gxy.x, gy = gxy.y; | 
			
		
	
		
		
			
				
					
					|  |  |  |  |  |  |  |  | 
			
		
	
		
		
			
				
					
					|  |  |  |         if (NEED_EXTRAPOLATION(gx, gy)) |  |  |  |         if (NEED_EXTRAPOLATION(gx, gy)) | 
			
		
	
		
		
			
				
					
					|  |  |  |             EXTRAPOLATE(gxy, dst[0]) |  |  |  |         { | 
			
				
				
			
		
	
		
		
	
		
		
			
				
					
					|  |  |  |  |  |  |  |             T v; | 
			
		
	
		
		
			
				
					
					|  |  |  |  |  |  |  |             EXTRAPOLATE(gxy, v) | 
			
		
	
		
		
			
				
					
					|  |  |  |  |  |  |  |             storepix(v, dst); | 
			
		
	
		
		
			
				
					
					|  |  |  |  |  |  |  |         } | 
			
		
	
		
		
			
				
					
					|  |  |  |         else |  |  |  |         else | 
			
		
	
		
		
			
				
					
					|  |  |  |         { |  |  |  |         { | 
			
		
	
		
		
			
				
					
					|  |  |  |             int src_index = mad24(gy, src_step, gx * (int)sizeof(T) + src_offset); |  |  |  |             int src_index = mad24(gy, src_step, gx * TSIZE + src_offset); | 
			
				
				
			
		
	
		
		
			
				
					
					|  |  |  |             dst[0] = *((__global const T *)(srcptr + src_index)); |  |  |  |             storepix(loadpix((__global const T *)(srcptr + src_index)), dst); | 
			
				
				
			
		
	
		
		
	
		
		
	
		
		
			
				
					
					|  |  |  |         } |  |  |  |         } | 
			
		
	
		
		
			
				
					
					|  |  |  |     } |  |  |  |     } | 
			
		
	
		
		
			
				
					
					|  |  |  | } |  |  |  | } | 
			
		
	
	
		
		
			
				
					
					|  |  | @@ -197,14 +219,16 @@ __kernel void remap_32FC2(__global const uchar * srcptr, int src_step, int src_o | 
			
		
	
		
		
			
				
					
					|  |  |  | __kernel void remap_16SC2(__global const uchar * srcptr, int src_step, int src_offset, int src_rows, int src_cols, |  |  |  | __kernel void remap_16SC2(__global const uchar * srcptr, int src_step, int src_offset, int src_rows, int src_cols, | 
			
		
	
		
		
			
				
					
					|  |  |  |                           __global uchar * dstptr, int dst_step, int dst_offset, int dst_rows, int dst_cols, |  |  |  |                           __global uchar * dstptr, int dst_step, int dst_offset, int dst_rows, int dst_cols, | 
			
		
	
		
		
			
				
					
					|  |  |  |                           __global const uchar * mapptr, int map_step, int map_offset, |  |  |  |                           __global const uchar * mapptr, int map_step, int map_offset, | 
			
		
	
		
		
			
				
					
					|  |  |  |                           T scalar) |  |  |  |                           ST nVal) | 
			
				
				
			
		
	
		
		
	
		
		
			
				
					
					|  |  |  | { |  |  |  | { | 
			
		
	
		
		
			
				
					
					|  |  |  |     int x = get_global_id(0); |  |  |  |     int x = get_global_id(0); | 
			
		
	
		
		
			
				
					
					|  |  |  |     int y = get_global_id(1); |  |  |  |     int y = get_global_id(1); | 
			
		
	
		
		
			
				
					
					|  |  |  |  |  |  |  |  | 
			
		
	
		
		
			
				
					
					|  |  |  |  |  |  |  |     T scalar = convertScalar(nVal); | 
			
		
	
		
		
			
				
					
					|  |  |  |  |  |  |  |  | 
			
		
	
		
		
			
				
					
					|  |  |  |     if (x < dst_cols && y < dst_rows) |  |  |  |     if (x < dst_cols && y < dst_rows) | 
			
		
	
		
		
			
				
					
					|  |  |  |     { |  |  |  |     { | 
			
		
	
		
		
			
				
					
					|  |  |  |         int dst_index = mad24(y, dst_step, x * (int)sizeof(T) + dst_offset); |  |  |  |         int dst_index = mad24(y, dst_step, x * TSIZE + dst_offset); | 
			
				
				
			
		
	
		
		
	
		
		
			
				
					
					|  |  |  |         int map_index = mad24(y, map_step, x * (int)sizeof(short2) + map_offset); |  |  |  |         int map_index = mad24(y, map_step, x * (int)sizeof(short2) + map_offset); | 
			
		
	
		
		
			
				
					
					|  |  |  |  |  |  |  |  | 
			
		
	
		
		
			
				
					
					|  |  |  |         __global const short2 * map = (__global const short2 *)(mapptr + map_index); |  |  |  |         __global const short2 * map = (__global const short2 *)(mapptr + map_index); | 
			
		
	
	
		
		
			
				
					
					|  |  | @@ -214,11 +238,15 @@ __kernel void remap_16SC2(__global const uchar * srcptr, int src_step, int src_o | 
			
		
	
		
		
			
				
					
					|  |  |  |         int gx = gxy.x, gy = gxy.y; |  |  |  |         int gx = gxy.x, gy = gxy.y; | 
			
		
	
		
		
			
				
					
					|  |  |  |  |  |  |  |  | 
			
		
	
		
		
			
				
					
					|  |  |  |         if (NEED_EXTRAPOLATION(gx, gy)) |  |  |  |         if (NEED_EXTRAPOLATION(gx, gy)) | 
			
		
	
		
		
			
				
					
					|  |  |  |             EXTRAPOLATE(gxy, dst[0]) |  |  |  |         { | 
			
				
				
			
		
	
		
		
	
		
		
			
				
					
					|  |  |  |  |  |  |  |             T v; | 
			
		
	
		
		
			
				
					
					|  |  |  |  |  |  |  |             EXTRAPOLATE(gxy, v) | 
			
		
	
		
		
			
				
					
					|  |  |  |  |  |  |  |             storepix(v, dst); | 
			
		
	
		
		
			
				
					
					|  |  |  |  |  |  |  |         } | 
			
		
	
		
		
			
				
					
					|  |  |  |         else |  |  |  |         else | 
			
		
	
		
		
			
				
					
					|  |  |  |         { |  |  |  |         { | 
			
		
	
		
		
			
				
					
					|  |  |  |             int src_index = mad24(gy, src_step, gx * (int)sizeof(T) + src_offset); |  |  |  |             int src_index = mad24(gy, src_step, gx * TSIZE + src_offset); | 
			
				
				
			
		
	
		
		
			
				
					
					|  |  |  |             dst[0] = *((__global const T *)(srcptr + src_index)); |  |  |  |             storepix(loadpix((__global const T *)(srcptr + src_index)), dst); | 
			
				
				
			
		
	
		
		
	
		
		
	
		
		
			
				
					
					|  |  |  |         } |  |  |  |         } | 
			
		
	
		
		
			
				
					
					|  |  |  |     } |  |  |  |     } | 
			
		
	
		
		
			
				
					
					|  |  |  | } |  |  |  | } | 
			
		
	
	
		
		
			
				
					
					|  |  | @@ -227,14 +255,16 @@ __kernel void remap_16SC2_16UC1(__global const uchar * srcptr, int src_step, int | 
			
		
	
		
		
			
				
					
					|  |  |  |                                 __global uchar * dstptr, int dst_step, int dst_offset, int dst_rows, int dst_cols, |  |  |  |                                 __global uchar * dstptr, int dst_step, int dst_offset, int dst_rows, int dst_cols, | 
			
		
	
		
		
			
				
					
					|  |  |  |                                 __global const uchar * map1ptr, int map1_step, int map1_offset, |  |  |  |                                 __global const uchar * map1ptr, int map1_step, int map1_offset, | 
			
		
	
		
		
			
				
					
					|  |  |  |                                 __global const uchar * map2ptr, int map2_step, int map2_offset, |  |  |  |                                 __global const uchar * map2ptr, int map2_step, int map2_offset, | 
			
		
	
		
		
			
				
					
					|  |  |  |                                 T scalar) |  |  |  |                                 ST nVal) | 
			
				
				
			
		
	
		
		
	
		
		
			
				
					
					|  |  |  | { |  |  |  | { | 
			
		
	
		
		
			
				
					
					|  |  |  |     int x = get_global_id(0); |  |  |  |     int x = get_global_id(0); | 
			
		
	
		
		
			
				
					
					|  |  |  |     int y = get_global_id(1); |  |  |  |     int y = get_global_id(1); | 
			
		
	
		
		
			
				
					
					|  |  |  |  |  |  |  |  | 
			
		
	
		
		
			
				
					
					|  |  |  |  |  |  |  |     T scalar = convertScalar(nVal); | 
			
		
	
		
		
			
				
					
					|  |  |  |  |  |  |  |  | 
			
		
	
		
		
			
				
					
					|  |  |  |     if (x < dst_cols && y < dst_rows) |  |  |  |     if (x < dst_cols && y < dst_rows) | 
			
		
	
		
		
			
				
					
					|  |  |  |     { |  |  |  |     { | 
			
		
	
		
		
			
				
					
					|  |  |  |         int dst_index = mad24(y, dst_step, x * (int)sizeof(T) + dst_offset); |  |  |  |         int dst_index = mad24(y, dst_step, x * TSIZE + dst_offset); | 
			
				
				
			
		
	
		
		
	
		
		
			
				
					
					|  |  |  |         int map1_index = mad24(y, map1_step, x * (int)sizeof(short2) + map1_offset); |  |  |  |         int map1_index = mad24(y, map1_step, x * (int)sizeof(short2) + map1_offset); | 
			
		
	
		
		
			
				
					
					|  |  |  |         int map2_index = mad24(y, map2_step, x * (int)sizeof(ushort) + map2_offset); |  |  |  |         int map2_index = mad24(y, map2_step, x * (int)sizeof(ushort) + map2_offset); | 
			
		
	
		
		
			
				
					
					|  |  |  |  |  |  |  |  | 
			
		
	
	
		
		
			
				
					
					|  |  | @@ -249,11 +279,15 @@ __kernel void remap_16SC2_16UC1(__global const uchar * srcptr, int src_step, int | 
			
		
	
		
		
			
				
					
					|  |  |  |         int gx = gxy.x, gy = gxy.y; |  |  |  |         int gx = gxy.x, gy = gxy.y; | 
			
		
	
		
		
			
				
					
					|  |  |  |  |  |  |  |  | 
			
		
	
		
		
			
				
					
					|  |  |  |         if (NEED_EXTRAPOLATION(gx, gy)) |  |  |  |         if (NEED_EXTRAPOLATION(gx, gy)) | 
			
		
	
		
		
			
				
					
					|  |  |  |             EXTRAPOLATE(gxy, dst[0]) |  |  |  |         { | 
			
				
				
			
		
	
		
		
	
		
		
			
				
					
					|  |  |  |  |  |  |  |             T v; | 
			
		
	
		
		
			
				
					
					|  |  |  |  |  |  |  |             EXTRAPOLATE(gxy, v) | 
			
		
	
		
		
			
				
					
					|  |  |  |  |  |  |  |             storepix(v, dst); | 
			
		
	
		
		
			
				
					
					|  |  |  |  |  |  |  |         } | 
			
		
	
		
		
			
				
					
					|  |  |  |         else |  |  |  |         else | 
			
		
	
		
		
			
				
					
					|  |  |  |         { |  |  |  |         { | 
			
		
	
		
		
			
				
					
					|  |  |  |             int src_index = mad24(gy, src_step, gx * (int)sizeof(T) + src_offset); |  |  |  |             int src_index = mad24(gy, src_step, gx * TSIZE + src_offset); | 
			
				
				
			
		
	
		
		
			
				
					
					|  |  |  |             dst[0] = *((__global const T *)(srcptr + src_index)); |  |  |  |             storepix(loadpix((__global const T *)(srcptr + src_index)), dst); | 
			
				
				
			
		
	
		
		
	
		
		
	
		
		
			
				
					
					|  |  |  |         } |  |  |  |         } | 
			
		
	
		
		
			
				
					
					|  |  |  |     } |  |  |  |     } | 
			
		
	
		
		
			
				
					
					|  |  |  | } |  |  |  | } | 
			
		
	
	
		
		
			
				
					
					|  |  | @@ -264,14 +298,14 @@ __kernel void remap_16SC2_16UC1(__global const uchar * srcptr, int src_step, int | 
			
		
	
		
		
			
				
					
					|  |  |  |                                 __global uchar * dstptr, int dst_step, int dst_offset, int dst_rows, int dst_cols, |  |  |  |                                 __global uchar * dstptr, int dst_step, int dst_offset, int dst_rows, int dst_cols, | 
			
		
	
		
		
			
				
					
					|  |  |  |                                 __global const uchar * map1ptr, int map1_step, int map1_offset, |  |  |  |                                 __global const uchar * map1ptr, int map1_step, int map1_offset, | 
			
		
	
		
		
			
				
					
					|  |  |  |                                 __global const uchar * map2ptr, int map2_step, int map2_offset, |  |  |  |                                 __global const uchar * map2ptr, int map2_step, int map2_offset, | 
			
		
	
		
		
			
				
					
					|  |  |  |                                 T nVal) |  |  |  |                                 ST nVal) | 
			
				
				
			
		
	
		
		
	
		
		
			
				
					
					|  |  |  | { |  |  |  | { | 
			
		
	
		
		
			
				
					
					|  |  |  |     int x = get_global_id(0); |  |  |  |     int x = get_global_id(0); | 
			
		
	
		
		
			
				
					
					|  |  |  |     int y = get_global_id(1); |  |  |  |     int y = get_global_id(1); | 
			
		
	
		
		
			
				
					
					|  |  |  |  |  |  |  |  | 
			
		
	
		
		
			
				
					
					|  |  |  |     if (x < dst_cols && y < dst_rows) |  |  |  |     if (x < dst_cols && y < dst_rows) | 
			
		
	
		
		
			
				
					
					|  |  |  |     { |  |  |  |     { | 
			
		
	
		
		
			
				
					
					|  |  |  |         int dst_index = mad24(y, dst_step, x * (int)sizeof(T) + dst_offset); |  |  |  |         int dst_index = mad24(y, dst_step, x * TSIZE + dst_offset); | 
			
				
				
			
		
	
		
		
	
		
		
			
				
					
					|  |  |  |         int map1_index = mad24(y, map1_step, x * (int)sizeof(short2) + map1_offset); |  |  |  |         int map1_index = mad24(y, map1_step, x * (int)sizeof(short2) + map1_offset); | 
			
		
	
		
		
			
				
					
					|  |  |  |         int map2_index = mad24(y, map2_step, x * (int)sizeof(ushort) + map2_offset); |  |  |  |         int map2_index = mad24(y, map2_step, x * (int)sizeof(ushort) + map2_offset); | 
			
		
	
		
		
			
				
					
					|  |  |  |  |  |  |  |  | 
			
		
	
	
		
		
			
				
					
					|  |  | @@ -287,26 +321,26 @@ __kernel void remap_16SC2_16UC1(__global const uchar * srcptr, int src_step, int | 
			
		
	
		
		
			
				
					
					|  |  |  |         ushort map2Value = (ushort)(map2[0] & (INTER_TAB_SIZE2 - 1)); |  |  |  |         ushort map2Value = (ushort)(map2[0] & (INTER_TAB_SIZE2 - 1)); | 
			
		
	
		
		
			
				
					
					|  |  |  |         WT2 u = (WT2)(map2Value & (INTER_TAB_SIZE - 1), map2Value >> INTER_BITS) / (WT2)(INTER_TAB_SIZE); |  |  |  |         WT2 u = (WT2)(map2Value & (INTER_TAB_SIZE - 1), map2Value >> INTER_BITS) / (WT2)(INTER_TAB_SIZE); | 
			
		
	
		
		
			
				
					
					|  |  |  |  |  |  |  |  | 
			
		
	
		
		
			
				
					
					|  |  |  |         WT scalar = convertToWT(nVal); |  |  |  |         WT scalar = convertToWT(convertScalar(nVal)); | 
			
				
				
			
		
	
		
		
	
		
		
			
				
					
					|  |  |  |         WT a = scalar, b = scalar, c = scalar, d = scalar; |  |  |  |         WT a = scalar, b = scalar, c = scalar, d = scalar; | 
			
		
	
		
		
			
				
					
					|  |  |  |  |  |  |  |  | 
			
		
	
		
		
			
				
					
					|  |  |  |         if (!NEED_EXTRAPOLATION(map_dataA.x, map_dataA.y)) |  |  |  |         if (!NEED_EXTRAPOLATION(map_dataA.x, map_dataA.y)) | 
			
		
	
		
		
			
				
					
					|  |  |  |             a = convertToWT(*((__global const T *)(srcptr + mad24(map_dataA.y, src_step, map_dataA.x * (int)sizeof(T) + src_offset)))); |  |  |  |             a = convertToWT(loadpix((__global const T *)(srcptr + mad24(map_dataA.y, src_step, map_dataA.x * TSIZE + src_offset)))); | 
			
				
				
			
		
	
		
		
	
		
		
			
				
					
					|  |  |  |         else |  |  |  |         else | 
			
		
	
		
		
			
				
					
					|  |  |  |             EXTRAPOLATE(map_dataA, a); |  |  |  |             EXTRAPOLATE(map_dataA, a); | 
			
		
	
		
		
			
				
					
					|  |  |  |  |  |  |  |  | 
			
		
	
		
		
			
				
					
					|  |  |  |         if (!NEED_EXTRAPOLATION(map_dataB.x, map_dataB.y)) |  |  |  |         if (!NEED_EXTRAPOLATION(map_dataB.x, map_dataB.y)) | 
			
		
	
		
		
			
				
					
					|  |  |  |             b = convertToWT(*((__global const T *)(srcptr + mad24(map_dataB.y, src_step, map_dataB.x * (int)sizeof(T) + src_offset)))); |  |  |  |             b = convertToWT(loadpix((__global const T *)(srcptr + mad24(map_dataB.y, src_step, map_dataB.x * TSIZE + src_offset)))); | 
			
				
				
			
		
	
		
		
	
		
		
			
				
					
					|  |  |  |         else |  |  |  |         else | 
			
		
	
		
		
			
				
					
					|  |  |  |             EXTRAPOLATE(map_dataB, b); |  |  |  |             EXTRAPOLATE(map_dataB, b); | 
			
		
	
		
		
			
				
					
					|  |  |  |  |  |  |  |  | 
			
		
	
		
		
			
				
					
					|  |  |  |         if (!NEED_EXTRAPOLATION(map_dataC.x, map_dataC.y)) |  |  |  |         if (!NEED_EXTRAPOLATION(map_dataC.x, map_dataC.y)) | 
			
		
	
		
		
			
				
					
					|  |  |  |             c = convertToWT(*((__global const T *)(srcptr + mad24(map_dataC.y, src_step, map_dataC.x * (int)sizeof(T) + src_offset)))); |  |  |  |             c = convertToWT(loadpix((__global const T *)(srcptr + mad24(map_dataC.y, src_step, map_dataC.x * TSIZE + src_offset)))); | 
			
				
				
			
		
	
		
		
	
		
		
			
				
					
					|  |  |  |         else |  |  |  |         else | 
			
		
	
		
		
			
				
					
					|  |  |  |             EXTRAPOLATE(map_dataC, c); |  |  |  |             EXTRAPOLATE(map_dataC, c); | 
			
		
	
		
		
			
				
					
					|  |  |  |  |  |  |  |  | 
			
		
	
		
		
			
				
					
					|  |  |  |         if (!NEED_EXTRAPOLATION(map_dataD.x, map_dataD.y)) |  |  |  |         if (!NEED_EXTRAPOLATION(map_dataD.x, map_dataD.y)) | 
			
		
	
		
		
			
				
					
					|  |  |  |             d = convertToWT(*((__global const T *)(srcptr + mad24(map_dataD.y, src_step, map_dataD.x * (int)sizeof(T) + src_offset)))); |  |  |  |             d = convertToWT(loadpix((__global const T *)(srcptr + mad24(map_dataD.y, src_step, map_dataD.x * TSIZE + src_offset)))); | 
			
				
				
			
		
	
		
		
	
		
		
			
				
					
					|  |  |  |         else |  |  |  |         else | 
			
		
	
		
		
			
				
					
					|  |  |  |             EXTRAPOLATE(map_dataD, d); |  |  |  |             EXTRAPOLATE(map_dataD, d); | 
			
		
	
		
		
			
				
					
					|  |  |  |  |  |  |  |  | 
			
		
	
	
		
		
			
				
					
					|  |  | @@ -314,7 +348,7 @@ __kernel void remap_16SC2_16UC1(__global const uchar * srcptr, int src_step, int | 
			
		
	
		
		
			
				
					
					|  |  |  |                       b * (u.x)     * (1 - u.y) + |  |  |  |                       b * (u.x)     * (1 - u.y) + | 
			
		
	
		
		
			
				
					
					|  |  |  |                       c * (1 - u.x) * (u.y) + |  |  |  |                       c * (1 - u.x) * (u.y) + | 
			
		
	
		
		
			
				
					
					|  |  |  |                       d * (u.x)     * (u.y); |  |  |  |                       d * (u.x)     * (u.y); | 
			
		
	
		
		
			
				
					
					|  |  |  |         dst[0] = convertToT(dst_data); |  |  |  |         storepix(convertToT(dst_data), dst); | 
			
				
				
			
		
	
		
		
	
		
		
			
				
					
					|  |  |  |     } |  |  |  |     } | 
			
		
	
		
		
			
				
					
					|  |  |  | } |  |  |  | } | 
			
		
	
		
		
			
				
					
					|  |  |  |  |  |  |  |  | 
			
		
	
	
		
		
			
				
					
					|  |  | @@ -322,14 +356,14 @@ __kernel void remap_2_32FC1(__global const uchar * srcptr, int src_step, int src | 
			
		
	
		
		
			
				
					
					|  |  |  |                             __global uchar * dstptr, int dst_step, int dst_offset, int dst_rows, int dst_cols, |  |  |  |                             __global uchar * dstptr, int dst_step, int dst_offset, int dst_rows, int dst_cols, | 
			
		
	
		
		
			
				
					
					|  |  |  |                             __global const uchar * map1ptr, int map1_step, int map1_offset, |  |  |  |                             __global const uchar * map1ptr, int map1_step, int map1_offset, | 
			
		
	
		
		
			
				
					
					|  |  |  |                             __global const uchar * map2ptr, int map2_step, int map2_offset, |  |  |  |                             __global const uchar * map2ptr, int map2_step, int map2_offset, | 
			
		
	
		
		
			
				
					
					|  |  |  |                             T nVal) |  |  |  |                             ST nVal) | 
			
				
				
			
		
	
		
		
	
		
		
			
				
					
					|  |  |  | { |  |  |  | { | 
			
		
	
		
		
			
				
					
					|  |  |  |     int x = get_global_id(0); |  |  |  |     int x = get_global_id(0); | 
			
		
	
		
		
			
				
					
					|  |  |  |     int y = get_global_id(1); |  |  |  |     int y = get_global_id(1); | 
			
		
	
		
		
			
				
					
					|  |  |  |  |  |  |  |  | 
			
		
	
		
		
			
				
					
					|  |  |  |     if (x < dst_cols && y < dst_rows) |  |  |  |     if (x < dst_cols && y < dst_rows) | 
			
		
	
		
		
			
				
					
					|  |  |  |     { |  |  |  |     { | 
			
		
	
		
		
			
				
					
					|  |  |  |         int dst_index = mad24(y, dst_step, x * (int)sizeof(T) + dst_offset); |  |  |  |         int dst_index = mad24(y, dst_step, x * TSIZE + dst_offset); | 
			
				
				
			
		
	
		
		
	
		
		
			
				
					
					|  |  |  |         int map1_index = mad24(y, map1_step, x * (int)sizeof(float) + map1_offset); |  |  |  |         int map1_index = mad24(y, map1_step, x * (int)sizeof(float) + map1_offset); | 
			
		
	
		
		
			
				
					
					|  |  |  |         int map2_index = mad24(y, map2_step, x * (int)sizeof(float) + map2_offset); |  |  |  |         int map2_index = mad24(y, map2_step, x * (int)sizeof(float) + map2_offset); | 
			
		
	
		
		
			
				
					
					|  |  |  |  |  |  |  |  | 
			
		
	
	
		
		
			
				
					
					|  |  | @@ -346,26 +380,26 @@ __kernel void remap_2_32FC1(__global const uchar * srcptr, int src_step, int src | 
			
		
	
		
		
			
				
					
					|  |  |  |  |  |  |  |  | 
			
		
	
		
		
			
				
					
					|  |  |  |         float2 _u = map_data - convert_float2(map_dataA); |  |  |  |         float2 _u = map_data - convert_float2(map_dataA); | 
			
		
	
		
		
			
				
					
					|  |  |  |         WT2 u = convertToWT2(convert_int2_rte(convertToWT2(_u) * (WT2)INTER_TAB_SIZE)) / (WT2)INTER_TAB_SIZE; |  |  |  |         WT2 u = convertToWT2(convert_int2_rte(convertToWT2(_u) * (WT2)INTER_TAB_SIZE)) / (WT2)INTER_TAB_SIZE; | 
			
		
	
		
		
			
				
					
					|  |  |  |         WT scalar = convertToWT(nVal); |  |  |  |         WT scalar = convertToWT(convertScalar(nVal)); | 
			
				
				
			
		
	
		
		
	
		
		
			
				
					
					|  |  |  |         WT a = scalar, b = scalar, c = scalar, d = scalar; |  |  |  |         WT a = scalar, b = scalar, c = scalar, d = scalar; | 
			
		
	
		
		
			
				
					
					|  |  |  |  |  |  |  |  | 
			
		
	
		
		
			
				
					
					|  |  |  |         if (!NEED_EXTRAPOLATION(map_dataA.x, map_dataA.y)) |  |  |  |         if (!NEED_EXTRAPOLATION(map_dataA.x, map_dataA.y)) | 
			
		
	
		
		
			
				
					
					|  |  |  |             a = convertToWT(*((__global const T *)(srcptr + mad24(map_dataA.y, src_step, map_dataA.x * (int)sizeof(T) + src_offset)))); |  |  |  |             a = convertToWT(loadpix((__global const T *)(srcptr + mad24(map_dataA.y, src_step, map_dataA.x * TSIZE + src_offset)))); | 
			
				
				
			
		
	
		
		
	
		
		
			
				
					
					|  |  |  |         else |  |  |  |         else | 
			
		
	
		
		
			
				
					
					|  |  |  |             EXTRAPOLATE(map_dataA, a); |  |  |  |             EXTRAPOLATE(map_dataA, a); | 
			
		
	
		
		
			
				
					
					|  |  |  |  |  |  |  |  | 
			
		
	
		
		
			
				
					
					|  |  |  |         if (!NEED_EXTRAPOLATION(map_dataB.x, map_dataB.y)) |  |  |  |         if (!NEED_EXTRAPOLATION(map_dataB.x, map_dataB.y)) | 
			
		
	
		
		
			
				
					
					|  |  |  |             b = convertToWT(*((__global const T *)(srcptr + mad24(map_dataB.y, src_step, map_dataB.x * (int)sizeof(T) + src_offset)))); |  |  |  |             b = convertToWT(loadpix((__global const T *)(srcptr + mad24(map_dataB.y, src_step, map_dataB.x * TSIZE + src_offset)))); | 
			
				
				
			
		
	
		
		
	
		
		
			
				
					
					|  |  |  |         else |  |  |  |         else | 
			
		
	
		
		
			
				
					
					|  |  |  |             EXTRAPOLATE(map_dataB, b); |  |  |  |             EXTRAPOLATE(map_dataB, b); | 
			
		
	
		
		
			
				
					
					|  |  |  |  |  |  |  |  | 
			
		
	
		
		
			
				
					
					|  |  |  |         if (!NEED_EXTRAPOLATION(map_dataC.x, map_dataC.y)) |  |  |  |         if (!NEED_EXTRAPOLATION(map_dataC.x, map_dataC.y)) | 
			
		
	
		
		
			
				
					
					|  |  |  |             c = convertToWT(*((__global const T *)(srcptr + mad24(map_dataC.y, src_step, map_dataC.x * (int)sizeof(T) + src_offset)))); |  |  |  |             c = convertToWT(loadpix((__global const T *)(srcptr + mad24(map_dataC.y, src_step, map_dataC.x * TSIZE + src_offset)))); | 
			
				
				
			
		
	
		
		
	
		
		
			
				
					
					|  |  |  |         else |  |  |  |         else | 
			
		
	
		
		
			
				
					
					|  |  |  |             EXTRAPOLATE(map_dataC, c); |  |  |  |             EXTRAPOLATE(map_dataC, c); | 
			
		
	
		
		
			
				
					
					|  |  |  |  |  |  |  |  | 
			
		
	
		
		
			
				
					
					|  |  |  |         if (!NEED_EXTRAPOLATION(map_dataD.x, map_dataD.y)) |  |  |  |         if (!NEED_EXTRAPOLATION(map_dataD.x, map_dataD.y)) | 
			
		
	
		
		
			
				
					
					|  |  |  |             d = convertToWT(*((__global const T *)(srcptr + mad24(map_dataD.y, src_step, map_dataD.x * (int)sizeof(T) + src_offset)))); |  |  |  |             d = convertToWT(loadpix((__global const T *)(srcptr + mad24(map_dataD.y, src_step, map_dataD.x * TSIZE + src_offset)))); | 
			
				
				
			
		
	
		
		
	
		
		
			
				
					
					|  |  |  |         else |  |  |  |         else | 
			
		
	
		
		
			
				
					
					|  |  |  |             EXTRAPOLATE(map_dataD, d); |  |  |  |             EXTRAPOLATE(map_dataD, d); | 
			
		
	
		
		
			
				
					
					|  |  |  |  |  |  |  |  | 
			
		
	
	
		
		
			
				
					
					|  |  | @@ -373,21 +407,21 @@ __kernel void remap_2_32FC1(__global const uchar * srcptr, int src_step, int src | 
			
		
	
		
		
			
				
					
					|  |  |  |                       b * (u.x)     * (1 - u.y) + |  |  |  |                       b * (u.x)     * (1 - u.y) + | 
			
		
	
		
		
			
				
					
					|  |  |  |                       c * (1 - u.x) * (u.y) + |  |  |  |                       c * (1 - u.x) * (u.y) + | 
			
		
	
		
		
			
				
					
					|  |  |  |                       d * (u.x)     * (u.y); |  |  |  |                       d * (u.x)     * (u.y); | 
			
		
	
		
		
			
				
					
					|  |  |  |         dst[0] = convertToT(dst_data); |  |  |  |         storepix(convertToT(dst_data), dst); | 
			
				
				
			
		
	
		
		
	
		
		
			
				
					
					|  |  |  |     } |  |  |  |     } | 
			
		
	
		
		
			
				
					
					|  |  |  | } |  |  |  | } | 
			
		
	
		
		
			
				
					
					|  |  |  |  |  |  |  |  | 
			
		
	
		
		
			
				
					
					|  |  |  | __kernel void remap_32FC2(__global const uchar * srcptr, int src_step, int src_offset, int src_rows, int src_cols, |  |  |  | __kernel void remap_32FC2(__global const uchar * srcptr, int src_step, int src_offset, int src_rows, int src_cols, | 
			
		
	
		
		
			
				
					
					|  |  |  |                           __global uchar * dstptr, int dst_step, int dst_offset, int dst_rows, int dst_cols, |  |  |  |                           __global uchar * dstptr, int dst_step, int dst_offset, int dst_rows, int dst_cols, | 
			
		
	
		
		
			
				
					
					|  |  |  |                           __global const uchar * mapptr, int map_step, int map_offset, |  |  |  |                           __global const uchar * mapptr, int map_step, int map_offset, | 
			
		
	
		
		
			
				
					
					|  |  |  |                           T nVal) |  |  |  |                           ST nVal) | 
			
				
				
			
		
	
		
		
	
		
		
			
				
					
					|  |  |  | { |  |  |  | { | 
			
		
	
		
		
			
				
					
					|  |  |  |     int x = get_global_id(0); |  |  |  |     int x = get_global_id(0); | 
			
		
	
		
		
			
				
					
					|  |  |  |     int y = get_global_id(1); |  |  |  |     int y = get_global_id(1); | 
			
		
	
		
		
			
				
					
					|  |  |  |  |  |  |  |  | 
			
		
	
		
		
			
				
					
					|  |  |  |     if (x < dst_cols && y < dst_rows) |  |  |  |     if (x < dst_cols && y < dst_rows) | 
			
		
	
		
		
			
				
					
					|  |  |  |     { |  |  |  |     { | 
			
		
	
		
		
			
				
					
					|  |  |  |         int dst_index = mad24(y, dst_step, x * (int)sizeof(T) + dst_offset); |  |  |  |         int dst_index = mad24(y, dst_step, x * TSIZE + dst_offset); | 
			
				
				
			
		
	
		
		
	
		
		
			
				
					
					|  |  |  |         int map_index = mad24(y, map_step, x * (int)sizeof(float2) + map_offset); |  |  |  |         int map_index = mad24(y, map_step, x * (int)sizeof(float2) + map_offset); | 
			
		
	
		
		
			
				
					
					|  |  |  |  |  |  |  |  | 
			
		
	
		
		
			
				
					
					|  |  |  |         __global const float2 * map = (__global const float2 *)(mapptr + map_index); |  |  |  |         __global const float2 * map = (__global const float2 *)(mapptr + map_index); | 
			
		
	
	
		
		
			
				
					
					|  |  | @@ -401,26 +435,26 @@ __kernel void remap_32FC2(__global const uchar * srcptr, int src_step, int src_o | 
			
		
	
		
		
			
				
					
					|  |  |  |  |  |  |  |  | 
			
		
	
		
		
			
				
					
					|  |  |  |         float2 _u = map_data - convert_float2(map_dataA); |  |  |  |         float2 _u = map_data - convert_float2(map_dataA); | 
			
		
	
		
		
			
				
					
					|  |  |  |         WT2 u = convertToWT2(convert_int2_rte(convertToWT2(_u) * (WT2)INTER_TAB_SIZE)) / (WT2)INTER_TAB_SIZE; |  |  |  |         WT2 u = convertToWT2(convert_int2_rte(convertToWT2(_u) * (WT2)INTER_TAB_SIZE)) / (WT2)INTER_TAB_SIZE; | 
			
		
	
		
		
			
				
					
					|  |  |  |         WT scalar = convertToWT(nVal); |  |  |  |         WT scalar = convertToWT(convertScalar(nVal)); | 
			
				
				
			
		
	
		
		
	
		
		
			
				
					
					|  |  |  |         WT a = scalar, b = scalar, c = scalar, d = scalar; |  |  |  |         WT a = scalar, b = scalar, c = scalar, d = scalar; | 
			
		
	
		
		
			
				
					
					|  |  |  |  |  |  |  |  | 
			
		
	
		
		
			
				
					
					|  |  |  |         if (!NEED_EXTRAPOLATION(map_dataA.x, map_dataA.y)) |  |  |  |         if (!NEED_EXTRAPOLATION(map_dataA.x, map_dataA.y)) | 
			
		
	
		
		
			
				
					
					|  |  |  |             a = convertToWT(*((__global const T *)(srcptr + mad24(map_dataA.y, src_step, map_dataA.x * (int)sizeof(T) + src_offset)))); |  |  |  |             a = convertToWT(loadpix((__global const T *)(srcptr + mad24(map_dataA.y, src_step, map_dataA.x * TSIZE + src_offset)))); | 
			
				
				
			
		
	
		
		
	
		
		
			
				
					
					|  |  |  |         else |  |  |  |         else | 
			
		
	
		
		
			
				
					
					|  |  |  |             EXTRAPOLATE(map_dataA, a); |  |  |  |             EXTRAPOLATE(map_dataA, a); | 
			
		
	
		
		
			
				
					
					|  |  |  |  |  |  |  |  | 
			
		
	
		
		
			
				
					
					|  |  |  |         if (!NEED_EXTRAPOLATION(map_dataB.x, map_dataB.y)) |  |  |  |         if (!NEED_EXTRAPOLATION(map_dataB.x, map_dataB.y)) | 
			
		
	
		
		
			
				
					
					|  |  |  |             b = convertToWT(*((__global const T *)(srcptr + mad24(map_dataB.y, src_step, map_dataB.x * (int)sizeof(T) + src_offset)))); |  |  |  |             b = convertToWT(loadpix((__global const T *)(srcptr + mad24(map_dataB.y, src_step, map_dataB.x * TSIZE + src_offset)))); | 
			
				
				
			
		
	
		
		
	
		
		
			
				
					
					|  |  |  |         else |  |  |  |         else | 
			
		
	
		
		
			
				
					
					|  |  |  |             EXTRAPOLATE(map_dataB, b); |  |  |  |             EXTRAPOLATE(map_dataB, b); | 
			
		
	
		
		
			
				
					
					|  |  |  |  |  |  |  |  | 
			
		
	
		
		
			
				
					
					|  |  |  |         if (!NEED_EXTRAPOLATION(map_dataC.x, map_dataC.y)) |  |  |  |         if (!NEED_EXTRAPOLATION(map_dataC.x, map_dataC.y)) | 
			
		
	
		
		
			
				
					
					|  |  |  |             c = convertToWT(*((__global const T *)(srcptr + mad24(map_dataC.y, src_step, map_dataC.x * (int)sizeof(T) + src_offset)))); |  |  |  |             c = convertToWT(loadpix((__global const T *)(srcptr + mad24(map_dataC.y, src_step, map_dataC.x * TSIZE + src_offset)))); | 
			
				
				
			
		
	
		
		
	
		
		
			
				
					
					|  |  |  |         else |  |  |  |         else | 
			
		
	
		
		
			
				
					
					|  |  |  |             EXTRAPOLATE(map_dataC, c); |  |  |  |             EXTRAPOLATE(map_dataC, c); | 
			
		
	
		
		
			
				
					
					|  |  |  |  |  |  |  |  | 
			
		
	
		
		
			
				
					
					|  |  |  |         if (!NEED_EXTRAPOLATION(map_dataD.x, map_dataD.y)) |  |  |  |         if (!NEED_EXTRAPOLATION(map_dataD.x, map_dataD.y)) | 
			
		
	
		
		
			
				
					
					|  |  |  |             d = convertToWT(*((__global const T *)(srcptr + mad24(map_dataD.y, src_step, map_dataD.x * (int)sizeof(T) + src_offset)))); |  |  |  |             d = convertToWT(loadpix((__global const T *)(srcptr + mad24(map_dataD.y, src_step, map_dataD.x * TSIZE + src_offset)))); | 
			
				
				
			
		
	
		
		
	
		
		
			
				
					
					|  |  |  |         else |  |  |  |         else | 
			
		
	
		
		
			
				
					
					|  |  |  |             EXTRAPOLATE(map_dataD, d); |  |  |  |             EXTRAPOLATE(map_dataD, d); | 
			
		
	
		
		
			
				
					
					|  |  |  |  |  |  |  |  | 
			
		
	
	
		
		
			
				
					
					|  |  | @@ -428,7 +462,7 @@ __kernel void remap_32FC2(__global const uchar * srcptr, int src_step, int src_o | 
			
		
	
		
		
			
				
					
					|  |  |  |                       b * (u.x)     * (1 - u.y) + |  |  |  |                       b * (u.x)     * (1 - u.y) + | 
			
		
	
		
		
			
				
					
					|  |  |  |                       c * (1 - u.x) * (u.y) + |  |  |  |                       c * (1 - u.x) * (u.y) + | 
			
		
	
		
		
			
				
					
					|  |  |  |                       d * (u.x)     * (u.y); |  |  |  |                       d * (u.x)     * (u.y); | 
			
		
	
		
		
			
				
					
					|  |  |  |         dst[0] = convertToT(dst_data); |  |  |  |         storepix(convertToT(dst_data), dst); | 
			
				
				
			
		
	
		
		
	
		
		
			
				
					
					|  |  |  |     } |  |  |  |     } | 
			
		
	
		
		
			
				
					
					|  |  |  | } |  |  |  | } | 
			
		
	
		
		
			
				
					
					|  |  |  |  |  |  |  |  | 
			
		
	
	
		
		
			
				
					
					|  |  |   |