1#include <clc/clc.h> 2#include "../clcmacro.h" 3 4_CLC_OVERLOAD _CLC_DEF char mad_sat(char x, char y, char z) { 5 return clamp((short)mad24((short)x, (short)y, (short)z), (short)CHAR_MIN, (short) CHAR_MAX); 6} 7 8_CLC_OVERLOAD _CLC_DEF uchar mad_sat(uchar x, uchar y, uchar z) { 9 return clamp((ushort)mad24((ushort)x, (ushort)y, (ushort)z), (ushort)0, (ushort) UCHAR_MAX); 10} 11 12_CLC_OVERLOAD _CLC_DEF short mad_sat(short x, short y, short z) { 13 return clamp((int)mad24((int)x, (int)y, (int)z), (int)SHRT_MIN, (int) SHRT_MAX); 14} 15 16_CLC_OVERLOAD _CLC_DEF ushort mad_sat(ushort x, ushort y, ushort z) { 17 return clamp((uint)mad24((uint)x, (uint)y, (uint)z), (uint)0, (uint) USHRT_MAX); 18} 19 20_CLC_OVERLOAD _CLC_DEF int mad_sat(int x, int y, int z) { 21 int mhi = mul_hi(x, y); 22 uint mlo = x * y; 23 long m = upsample(mhi, mlo); 24 m += z; 25 if (m > INT_MAX) 26 return INT_MAX; 27 if (m < INT_MIN) 28 return INT_MIN; 29 return m; 30} 31 32_CLC_OVERLOAD _CLC_DEF uint mad_sat(uint x, uint y, uint z) { 33 if (mul_hi(x, y) != 0) 34 return UINT_MAX; 35 return add_sat(x * y, z); 36} 37 38_CLC_OVERLOAD _CLC_DEF long mad_sat(long x, long y, long z) { 39 long hi = mul_hi(x, y); 40 ulong ulo = x * y; 41 long slo = x * y; 42 /* Big overflow of more than 2 bits, add can't fix this */ 43 if (((x < 0) == (y < 0)) && hi != 0) 44 return LONG_MAX; 45 /* Low overflow in mul and z not neg enough to correct it */ 46 if (hi == 0 && ulo >= LONG_MAX && (z > 0 || (ulo + z) > LONG_MAX)) 47 return LONG_MAX; 48 /* Big overflow of more than 2 bits, add can't fix this */ 49 if (((x < 0) != (y < 0)) && hi != -1) 50 return LONG_MIN; 51 /* Low overflow in mul and z not pos enough to correct it */ 52 if (hi == -1 && ulo <= ((ulong)LONG_MAX + 1UL) && (z < 0 || z < (LONG_MAX - ulo))) 53 return LONG_MIN; 54 /* We have checked all conditions, any overflow in addition returns 55 * the correct value */ 56 return ulo + z; 57} 58 59_CLC_OVERLOAD _CLC_DEF ulong mad_sat(ulong x, ulong y, ulong z) { 60 if (mul_hi(x, y) != 0) 61 return ULONG_MAX; 62 return add_sat(x * y, z); 63} 64 65_CLC_TERNARY_VECTORIZE(_CLC_OVERLOAD _CLC_DEF, char, mad_sat, char, char, char) 66_CLC_TERNARY_VECTORIZE(_CLC_OVERLOAD _CLC_DEF, uchar, mad_sat, uchar, uchar, uchar) 67_CLC_TERNARY_VECTORIZE(_CLC_OVERLOAD _CLC_DEF, short, mad_sat, short, short, short) 68_CLC_TERNARY_VECTORIZE(_CLC_OVERLOAD _CLC_DEF, ushort, mad_sat, ushort, ushort, ushort) 69_CLC_TERNARY_VECTORIZE(_CLC_OVERLOAD _CLC_DEF, int, mad_sat, int, int, int) 70_CLC_TERNARY_VECTORIZE(_CLC_OVERLOAD _CLC_DEF, uint, mad_sat, uint, uint, uint) 71_CLC_TERNARY_VECTORIZE(_CLC_OVERLOAD _CLC_DEF, long, mad_sat, long, long, long) 72_CLC_TERNARY_VECTORIZE(_CLC_OVERLOAD _CLC_DEF, ulong, mad_sat, ulong, ulong, ulong) 73