1#include <clc/clc.h>
2#include "../clcmacro.h"
3
4_CLC_OVERLOAD _CLC_DEF char mad_sat(char x, char y, char z) {
5  return clamp((short)mad24((short)x, (short)y, (short)z), (short)CHAR_MIN, (short) CHAR_MAX);
6}
7
8_CLC_OVERLOAD _CLC_DEF uchar mad_sat(uchar x, uchar y, uchar z) {
9  return clamp((ushort)mad24((ushort)x, (ushort)y, (ushort)z), (ushort)0, (ushort) UCHAR_MAX);
10}
11
12_CLC_OVERLOAD _CLC_DEF short mad_sat(short x, short y, short z) {
13  return clamp((int)mad24((int)x, (int)y, (int)z), (int)SHRT_MIN, (int) SHRT_MAX);
14}
15
16_CLC_OVERLOAD _CLC_DEF ushort mad_sat(ushort x, ushort y, ushort z) {
17  return clamp((uint)mad24((uint)x, (uint)y, (uint)z), (uint)0, (uint) USHRT_MAX);
18}
19
20_CLC_OVERLOAD _CLC_DEF int mad_sat(int x, int y, int z) {
21  int mhi = mul_hi(x, y);
22  uint mlo = x * y;
23  long m = upsample(mhi, mlo);
24  m += z;
25  if (m > INT_MAX)
26    return INT_MAX;
27  if (m < INT_MIN)
28    return INT_MIN;
29  return m;
30}
31
32_CLC_OVERLOAD _CLC_DEF uint mad_sat(uint x, uint y, uint z) {
33  if (mul_hi(x, y) != 0)
34    return UINT_MAX;
35  return add_sat(x * y, z);
36}
37
38_CLC_OVERLOAD _CLC_DEF long mad_sat(long x, long y, long z) {
39  long hi = mul_hi(x, y);
40  ulong ulo = x * y;
41  long  slo = x * y;
42  /* Big overflow of more than 2 bits, add can't fix this */
43  if (((x < 0) == (y < 0)) && hi != 0)
44    return LONG_MAX;
45  /* Low overflow in mul and z not neg enough to correct it */
46  if (hi == 0 && ulo >= LONG_MAX && (z > 0 || (ulo + z) > LONG_MAX))
47    return LONG_MAX;
48  /* Big overflow of more than 2 bits, add can't fix this */
49  if (((x < 0) != (y < 0)) && hi != -1)
50    return LONG_MIN;
51  /* Low overflow in mul and z not pos enough to correct it */
52  if (hi == -1 && ulo <= ((ulong)LONG_MAX + 1UL) && (z < 0 || z < (LONG_MAX - ulo)))
53    return LONG_MIN;
54  /* We have checked all conditions, any overflow in addition returns
55   * the correct value */
56  return ulo + z;
57}
58
59_CLC_OVERLOAD _CLC_DEF ulong mad_sat(ulong x, ulong y, ulong z) {
60  if (mul_hi(x, y) != 0)
61    return ULONG_MAX;
62  return add_sat(x * y, z);
63}
64
65_CLC_TERNARY_VECTORIZE(_CLC_OVERLOAD _CLC_DEF, char, mad_sat, char, char, char)
66_CLC_TERNARY_VECTORIZE(_CLC_OVERLOAD _CLC_DEF, uchar, mad_sat, uchar, uchar, uchar)
67_CLC_TERNARY_VECTORIZE(_CLC_OVERLOAD _CLC_DEF, short, mad_sat, short, short, short)
68_CLC_TERNARY_VECTORIZE(_CLC_OVERLOAD _CLC_DEF, ushort, mad_sat, ushort, ushort, ushort)
69_CLC_TERNARY_VECTORIZE(_CLC_OVERLOAD _CLC_DEF, int, mad_sat, int, int, int)
70_CLC_TERNARY_VECTORIZE(_CLC_OVERLOAD _CLC_DEF, uint, mad_sat, uint, uint, uint)
71_CLC_TERNARY_VECTORIZE(_CLC_OVERLOAD _CLC_DEF, long, mad_sat, long, long, long)
72_CLC_TERNARY_VECTORIZE(_CLC_OVERLOAD _CLC_DEF, ulong, mad_sat, ulong, ulong, ulong)
73