#include "ref.h"
// Lane-wise add of the four signed bytes packed in x and y.
// Each byte is sign-extended, the pair is summed, and the sum is passed
// through ref_sat_n(..., 8) (declared elsewhere; presumably clamps to the
// signed 8-bit range). The four results are re-packed into one word.
q31_t ref__QADD8(q31_t x, q31_t y)
{
    q7_t xByte0 = (q7_t) x;
    q7_t yByte0 = (q7_t) y;
    q7_t lane0, lane1, lane2, lane3;

    // Shift-left-then-right sign-extends the byte that sits at bits 15:8,
    // 23:16 and 31:24 respectively.
    lane0 = ref_sat_n((q31_t) (xByte0 + yByte0), 8);
    lane1 = ref_sat_n((q31_t) (((x << 16) >> 24) + ((y << 16) >> 24)), 8);
    lane2 = ref_sat_n((q31_t) (((x << 8) >> 24) + ((y << 8) >> 24)), 8);
    lane3 = ref_sat_n((q31_t) ((x >> 24) + (y >> 24)), 8);

    // Masks strip the sign-extension bits so lanes do not bleed into each other.
    return (((q31_t) lane3 << 24) & 0xFF000000) |
           (((q31_t) lane2 << 16) & 0x00FF0000) |
           (((q31_t) lane1 << 8) & 0x0000FF00) |
           (lane0 & 0x000000FF);
}
// Lane-wise subtract (x - y) of the four signed bytes packed in x and y.
// Each difference is passed through ref_sat_n(..., 8) (declared elsewhere;
// presumably clamps to the signed 8-bit range) and moved back to its byte
// position before the lanes are merged.
q31_t ref__QSUB8(q31_t x, q31_t y)
{
    q31_t xByte0 = (q7_t) x;
    q31_t yByte0 = (q7_t) y;
    q31_t lane0, lane1, lane2, lane3;

    lane0 = ref_sat_n((xByte0 - yByte0), 8);
    lane1 = ref_sat_n((q31_t) (((x << 16) >> 24) - ((y << 16) >> 24)), 8) << 8;
    lane2 = ref_sat_n((q31_t) (((x << 8) >> 24) - ((y << 8) >> 24)), 8) << 16;
    lane3 = ref_sat_n((q31_t) ((x >> 24) - (y >> 24)), 8) << 24;

    // Each lane is already in position; the masks drop sign-extension bits.
    return (lane3 & 0xFF000000) | (lane2 & 0x00FF0000) |
           (lane1 & 0x0000FF00) | (lane0 & 0x000000FF);
}
// Lane-wise add of the two signed halfwords packed in x and y.
// Each sum goes through ref_sat_q15 (declared elsewhere; presumably clamps
// to the signed 16-bit range) before the halves are re-packed.
q31_t ref__QADD16(q31_t x, q31_t y)
{
    q31_t xLow = (q15_t) x;
    q31_t yLow = (q15_t) y;
    q31_t low, high;

    low = ref_sat_q15(xLow + yLow);
    high = (q31_t)ref_sat_q15((q31_t) ((x >> 16) + (y >> 16))) << 16;

    return (high & 0xFFFF0000) | (low & 0x0000FFFF);
}
// Lane-wise halving add of the two signed halfwords packed in x and y:
// each lane holds (a + b) >> 1, computed at full width so the sum cannot
// overflow before it is halved.
q31_t ref__SHADD16(q31_t x, q31_t y)
{
    q31_t xLow = (q15_t) x;
    q31_t yLow = (q15_t) y;
    q31_t low, high;

    low = (xLow + yLow) >> 1;
    high = ((q31_t) (((x >> 16) + (y >> 16)) >> 1) << 16);

    return (high & 0xFFFF0000) | (low & 0x0000FFFF);
}
// Lane-wise subtract (x - y) of the two signed halfwords packed in x and y.
// Each difference goes through ref_sat_q15 (declared elsewhere; presumably
// clamps to the signed 16-bit range) before the halves are re-packed.
q31_t ref__QSUB16(q31_t x, q31_t y)
{
    q31_t xLow = (q15_t) x;
    q31_t yLow = (q15_t) y;
    q31_t low, high;

    low = ref_sat_q15(xLow - yLow);
    high = (q31_t)ref_sat_q15((q31_t) ((x >> 16) - (y >> 16))) << 16;

    return (high & 0xFFFF0000) | (low & 0x0000FFFF);
}
// Lane-wise halving subtract of the two signed halfwords packed in x and y:
// each lane holds (a - b) >> 1.
//
// The difference is formed at full width first and only then halved.
// Halving the operands individually ((a >> 1) - (b >> 1)) discards each
// operand's low bit before the subtraction and is off by one whenever a is
// even and b is odd (e.g. 0 - 1 must give 0xFFFF, not 0x0000).
// This mirrors how ref__SHADD16 halves the full-width sum.
//
// Relies on >> of a negative value being an arithmetic shift, as the rest of
// this file does.
q31_t ref__SHSUB16(q31_t x, q31_t y)
{
    q31_t diff;
    q31_t r, s;

    // Sign-extended low halfwords.
    r = (q15_t) x;
    s = (q15_t) y;

    // Low lane: subtract, then halve.
    r = (r - s) >> 1;
    // High lane: same on the sign-extended top halfwords, moved back to bits 31:16.
    s = ((q31_t) (((x >> 16) - (y >> 16)) >> 1) << 16);

    diff = (s & 0xFFFF0000) | (r & 0x0000FFFF);
    return diff;
}
// Exchange-style add/subtract on packed halfwords:
//   top halfword    = ref_sat_q15(x.high + y.low)
//   bottom halfword = ref_sat_q15(x.low  - y.high)
// ref_sat_q15 is declared elsewhere; presumably clamps to the signed 16-bit range.
q31_t ref__QASX(q31_t x, q31_t y)
{
    // Sign-extended bottom halfwords.
    q31_t xLow = (q15_t)(x & 0xffff);
    q31_t yLow = (q15_t)(y & 0xffff);
    // Sign-extended top halfwords.
    q31_t xHigh = (q15_t)(x >> 16);
    q31_t yHigh = (q15_t)(y >> 16);
    q31_t top, bottom;

    top = ((q31_t)ref_sat_q15(xHigh + yLow)) << 16;
    bottom = ((q31_t)ref_sat_q15(xLow - yHigh)) & 0xffff;

    return top | bottom;
}
// Halving exchange-style add/subtract on packed halfwords:
//   top halfword    = (x.high + y.low)  >> 1
//   bottom halfword = (x.low  - y.high) >> 1
//
// Both lanes are halved with an arithmetic right shift, the same way
// ref__SHADD16 halves its sums. Using "/ 2" for the bottom lane rounds
// toward zero, which gives the wrong result for negative odd differences
// (e.g. 0 - 1 must give 0xFFFF, not 0x0000).
//
// Relies on >> of a negative value being an arithmetic shift, as the rest of
// this file does.
q31_t ref__SHASX(q31_t x, q31_t y)
{
    q31_t sum;
    q31_t r, s;

    // Sign-extended low halfwords.
    r = (q15_t) x;
    s = (q15_t) y;

    // Bottom lane: x.low - y.high, halved.
    r = (r - (y >> 16)) >> 1;
    // Top lane: x.high + y.low, halved, then moved back to bits 31:16.
    s = ((q31_t) (((x >> 16) + s) >> 1) << 16);

    sum = (s & 0xFFFF0000) | (r & 0x0000FFFF);
    return sum;
}
// Exchange-style subtract/add on packed halfwords:
//   top halfword    = ref_sat_q15(x.high - y.low)
//   bottom halfword = ref_sat_q15(x.low  + y.high)
// ref_sat_q15 is declared elsewhere; presumably clamps to the signed 16-bit range.
q31_t ref__QSAX(q31_t x, q31_t y)
{
    // Sign-extended bottom halfwords.
    q31_t xLow = (q15_t)(x & 0xffff);
    q31_t yLow = (q15_t)(y & 0xffff);
    // Sign-extended top halfwords.
    q31_t xHigh = (q15_t)(x >> 16);
    q31_t yHigh = (q15_t)(y >> 16);
    q31_t top, bottom;

    top = ((q31_t)ref_sat_q15(xHigh - yLow)) << 16;
    bottom = ((q31_t)ref_sat_q15(xLow + yHigh)) & 0xffff;

    return top | bottom;
}
// Halving exchange-style subtract/add on packed halfwords:
//   top halfword    = (x.high - y.low)  >> 1
//   bottom halfword = (x.low  + y.high) >> 1
//
// Both lanes are halved with an arithmetic right shift, the same way
// ref__SHADD16 halves its sums. Using "/ 2" for the bottom lane rounds
// toward zero, which gives the wrong result for negative odd sums
// (e.g. -1 + 0 must give 0xFFFF, not 0x0000).
//
// Relies on >> of a negative value being an arithmetic shift, as the rest of
// this file does.
q31_t ref__SHSAX(q31_t x, q31_t y)
{
    q31_t sum;
    q31_t r, s;

    // Sign-extended low halfwords.
    r = (q15_t) x;
    s = (q15_t) y;

    // Bottom lane: x.low + y.high, halved.
    r = (r + (y >> 16)) >> 1;
    // Top lane: x.high - y.low, halved, then moved back to bits 31:16.
    s = ((q31_t) (((x >> 16) - s) >> 1) << 16);

    sum = (s & 0xFFFF0000) | (r & 0x0000FFFF);
    return sum;
}
// Cross-multiplies the signed halfwords of x and y and returns
// (x.low * y.high) - (x.high * y.low).
q31_t ref__SMUSDX(q31_t x, q31_t y)
{
    q15_t xLow = (q15_t) x;
    q15_t xHigh = (q15_t) (x >> 16);
    q15_t yLow = (q15_t) y;
    q15_t yHigh = (q15_t) (y >> 16);

    return (q31_t) ((xLow * yHigh) - (xHigh * yLow));
}
// Cross-multiplies the signed halfwords of x and y and returns
// (x.low * y.high) + (x.high * y.low).
q31_t ref__SMUADX(q31_t x, q31_t y)
{
    q15_t xLow = (q15_t) x;
    q15_t xHigh = (q15_t) (x >> 16);
    q15_t yLow = (q15_t) y;
    q15_t yHigh = (q15_t) (y >> 16);

    return (q31_t) ((xLow * yHigh) + (xHigh * yLow));
}
// Adds x and y in 64-bit precision and hands the wide sum to ref_sat_q31
// (declared elsewhere; presumably clamps to the signed 32-bit range).
q31_t ref__QADD(q31_t x, q31_t y)
{
    q63_t wide = (q63_t) x;

    wide += y;
    return ref_sat_q31(wide);
}
// Computes x - y in 64-bit precision and hands the wide difference to
// ref_sat_q31 (declared elsewhere; presumably clamps to the signed 32-bit range).
q31_t ref__QSUB(q31_t x, q31_t y)
{
    q63_t wide = (q63_t) x;

    wide -= y;
    return ref_sat_q31(wide);
}
// Dual multiply-accumulate on signed halfwords:
// returns sum + (x.high * y.high) + (x.low * y.low).
q31_t ref__SMLAD(q31_t x, q31_t y, q31_t sum)
{
    q15_t xLow = (q15_t) x;
    q15_t xHigh = (q15_t) (x >> 16);
    q15_t yLow = (q15_t) y;
    q15_t yHigh = (q15_t) (y >> 16);

    return (sum + (xHigh * yHigh) + (xLow * yLow));
}
// Dual multiply-accumulate with the halfwords of y exchanged:
// returns sum + (x.high * y.low) + (x.low * y.high).
q31_t ref__SMLADX(q31_t x, q31_t y, q31_t sum)
{
    q15_t xLow = (q15_t) x;
    q15_t xHigh = (q15_t) (x >> 16);
    q15_t yLow = (q15_t) (y);
    q15_t yHigh = (q15_t) (y >> 16);

    return (sum + (xHigh * yLow) + (xLow * yHigh));
}
// Dual multiply-subtract-accumulate with the halfwords of y exchanged:
// returns sum - (x.high * y.low) + (x.low * y.high).
q31_t ref__SMLSDX(q31_t x, q31_t y, q31_t sum)
{
    q15_t xLow = (q15_t) x;
    q15_t xHigh = (q15_t) (x >> 16);
    q15_t yLow = (q15_t) (y);
    q15_t yHigh = (q15_t) (y >> 16);

    return (sum - (xHigh * yLow) + (xLow * yHigh));
}
// Dual multiply with 64-bit accumulate on signed halfwords:
// returns sum + (x.high * y.high) + (x.low * y.low).
q63_t ref__SMLALD(q31_t x, q31_t y, q63_t sum)
{
    q15_t xLow = (q15_t) x;
    q15_t xHigh = (q15_t) (x >> 16);
    q15_t yLow = (q15_t) y;
    q15_t yHigh = (q15_t) (y >> 16);

    return (sum + (xHigh * yHigh) + (xLow * yLow));
}
// Dual multiply with 64-bit accumulate, halfwords of y exchanged:
// returns sum + (x.high * y.low) + (x.low * y.high).
q63_t ref__SMLALDX(q31_t x, q31_t y, q63_t sum)
{
    q15_t xLow = (q15_t) x;
    q15_t xHigh = (q15_t) (x >> 16);
    q15_t yLow = (q15_t) y;
    q15_t yHigh = (q15_t) (y >> 16);

    return (sum + (xHigh * yLow)) + (xLow * yHigh);
}
// Dual multiply-add on signed halfwords:
// returns (x.high * y.high) + (x.low * y.low).
q31_t ref__SMUAD(q31_t x, q31_t y)
{
    // Top halfwords via arithmetic shift; bottom halfwords are sign-extended
    // by shifting them up to the top of the word and back down.
    q31_t xHigh = x >> 16;
    q31_t yHigh = y >> 16;
    q31_t xLow = (x << 16) >> 16;
    q31_t yLow = (y << 16) >> 16;

    return ((xHigh * yHigh) + (xLow * yLow));
}
// Dual multiply-subtract on signed halfwords:
// returns (x.low * y.low) - (x.high * y.high).
q31_t ref__SMUSD(q31_t x, q31_t y)
{
    // Top halfwords via arithmetic shift; bottom halfwords are sign-extended
    // by shifting them up to the top of the word and back down.
    q31_t xHigh = x >> 16;
    q31_t yHigh = y >> 16;
    q31_t xLow = (x << 16) >> 16;
    q31_t yLow = (y << 16) >> 16;

    return ((xLow * yLow) - (xHigh * yHigh));
}
// Sign-extends byte 0 (bits 7:0) of x into the bottom halfword of the result
// and byte 2 (bits 23:16) of x into the top halfword.
q31_t ref__SXTB16(q31_t x)
{
    // Sign-extend from bit 7: the low 16 bits then hold the widened byte 0.
    q31_t fromBit7 = (x << 24) >> 24;
    // Sign-extend from bit 23: the high 16 bits then hold the widened byte 2.
    q31_t fromBit23 = (x << 8) >> 8;

    return ((fromBit7 & 0x0000FFFF) | (fromBit23 & 0xFFFF0000));
}