24[[gnu::always_inline]]
static inline std::pair<Argon<int32_t>, uint32_t>
25waveRenderingFunctionGeneral(uint32_t phase, int32_t phaseIncrement, uint32_t _phaseToAdd,
const int16_t* table,
26 int32_t tableSizeMagnitude) {
27 Argon<uint32_t> phaseVector = Argon<uint32_t>{phase}.MultiplyAdd(Argon<uint32_t>{1U, 2U, 3U, 4U}, phaseIncrement);
28 Argon<uint32_t> indices = phaseVector >> (32 - tableSizeMagnitude);
29 ArgonHalf<uint16_t> strength2 = indices.ShiftRightNarrow<16>() >> 1;
30 auto [value1, value2] = ArgonHalf<int16_t>::LoadGatherInterleaved<2>(table, indices);
33 auto output = value1.ShiftLeftLong<16>().MultiplyDoubleAddSaturateLong(value2 - value1, strength2.As<int16_t>());
34 return {output, phase + phaseIncrement * 4};
38[[gnu::always_inline]]
static inline std::pair<Argon<int32_t>, uint32_t>
39waveRenderingFunctionPulse(uint32_t phase, int32_t phaseIncrement, uint32_t phaseToAdd,
const int16_t* table,
40 int32_t tableSizeMagnitude) {
42 const int32_t rshiftAmount = (32 - tableSizeMagnitude - 16);
44 Argon<uint32_t> phaseVector = Argon<uint32_t>{phase}.MultiplyAdd(Argon<uint32_t>{1U, 2U, 3U, 4U}, phaseIncrement);
45 Argon<uint32_t> phaseLater = phaseVector + phaseToAdd;
47 Argon<uint32_t> indicesA = phaseVector >> (32 - tableSizeMagnitude);
48 ArgonHalf<int16_t> rshiftedA =
49 indicesA.ShiftRightNarrow<16>().BitwiseAnd(std::numeric_limits<int16_t>::max()).As<int16_t>();
50 auto [valueA1, valueA2] = ArgonHalf<int16_t>::LoadGatherInterleaved<2>(table, indicesA);
52 Argon<uint32_t> indicesB = phaseLater >> (32 - tableSizeMagnitude);
53 ArgonHalf<int16_t> rshiftedB =
54 indicesB.ShiftRightNarrow<16>().BitwiseAnd(std::numeric_limits<int16_t>::max()).As<int16_t>();
55 auto [valueB1, valueB2] = ArgonHalf<int16_t>::LoadGatherInterleaved<2>(table, indicesB);
58 ArgonHalf<int16_t> strengthA1 = rshiftedA | std::numeric_limits<int16_t>::min();
59 ArgonHalf<int16_t> strengthA2 = std::numeric_limits<int16_t>::min() - strengthA1;
61 Argon<int32_t> outputA = strengthA2
62 .MultiplyDoubleSaturateLong(valueA2)
63 .MultiplyDoubleAddSaturateLong(strengthA1, valueA1);
65 ArgonHalf<int16_t> strengthB2 = rshiftedB & std::numeric_limits<int16_t>::max();
66 ArgonHalf<int16_t> strengthB1 = std::numeric_limits<int16_t>::max() - strengthB2;
68 Argon<int32_t> outputB = strengthB2
69 .MultiplyDoubleSaturateLong(valueB2)
70 .MultiplyDoubleAddSaturateLong(strengthB1, valueB1);
72 auto output = outputA.MultiplyRoundFixedPoint(outputB) << 1;
73 return {output, phase + phaseIncrement * 4};