diff projects/heavy/samphold/SignalSamphold.h @ 160:5bcf04234f80 heavy-updated

- added -std=c99 to Makefile for user-supplied C files (required for heavy files) - changed heavy core render.cpp file to use latest API and removed all redundant functions (e.g. foleyDesigner/touchkey stuff) - use build_pd.sh to compile and run pd files (-h for usage instructions)
author chnrx <chris.heinrichs@gmail.com>
date Thu, 05 Nov 2015 18:58:26 +0000
parents
children
line wrap: on
line diff
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/projects/heavy/samphold/SignalSamphold.h	Thu Nov 05 18:58:26 2015 +0000
@@ -0,0 +1,248 @@
+/**
+ * Copyright (c) 2014, 2015, Enzien Audio Ltd.
+ *
+ * Permission to use, copy, modify, and/or distribute this software for any
+ * purpose with or without fee is hereby granted, provided that the above
+ * copyright notice and this permission notice appear in all copies.
+ *
+ * THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES WITH
+ * REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF MERCHANTABILITY
+ * AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY SPECIAL, DIRECT,
+ * INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES WHATSOEVER RESULTING FROM
+ * LOSS OF USE, DATA OR PROFITS, WHETHER IN AN ACTION OF CONTRACT, NEGLIGENCE OR
+ * OTHER TORTIOUS ACTION, ARISING OUT OF OR IN CONNECTION WITH THE USE OR
+ * PERFORMANCE OF THIS SOFTWARE.
+ */
+
+#ifndef _SIGNAL_SAMPHOLD_H_
+#define _SIGNAL_SAMPHOLD_H_
+
+#include "HvBase.h"
+
+typedef struct SignalSamphold {
+  hv_bufferf_t s;
+} SignalSamphold;
+
+hv_size_t sSamphold_init(SignalSamphold *o);
+
+static inline void __hv_samphold_f(SignalSamphold *o, hv_bInf_t bIn0, hv_bInf_t bIn1, hv_bOutf_t bOut) {
+#if HV_SIMD_AVX
+#warning __hv_samphold_f() not implemented
+#elif HV_SIMD_SSE
+  switch (_mm_movemask_ps(bIn1)) {
+    default:
+    case 0x0: *bOut = o->s; break;
+    case 0x1: {
+      *bOut = _mm_shuffle_ps(bIn0, bIn0, _MM_SHUFFLE(0,0,0,0));
+      o->s = *bOut;
+      break;
+    }
+    case 0x2: {
+      const __m128 x = _mm_shuffle_ps(bIn0, bIn0, _MM_SHUFFLE(1,1,1,1));
+      *bOut = _mm_blend_ps(o->s, x, 0xE);
+      o->s = x;
+      break;
+    }
+    case 0x3: {
+      const __m128 x = _mm_shuffle_ps(bIn0, bIn0, _MM_SHUFFLE(1,1,1,1));
+      *bOut = _mm_blend_ps(bIn0, x, 0xC);
+      o->s = x;
+      break;
+    }
+    case 0x4: {
+      const __m128 x = _mm_shuffle_ps(bIn0, bIn0, _MM_SHUFFLE(2,2,2,2));
+      *bOut = _mm_blend_ps(o->s, x, 0xC);
+      o->s = x;
+      break;
+    }
+    case 0x5: {
+      *bOut = _mm_shuffle_ps(bIn0, bIn0, _MM_SHUFFLE(2,2,0,0));
+      o->s = _mm_shuffle_ps(bIn0, bIn0, _MM_SHUFFLE(2,2,2,2));
+      break;
+    }
+    case 0x6: {
+      const __m128 x = _mm_shuffle_ps(bIn0, bIn0, _MM_SHUFFLE(2,2,1,0));
+      *bOut = _mm_blend_ps(o->s, x, 0xE);
+      o->s = _mm_shuffle_ps(bIn0, bIn0, _MM_SHUFFLE(2,2,2,2));
+      break;
+    }
+    case 0x7: {
+      const __m128 x = _mm_shuffle_ps(bIn0, bIn0, _MM_SHUFFLE(2,2,2,2));
+      *bOut = _mm_blend_ps(bIn0, x, 0x8);
+      o->s = x;
+      break;
+    }
+    case 0x8: {
+      const __m128 x = _mm_shuffle_ps(bIn0, bIn0, _MM_SHUFFLE(3,3,3,3));
+      *bOut = _mm_blend_ps(o->s, x, 0x8);
+      o->s = x;
+      break;
+    }
+    case 0x9: {
+      *bOut = _mm_shuffle_ps(bIn0, bIn0, _MM_SHUFFLE(3,0,0,0));
+      o->s = _mm_shuffle_ps(bIn0, bIn0, _MM_SHUFFLE(3,3,3,3));
+      break;
+    }
+    case 0xA: {
+      const __m128 x = _mm_shuffle_ps(bIn0, bIn0, _MM_SHUFFLE(3,1,1,0));
+      *bOut = _mm_blend_ps(o->s, x, 0xE);
+      o->s = _mm_shuffle_ps(bIn0, bIn0, _MM_SHUFFLE(3,3,3,3));
+      break;
+    }
+    case 0xB: {
+      *bOut = _mm_shuffle_ps(bIn0, bIn0, _MM_SHUFFLE(3,1,1,0));
+      o->s = _mm_shuffle_ps(bIn0, bIn0, _MM_SHUFFLE(3,3,3,3));
+      break;
+    }
+    case 0xC: {
+      *bOut = _mm_blend_ps(o->s, bIn0, 0xC);
+      o->s = _mm_shuffle_ps(bIn0, bIn0, _MM_SHUFFLE(3,3,3,3));
+      break;
+    }
+    case 0xD: {
+      *bOut = _mm_shuffle_ps(bIn0, bIn0, _MM_SHUFFLE(3,2,0,0));
+      o->s = _mm_shuffle_ps(bIn0, bIn0, _MM_SHUFFLE(3,3,3,3));
+      break;
+    }
+    case 0xE: {
+      *bOut = _mm_blend_ps(o->s, bIn0, 0xE);
+      o->s = _mm_shuffle_ps(bIn0, bIn0, _MM_SHUFFLE(3,3,3,3));
+      break;
+    }
+    case 0xF: {
+      *bOut = bIn0;
+      o->s = _mm_shuffle_ps(bIn0, bIn0, _MM_SHUFFLE(3,3,3,3));
+      break;
+    }
+  }
+#elif HV_SIMD_NEON
+  uint32x4_t mmA = vandq_u32(
+      vreinterpretq_u32_f32(bIn1), (uint32x4_t) {0x1, 0x2, 0x4, 0x8}); // [0 1 2 3]
+  uint32x4_t mmB = vextq_u32(mmA, mmA, 2);                             // [2 3 0 1]
+  uint32x4_t mmC = vorrq_u32(mmA, mmB);                                // [0+2 1+3 0+2 1+3]
+  uint32x4_t mmD = vextq_u32(mmC, mmC, 3);                             // [1+3 0+2 1+3 0+2]
+  uint32x4_t mmE = vorrq_u32(mmC, mmD);                                // [0+1+2+3 ...]
+  uint32_t movemask = vgetq_lane_u32(mmE, 0);
+  switch (movemask) {
+    default:
+    case 0x0: *bOut = o->s; break;
+    case 0x1: {
+      *bOut = vdupq_n_f32(vgetq_lane_f32(bIn0,0));
+      o->s = *bOut;
+      break;
+    }
+    case 0x2: {
+      const float32x4_t x = vdupq_n_f32(vgetq_lane_f32(bIn0,1));
+      *bOut = vextq_f32(o->s, x, 3);
+      o->s = x;
+      break;
+    }
+    case 0x3: {
+      const float32x4_t x = vdupq_n_f32(vgetq_lane_f32(bIn0,1));
+      *bOut = vreinterpretq_f32_u32(vorrq_u32(
+          vandq_u32(vreinterpretq_u32_f32(bIn0), (uint32x4_t) {~0x0, 0x0, 0x0, 0x0}),
+          vandq_u32(vreinterpretq_u32_f32(x), (uint32x4_t) {0x0, ~0x0, ~0x0, ~0x0})));
+      o->s = x;
+      break;
+    }
+    case 0x4: {
+      const float32x4_t x = vdupq_n_f32(vgetq_lane_f32(bIn0,2));
+      *bOut = vextq_f32(o->s, x, 2);
+      o->s = x;
+      break;
+    }
+    case 0x5: {
+      const float32x4_t x = vdupq_n_f32(vgetq_lane_f32(bIn0,0));
+      const float32x4_t y = vdupq_n_f32(vgetq_lane_f32(bIn0,2));
+      *bOut = vreinterpretq_f32_u32(vorrq_u32(
+          vandq_u32(vreinterpretq_u32_f32(x), (uint32x4_t) {~0x0, ~0x0, 0x0, 0x0}),
+          vandq_u32(vreinterpretq_u32_f32(y), (uint32x4_t) {0x0, 0x0, ~0x0, ~0x0})));
+      o->s = y;
+    }
+    case 0x6: {
+      const float32x4_t y = vdupq_n_f32(vgetq_lane_f32(bIn0,3));
+      float32x4_t z = vreinterpretq_f32_u32(vorrq_u32(
+          vandq_u32(vreinterpretq_u32_f32(o->s), (uint32x4_t) {~0x0, 0x0, 0x0, 0x0}),
+          vandq_u32(vreinterpretq_u32_f32(bIn0), (uint32x4_t) {0x0, ~0x0, ~0x0, 0x0})));
+      *bOut = vreinterpretq_f32_u32(vorrq_u32(
+          vandq_u32(vreinterpretq_u32_f32(z), (uint32x4_t) {~0x0, ~0x0, ~0x0, 0x0}),
+          vandq_u32(vreinterpretq_u32_f32(y), (uint32x4_t) {0x0, 0x0, 0x0, ~0x0})));
+      o->s = y;
+    }
+    case 0x7: {
+      const float32x4_t x = vdupq_n_f32(vgetq_lane_f32(bIn0,2));
+      *bOut = vreinterpretq_f32_u32(vorrq_u32(
+          vandq_u32(vreinterpretq_u32_f32(bIn0), (uint32x4_t) {~0x0, ~0x0, 0x0, 0x0}),
+          vandq_u32(vreinterpretq_u32_f32(x), (uint32x4_t) {0x0, 0x0, ~0x0, ~0x0})));
+      o->s = x;
+      break;
+    }
+    case 0x8: {
+      const float32x4_t x = vdupq_n_f32(vgetq_lane_f32(bIn0,3));
+      *bOut = vextq_f32(o->s, x, 1);
+      o->s = x;
+      break;
+    }
+    case 0x9: {
+      const float32x4_t x = vdupq_n_f32(vgetq_lane_f32(bIn0,0));
+      *bOut = vreinterpretq_f32_u32(vorrq_u32(
+          vandq_u32(vreinterpretq_u32_f32(x), (uint32x4_t) {~0x0, ~0x0, ~0x0, 0x0}),
+          vandq_u32(vreinterpretq_u32_f32(bIn0), (uint32x4_t) {0x0, 0x0, 0x0, ~0x0})));
+      o->s = vdupq_n_f32(vgetq_lane_f32(bIn0,3));
+    }
+    case 0xA: {
+      const float32x4_t x = vdupq_n_f32(vgetq_lane_f32(bIn0,1));
+      const float32x4_t y = vdupq_n_f32(vgetq_lane_f32(bIn0,3));
+      float32x4_t z = vreinterpretq_f32_u32(vorrq_u32(
+          vandq_u32(vreinterpretq_u32_f32(o->s), (uint32x4_t) {~0x0, 0x0, 0x0, 0x0}),
+          vandq_u32(vreinterpretq_u32_f32(x), (uint32x4_t) {0x0, ~0x0, ~0x0, 0x0})));
+      *bOut = vreinterpretq_f32_u32(vorrq_u32(
+          vandq_u32(vreinterpretq_u32_f32(z), (uint32x4_t) {~0x0, ~0x0, ~0x0, 0x0}),
+          vandq_u32(vreinterpretq_u32_f32(y), (uint32x4_t) {0x0, 0x0, 0x0, ~0x0})));
+      o->s = y;
+    }
+    case 0xB: {
+      const float32x4_t x = vdupq_n_f32(vgetq_lane_f32(bIn0,1));
+      *bOut = vreinterpretq_f32_u32(vorrq_u32(
+          vandq_u32(vreinterpretq_u32_f32(bIn0), (uint32x4_t) {~0x0, ~0x0, 0x0, ~0x0}),
+          vandq_u32(vreinterpretq_u32_f32(x), (uint32x4_t) {0x0, 0x0, ~0x0, 0x0})));
+      o->s = vdupq_n_f32(vgetq_lane_f32(bIn0,3));
+      break;
+    }
+    case 0xC: {
+      *bOut = vreinterpretq_f32_u32(vorrq_u32(
+          vandq_u32(vreinterpretq_u32_f32(o->s), (uint32x4_t) {~0x0, ~0x0, 0x0, 0x0}),
+          vandq_u32(vreinterpretq_u32_f32(bIn0), (uint32x4_t) {0x0, 0x0, ~0x0, ~0x0})));
+      o->s = vdupq_n_f32(vgetq_lane_f32(bIn0,3));
+      break;
+    }
+    case 0xD: {
+      const float32x4_t x = vdupq_n_f32(vgetq_lane_f32(bIn0,0));
+      *bOut = vreinterpretq_f32_u32(vorrq_u32(
+          vandq_u32(vreinterpretq_u32_f32(bIn0), (uint32x4_t) {~0x0, 0x0, ~0x0, ~0x0}),
+          vandq_u32(vreinterpretq_u32_f32(x), (uint32x4_t) {0x0, ~0x0, 0x0, 0x0})));
+      o->s = vdupq_n_f32(vgetq_lane_f32(bIn0,3));
+    }
+    case 0xE: {
+      *bOut = vreinterpretq_f32_u32(vorrq_u32(
+          vandq_u32(vreinterpretq_u32_f32(o->s), (uint32x4_t) {~0x0, 0x0, 0x0, 0x0}),
+          vandq_u32(vreinterpretq_u32_f32(bIn0), (uint32x4_t) {0x0, ~0x0, ~0x0, ~0x0})));
+      o->s = vdupq_n_f32(vgetq_lane_f32(bIn0,3));
+      break;
+    }
+    case 0xF: {
+      *bOut = bIn0;
+      o->s = vdupq_n_f32(vgetq_lane_f32(bIn0,3));
+      break;
+    }
+  }
+#else // HV_SIMD_NONE
+  if (bIn1 != 0.0f) o->s = bIn0;
+  *bOut = o->s;
+#endif
+}
+
+void sSamphold_onMessage(HvBase *_c, SignalSamphold *o, int letIndex,
+    const HvMessage *const m, void *sendMessage);
+
+#endif // _SIGNAL_SAMPHOLD_H_