diff options
Diffstat (limited to 'src/0x7c0x7c0x7e.c')
-rw-r--r-- | src/0x7c0x7c0x7e.c | 276 |
1 files changed, 276 insertions, 0 deletions
diff --git a/src/0x7c0x7c0x7e.c b/src/0x7c0x7c0x7e.c new file mode 100644 index 0000000..8c2afb1 --- /dev/null +++ b/src/0x7c0x7c0x7e.c @@ -0,0 +1,276 @@ +/****************************************************** + * + * zexy - implementation file + * + * copyleft (c) IOhannes m zmölnig + * + * 1999:forum::für::umläute:2004 + * + * institute of electronic music and acoustics (iem) + * + ****************************************************** + * + * license: GNU General Public License v.2 + * + ******************************************************/ + +/* + finally :: some of the missing binops for signals :: ||~ + + 1302:forum::für::umläute:2000 +*/ + +#include "zexy.h" + +/* ----------------------------- oror_tilde ----------------------------- */ +static t_class *oror_tilde_class, *scalaroror_tilde_class; + +typedef struct _oror_tilde +{ + t_object x_obj; + float x_f; +} t_oror_tilde; + +typedef struct _scalaroror_tilde +{ + t_object x_obj; + float x_f; + t_float x_g; /* inlet value */ +} t_scalaroror_tilde; + +static void *oror_tilde_new(t_symbol *s, int argc, t_atom *argv) +{ + if (argc > 1) post("||~: extra arguments ignored"); + if (argc) + { + t_scalaroror_tilde *x = (t_scalaroror_tilde *)pd_new(scalaroror_tilde_class); + floatinlet_new(&x->x_obj, &x->x_g); + x->x_g = atom_getfloatarg(0, argc, argv); + outlet_new(&x->x_obj, &s_signal); + x->x_f = 0; + return (x); + } + else + { + t_oror_tilde *x = (t_oror_tilde *)pd_new(oror_tilde_class); + inlet_new(&x->x_obj, &x->x_obj.ob_pd, &s_signal, &s_signal); + outlet_new(&x->x_obj, &s_signal); + x->x_f = 0; + return (x); + } +} + +t_int *oror_tilde_perform(t_int *w) +{ + t_float *in1 = (t_float *)(w[1]); + t_float *in2 = (t_float *)(w[2]); + t_float *out = (t_float *)(w[3]); + int n = (int)(w[4]); + while (n--) *out++ = (int)*in1++ || (int)*in2++; + return (w+5); +} + +t_int *oror_tilde_perf8(t_int *w) +{ + t_float *in1 = (t_float *)(w[1]); + t_float *in2 = (t_float *)(w[2]); + t_float *out = (t_float *)(w[3]); + int n = (int)(w[4]); + for (; n; n -= 8, in1 += 8, in2 += 8, out += 8) + { + int f0 = in1[0], f1 = in1[1], f2 = in1[2], f3 = in1[3]; + int f4 = in1[4], f5 = in1[5], f6 = in1[6], f7 = in1[7]; + + int g0 = in2[0], g1 = in2[1], g2 = in2[2], g3 = in2[3]; + int g4 = in2[4], g5 = in2[5], g6 = in2[6], g7 = in2[7]; + + out[0] = f0 || g0; out[1] = f1 || g1; out[2] = f2 || g2; out[3] = f3 || g3; + out[4] = f4 || g4; out[5] = f5 || g5; out[6] = f6 || g6; out[7] = f7 || g7; + } + return (w+5); +} + +t_int *scalaroror_tilde_perform(t_int *w) +{ + t_float *in = (t_float *)(w[1]); + int f = *(t_float *)(w[2]); + t_float *out = (t_float *)(w[3]); + int n = (int)(w[4]); + while (n--) *out++ = (int)*in++ || f; + return (w+5); +} + +t_int *scalaroror_tilde_perf8(t_int *w) +{ + t_float *in = (t_float *)(w[1]); + int g = *(t_float *)(w[2]); + t_float *out = (t_float *)(w[3]); + int n = (int)(w[4]); + for (; n; n -= 8, in += 8, out += 8) + { + int f0 = in[0], f1 = in[1], f2 = in[2], f3 = in[3]; + int f4 = in[4], f5 = in[5], f6 = in[6], f7 = in[7]; + + out[0] = f0 || g; out[1] = f1 || g; out[2] = f2 || g; out[3] = f3 || g; + out[4] = f4 || g; out[5] = f5 || g; out[6] = f6 || g; out[7] = f7 || g; + } + return (w+5); +} + +#ifdef __SSE__ +t_int *oror_tilde_performSSE(t_int *w) +{ + __m128 *in1 = (__m128 *)(w[1]); + __m128 *in2 = (__m128 *)(w[2]); + __m128 *out = (__m128 *)(w[3]); + int n = (int)(w[4])>>4; + const __m128 one = _mm_set1_ps(1.f); + const __m128 zero = _mm_setzero_ps(); + + while (n--) { + __m128 xmm0, xmm1, xmm2; + xmm0 = _mm_cmpneq_ps(in1[0], zero); + xmm1 = _mm_cmpneq_ps(in2[0], zero); + xmm2 = _mm_or_ps (xmm0 , xmm1); + out[0] = _mm_and_ps (xmm2 , one); + + xmm0 = _mm_cmpneq_ps(in1[1], zero); + xmm1 = _mm_cmpneq_ps(in2[1], zero); + xmm2 = _mm_or_ps (xmm0 , xmm1); + out[1] = _mm_and_ps (xmm2 , one); + + xmm0 = _mm_cmpneq_ps(in1[2], zero); + xmm1 = _mm_cmpneq_ps(in2[2], zero); + xmm2 = _mm_or_ps (xmm0 , xmm1); + out[2] = _mm_and_ps (xmm2 , one); + + xmm0 = _mm_cmpneq_ps(in1[3], zero); + xmm1 = _mm_cmpneq_ps(in2[3], zero); + xmm2 = _mm_or_ps (xmm0 , xmm1); + out[3] = _mm_and_ps (xmm2 , one); + + in1+=4; + in2+=4; + out+=4; + } + + return (w+5); +} +t_int *scalaroror_tilde_performSSE(t_int *w) +{ + __m128 *in = (__m128 *)(w[1]); + __m128 *out = (__m128 *)(w[3]); + t_float f = *(t_float *)(w[2]); + __m128 scalar = _mm_set1_ps(f); + int n = (int)(w[4])>>4; + const __m128 one = _mm_set1_ps(1.f); + const __m128 zero = _mm_setzero_ps(); + + scalar = _mm_cmpneq_ps(scalar, zero); + while (n--) { + __m128 xmm0, xmm1; + xmm0 = _mm_cmpneq_ps(in[0], zero); + xmm1 = _mm_or_ps (xmm0 , scalar); + out[0] = _mm_and_ps (xmm1 , one); + + xmm0 = _mm_cmpneq_ps(in[1], zero); + xmm1 = _mm_or_ps (xmm0 , scalar); + out[1] = _mm_and_ps (xmm1 , one); + + xmm0 = _mm_cmpneq_ps(in[2], zero); + xmm1 = _mm_or_ps (xmm0 , scalar); + out[2] = _mm_and_ps (xmm1 , one); + + xmm0 = _mm_cmpneq_ps(in[3], zero); + xmm1 = _mm_or_ps (xmm0 , scalar); + out[3] = _mm_and_ps (xmm1 , one); + + + in +=4; + out+=4; + } + return (w+5); +} +#endif /* __SSE__ */ + +static void oror_tilde_dsp(t_oror_tilde *x, t_signal **sp) +{ + t_sample*in1=sp[0]->s_vec; + t_sample*in2=sp[1]->s_vec; + t_sample*out=sp[2]->s_vec; + + int n=sp[0]->s_n; + +#ifdef __SSE__ + if( + Z_SIMD_CHKBLOCKSIZE(n)&& + Z_SIMD_CHKALIGN(in1)&& + Z_SIMD_CHKALIGN(in2)&& + Z_SIMD_CHKALIGN(out) + ) + { + dsp_add(oror_tilde_performSSE, 4, in1, in2, out, n); + } else +#endif + if(n&7) + dsp_add(oror_tilde_perform, 4, in1, in2, out, n); + else + dsp_add(oror_tilde_perf8, 4, in1, in2, out, n); +} + +static void scalaroror_tilde_dsp(t_scalaroror_tilde *x, t_signal **sp) +{ + t_sample*in =sp[0]->s_vec; + t_sample*out=sp[1]->s_vec; + int n =sp[0]->s_n; + +#ifdef __SSE__ + if( + Z_SIMD_CHKBLOCKSIZE(n)&& + Z_SIMD_CHKALIGN(in)&& + Z_SIMD_CHKALIGN(out) + ) + { + dsp_add(scalaroror_tilde_performSSE, 4, in, &x->x_g, out, n); + } else +#endif + if (n&7) + dsp_add(scalaroror_tilde_perform, 4, in, &x->x_g, out, n); + else + dsp_add(scalaroror_tilde_perf8, 4, in, &x->x_g, out, n); +} + +static void oror_tilde_setup(void) +{ + oror_tilde_class = class_new(gensym("||~"), (t_newmethod)oror_tilde_new, 0, + sizeof(t_oror_tilde), 0, A_GIMME, 0); + class_addmethod(oror_tilde_class, (t_method)oror_tilde_dsp, gensym("dsp"), 0); + CLASS_MAINSIGNALIN(oror_tilde_class, t_oror_tilde, x_f); + class_sethelpsymbol(oror_tilde_class, gensym("zexy/sigbinops+")); + scalaroror_tilde_class = class_new(gensym("||~"), 0, 0, + sizeof(t_scalaroror_tilde), 0, 0); + CLASS_MAINSIGNALIN(scalaroror_tilde_class, t_scalaroror_tilde, x_f); + class_addmethod(scalaroror_tilde_class, (t_method)scalaroror_tilde_dsp, gensym("dsp"), + 0); + class_sethelpsymbol(scalaroror_tilde_class, gensym("zexy/sigbinops+")); + zexy_register("||~"); +} + + + +/* ---------------------- global setup ------------------------- */ +void z_oror__setup() +{ + oror_tilde_setup(); +} + +void z_0x7c0x7c0x7e_setup(void) +{ + oror_tilde_setup(); +} + +void setup_0x7c0x7c0x7e(void) +{ + oror_tilde_setup(); +} + |