/*
 * ==~: test signals for equality
 *
 * (c) 1999-2011 IOhannes m zmölnig, forum::für::umläute, institute of electronic music and acoustics (iem)
 *
 * This program is free software; you can redistribute it and/or
 * modify it under the terms of the GNU General Public License
 * as published by the Free Software Foundation; either version 2
 * of the License, or (at your option) any later version.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License along
 * with this program. If not, see http://www.gnu.org/licenses/.
 */

#include "zexySIMD.h"

/* ----------------------------- eq_tilde ----------------------------- */

/* two classes share the name "==~":
 *  - eq_tilde_class compares two signals
 *  - scalareq_tilde_class compares a signal against a float
 * eq_tilde_new() picks one depending on the creation arguments.
 */
static t_class *eq_tilde_class, *scalareq_tilde_class;

/* state of the signal/signal variant */
typedef struct _eq_tilde {
  t_object x_obj;
  t_float x_f; /* slot registered with CLASS_MAINSIGNALIN */
} t_eq_tilde;

/* state of the signal/scalar variant */
typedef struct _scalareq_tilde {
  t_object x_obj;
  t_float x_f; /* slot registered with CLASS_MAINSIGNALIN */
  t_float x_g; /* inlet value */
} t_scalareq_tilde;

/*
 * constructor for both variants.
 * With at least one creation argument a scalareq_tilde object is created
 * whose comparison value is initialised from the first argument and is bound
 * to a float inlet; without arguments an eq_tilde object with a second signal
 * inlet is created. Arguments beyond the first only trigger a notice.
 */
static void *eq_tilde_new(t_symbol* UNUSED(s), int argc, t_atom *argv)
{
  if (argc > 1) {
    post("==~: extra arguments ignored");
  }
  if (argc) {
    t_scalareq_tilde *x = (t_scalareq_tilde *)pd_new(scalareq_tilde_class);
    floatinlet_new(&x->x_obj, &x->x_g);
    x->x_g = atom_getfloatarg(0, argc, argv);
    outlet_new(&x->x_obj, gensym("signal"));
    x->x_f = 0;
    return (x);
  } else {
    t_eq_tilde *x = (t_eq_tilde *)pd_new(eq_tilde_class);
    inlet_new(&x->x_obj, &x->x_obj.ob_pd, gensym("signal"), gensym("signal"));
    outlet_new(&x->x_obj, gensym("signal"));
    x->x_f = 0;
    return (x);
  }
}

/*
 * generic perform routine (signal == signal).
 * w[1], w[2]: input vectors; w[3]: output vector; w[4]: number of samples.
 * Each output sample is the result of the C comparison (1 if equal, else 0).
 */
static t_int *eq_tilde_perform(t_int *w)
{
  t_sample *in1 = (t_sample *)(w[1]);
  t_sample *in2 = (t_sample *)(w[2]);
  t_sample *out = (t_sample *)(w[3]);
  int n = (int)(w[4]);
  while (n--) {
    *out++ = (*in1++ == *in2++);
  }
  return (w+5);
}

/*
 * unrolled perform routine (signal == signal), 8 samples per iteration.
 * Same argument layout as eq_tilde_perform(). The loop only terminates when
 * n is a multiple of 8; eq_tilde_dsp() selects this routine only in that case.
 * All inputs of an iteration are read before any output is written.
 */
static t_int *eq_tilde_perf8(t_int *w)
{
  t_sample *in1 = (t_sample *)(w[1]);
  t_sample *in2 = (t_sample *)(w[2]);
  t_sample *out = (t_sample *)(w[3]);
  int n = (int)(w[4]);
  for (; n; n -= 8, in1 += 8, in2 += 8, out += 8) {
    t_sample f0 = in1[0], f1 = in1[1], f2 = in1[2], f3 = in1[3];
    t_sample f4 = in1[4], f5 = in1[5], f6 = in1[6], f7 = in1[7];

    t_sample g0 = in2[0], g1 = in2[1], g2 = in2[2], g3 = in2[3];
    t_sample g4 = in2[4], g5 = in2[5], g6 = in2[6], g7 = in2[7];

    out[0] = f0 == g0;
    out[1] = f1 == g1;
    out[2] = f2 == g2;
    out[3] = f3 == g3;
    out[4] = f4 == g4;
    out[5] = f5 == g5;
    out[6] = f6 == g6;
    out[7] = f7 == g7;
  }
  return (w+5);
}

/*
 * generic perform routine (signal == scalar).
 * w[1]: input vector; w[2]: pointer to the scalar (read once per block);
 * w[3]: output vector; w[4]: number of samples.
 */
static t_int *scalareq_tilde_perform(t_int *w)
{
  t_sample *in = (t_sample *)(w[1]);
  t_sample f = *(t_float *)(w[2]);
  t_sample *out = (t_sample *)(w[3]);
  int n = (int)(w[4]);
  while (n--) {
    *out++ = (*in++ == f);
  }
  return (w+5);
}

/*
 * unrolled perform routine (signal == scalar), 8 samples per iteration.
 * Same argument layout as scalareq_tilde_perform(). The loop only terminates
 * when n is a multiple of 8; scalareq_tilde_dsp() guarantees that.
 */
static t_int *scalareq_tilde_perf8(t_int *w)
{
  t_sample *in = (t_sample *)(w[1]);
  t_sample g = *(t_float *)(w[2]);
  t_sample *out = (t_sample *)(w[3]);
  int n = (int)(w[4]);
  for (; n; n -= 8, in += 8, out += 8) {
    t_sample f0 = in[0], f1 = in[1], f2 = in[2], f3 = in[3];
    t_sample f4 = in[4], f5 = in[5], f6 = in[6], f7 = in[7];

    out[0] = (f0 == g);
    out[1] = (f1 == g);
    out[2] = (f2 == g);
    out[3] = (f3 == g);
    out[4] = (f4 == g);
    out[5] = (f5 == g);
    out[6] = (f6 == g);
    out[7] = (f7 == g);
  }
  return (w+5);
}

#ifdef __SSE__
/*
 * SSE perform routine (signal == signal).
 * Processes 16 samples (four __m128 vectors) per iteration, hence n>>4
 * iterations. The comparison mask is ANDed with 1.f so that each lane
 * ends up as 1.f (equal) or 0.f (not equal).
 * Only installed by eq_tilde_dsp() after its blocksize/alignment/type checks.
 */
static t_int *eq_tilde_performSSE(t_int *w)
{
  __m128 *in1 = (__m128 *)(w[1]);
  __m128 *in2 = (__m128 *)(w[2]);
  __m128 *out = (__m128 *)(w[3]);
  int n = (int)(w[4])>>4;
  const __m128 one = _mm_set1_ps(1.f);

  while (n--) {
    __m128 xmm0, xmm1;
    xmm0 = _mm_cmpeq_ps(in1[0], in2[0]);
    out[0] = _mm_and_ps(xmm0, one);

    xmm1 = _mm_cmpeq_ps(in1[1], in2[1]);
    out[1] = _mm_and_ps(xmm1, one);

    xmm0 = _mm_cmpeq_ps(in1[2], in2[2]);
    out[2] = _mm_and_ps(xmm0, one);

    xmm1 = _mm_cmpeq_ps(in1[3], in2[3]);
    out[3] = _mm_and_ps(xmm1, one);

    in1 += 4;
    in2 += 4;
    out += 4;
  }
  return (w+5);
}

/*
 * SSE perform routine (signal == scalar).
 * Same scheme as eq_tilde_performSSE(), with the scalar broadcast into all
 * four lanes once per block.
 */
static t_int *scalareq_tilde_performSSE(t_int *w)
{
  __m128 *in = (__m128 *)(w[1]);
  __m128 *out = (__m128 *)(w[3]);
  /* w[2] points to the t_float x_g (see scalareq_tilde_dsp): read it with
   * its declared type, like the non-SSE routines do, then narrow to float */
  float f = (float)(*(t_float *)(w[2]));
  __m128 scalar = _mm_set1_ps(f);
  int n = (int)(w[4])>>4;
  const __m128 one = _mm_set1_ps(1.f);

  while (n--) {
    __m128 xmm0, xmm1;
    xmm0 = _mm_cmpeq_ps(in[0], scalar);
    out[0] = _mm_and_ps(xmm0, one);

    xmm1 = _mm_cmpeq_ps(in[1], scalar);
    out[1] = _mm_and_ps(xmm1, one);

    xmm0 = _mm_cmpeq_ps(in[2], scalar);
    out[2] = _mm_and_ps(xmm0, one);

    xmm1 = _mm_cmpeq_ps(in[3], scalar);
    out[3] = _mm_and_ps(xmm1, one);

    in += 4;
    out += 4;
  }
  return (w+5);
}
#endif /* __SSE__ */

/*
 * "dsp" method of the signal/signal variant: installs one perform routine.
 * Preference: SSE (if compiled in and the Z_SIMD_* / type checks pass),
 * else the 8x unrolled routine when n is a multiple of 8,
 * else the generic sample-by-sample routine.
 */
static void eq_tilde_dsp(t_eq_tilde* UNUSED(x), t_signal **sp)
{
  t_sample *in1 = sp[0]->s_vec;
  t_sample *in2 = sp[1]->s_vec;
  t_sample *out = sp[2]->s_vec;

  int n = sp[0]->s_n;

#ifdef __SSE__
  if (
    Z_SIMD_CHKBLOCKSIZE(n) &&
    Z_SIMD_CHKALIGN(in1) &&
    Z_SIMD_CHKALIGN(in2) &&
    Z_SIMD_CHKALIGN(out) &&
    ZEXY_TYPE_EQUAL(t_sample, float)
  ) {
    dsp_add(eq_tilde_performSSE, 4, in1, in2, out, n);
  } else
#endif
    if (n & 7) {
      dsp_add(eq_tilde_perform, 4, in1, in2, out, n);
    } else {
      dsp_add(eq_tilde_perf8, 4, in1, in2, out, n);
    }
}

/*
 * "dsp" method of the signal/scalar variant.
 * Same selection logic as eq_tilde_dsp(); the address of x_g is handed to
 * the perform routine so it sees the current inlet value on every block.
 */
static void scalareq_tilde_dsp(t_scalareq_tilde *x, t_signal **sp)
{
  t_sample *in  = sp[0]->s_vec;
  t_sample *out = sp[1]->s_vec;
  int n = sp[0]->s_n;

#ifdef __SSE__
  if (
    Z_SIMD_CHKBLOCKSIZE(n) &&
    Z_SIMD_CHKALIGN(in) &&
    Z_SIMD_CHKALIGN(out) &&
    ZEXY_TYPE_EQUAL(t_sample, float)
  ) {
    dsp_add(scalareq_tilde_performSSE, 4, in, &x->x_g, out, n);
  } else
#endif
    if (n & 7) {
      dsp_add(scalareq_tilde_perform, 4, in, &x->x_g, out, n);
    } else {
      dsp_add(scalareq_tilde_perf8, 4, in, &x->x_g, out, n);
    }
}

/* "help" method (shared by both variants): print a one-line description */
static void eq_tilde_help(t_object* UNUSED(x))
{
  /* the object is "==~" (the text used to say "&&~") */
  post("\n" HEARTSYMBOL " ==~\t\t:: test 2 signals for equality");
}

/*
 * class setup: registers both variants under the name "==~".
 * Only eq_tilde_class gets a constructor; it instantiates
 * scalareq_tilde_class itself when creation arguments are given.
 */
void setup_0x3d0x3d0x7e(void)
{
  eq_tilde_class = class_new(gensym("==~"), (t_newmethod)eq_tilde_new, 0,
                             sizeof(t_eq_tilde), 0, A_GIMME, 0);
  class_addmethod(eq_tilde_class, (t_method)eq_tilde_dsp, gensym("dsp"), 0);
  CLASS_MAINSIGNALIN(eq_tilde_class, t_eq_tilde, x_f);
  class_addmethod(eq_tilde_class, (t_method)eq_tilde_help, gensym("help"),
                  A_NULL);
  class_sethelpsymbol(eq_tilde_class, gensym("zigbinops"));

  scalareq_tilde_class = class_new(gensym("==~"), 0, 0,
                                   sizeof(t_scalareq_tilde), 0, 0);
  CLASS_MAINSIGNALIN(scalareq_tilde_class, t_scalareq_tilde, x_f);
  class_addmethod(scalareq_tilde_class, (t_method)scalareq_tilde_dsp,
                  gensym("dsp"), 0);
  class_addmethod(scalareq_tilde_class, (t_method)eq_tilde_help, gensym("help"),
                  A_NULL);
  class_sethelpsymbol(scalareq_tilde_class, gensym("zigbinops"));

  zexy_register("==~");
}

#ifndef ZEXY_LIBRARY
/* entry point used when the object is built as a stand-alone external */
void setup(void)
{
  setup_0x3d0x3d0x7e();
}
#endif