/* * >~: signal comparision * * (c) 1999-2011 IOhannes m zmölnig, forum::für::umläute, institute of electronic music and acoustics (iem) * * This program is free software; you can redistribute it and/or * modify it under the terms of the GNU General Public License * as published by the Free Software Foundation; either version 2 * of the License, or (at your option) any later version. * * This program is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the * GNU General Public License for more details. * * You should have received a copy of the GNU General Public License along * with this program. If not, see . */ #include "zexySIMD.h" /* ------------------------ relational~ ----------------------------- */ /* ----------------------------- gt_tilde ----------------------------- */ static t_class *gt_tilde_class, *scalargt_tilde_class; typedef struct _gt_tilde { t_object x_obj; t_float x_f; } t_gt_tilde; typedef struct _scalargt_tilde { t_object x_obj; t_float x_f; t_float x_g; /* inlet value */ } t_scalargt_tilde; static void *gt_tilde_new(t_symbol* UNUSED(s), int argc, t_atom *argv) { if (argc > 1) { post(">~: extra arguments ignored"); } if (argc) { t_scalargt_tilde *x = (t_scalargt_tilde *)pd_new(scalargt_tilde_class); floatinlet_new(&x->x_obj, &x->x_g); x->x_g = atom_getfloatarg(0, argc, argv); outlet_new(&x->x_obj, gensym("signal")); x->x_f = 0; return (x); } else { t_gt_tilde *x = (t_gt_tilde *)pd_new(gt_tilde_class); inlet_new(&x->x_obj, &x->x_obj.ob_pd, gensym("signal"), gensym("signal")); outlet_new(&x->x_obj, gensym("signal")); x->x_f = 0; return (x); } } static t_int *gt_tilde_perform(t_int *w) { t_sample *in1 = (t_sample *)(w[1]); t_sample *in2 = (t_sample *)(w[2]); t_sample *out = (t_sample *)(w[3]); int n = (int)(w[4]); while (n--) { *out++ = *in1++ > *in2++; } return (w+5); } static t_int *gt_tilde_perf8(t_int *w) { t_sample *in1 = (t_sample *)(w[1]); t_sample *in2 = (t_sample *)(w[2]); t_sample *out = (t_sample *)(w[3]); int n = (int)(w[4]); for (; n; n -= 8, in1 += 8, in2 += 8, out += 8) { t_sample f0 = in1[0], f1 = in1[1], f2 = in1[2], f3 = in1[3]; t_sample f4 = in1[4], f5 = in1[5], f6 = in1[6], f7 = in1[7]; t_sample g0 = in2[0], g1 = in2[1], g2 = in2[2], g3 = in2[3]; t_sample g4 = in2[4], g5 = in2[5], g6 = in2[6], g7 = in2[7]; out[0] = f0 > g0; out[1] = f1 > g1; out[2] = f2 > g2; out[3] = f3 > g3; out[4] = f4 > g4; out[5] = f5 > g5; out[6] = f6 > g6; out[7] = f7 > g7; } return (w+5); } static t_int *scalargt_tilde_perform(t_int *w) { t_sample *in = (t_sample *)(w[1]); t_sample f = *(t_float *)(w[2]); t_sample *out = (t_sample *)(w[3]); int n = (int)(w[4]); while (n--) { *out++ = *in++ > f; } return (w+5); } static t_int *scalargt_tilde_perf8(t_int *w) { t_sample *in = (t_sample *)(w[1]); t_sample g = *(t_float *)(w[2]); t_sample *out = (t_sample *)(w[3]); int n = (int)(w[4]); for (; n; n -= 8, in += 8, out += 8) { t_sample f0 = in[0], f1 = in[1], f2 = in[2], f3 = in[3]; t_sample f4 = in[4], f5 = in[5], f6 = in[6], f7 = in[7]; out[0] = f0 > g; out[1] = f1 > g; out[2] = f2 > g; out[3] = f3 > g; out[4] = f4 > g; out[5] = f5 > g; out[6] = f6 > g; out[7] = f7 > g; } return (w+5); } #ifdef __SSE__ static t_int *gt_tilde_performSSE(t_int *w) { __m128 *in1 = (__m128 *)(w[1]); __m128 *in2 = (__m128 *)(w[2]); __m128 *out = (__m128 *)(w[3]); int n = (int)(w[4])>>4; const __m128 one = _mm_set1_ps(1.f); while (n--) { __m128 xmm0, xmm1; xmm0 = _mm_cmpgt_ps(in1[0], in2[0]); out[0] = _mm_and_ps (xmm0 , one); xmm1 = _mm_cmpgt_ps(in1[1], in2[1]); out[1] = _mm_and_ps (xmm1 , one); xmm0 = _mm_cmpgt_ps(in1[2], in2[2]); out[2] = _mm_and_ps (xmm0 , one); xmm1 = _mm_cmpgt_ps(in1[3], in2[3]); out[3] = _mm_and_ps (xmm1 , one); in1+=4; in2+=4; out+=4; } return (w+5); } static t_int *scalargt_tilde_performSSE(t_int *w) { __m128 *in = (__m128 *)(w[1]); __m128 *out = (__m128 *)(w[3]); float f = *(t_float *)(w[2]); __m128 scalar = _mm_set1_ps(f); int n = (int)(w[4])>>4; const __m128 one = _mm_set1_ps(1.f); while (n--) { __m128 xmm0, xmm1; xmm0 = _mm_cmpgt_ps (in[0], scalar); out[0] = _mm_and_ps (xmm0, one); xmm1 = _mm_cmpgt_ps (in[1], scalar); out[1] = _mm_and_ps (xmm1, one); xmm0 = _mm_cmpgt_ps (in[2], scalar); out[2] = _mm_and_ps (xmm0, one); xmm1 = _mm_cmpgt_ps (in[3], scalar); out[3] = _mm_and_ps (xmm1, one); in +=4; out+=4; } return (w+5); } #endif /* __SSE__ */ static void gt_tilde_dsp(t_gt_tilde* UNUSED(x), t_signal **sp) { t_sample*in1=sp[0]->s_vec; t_sample*in2=sp[1]->s_vec; t_sample*out=sp[2]->s_vec; int n=sp[0]->s_n; #ifdef __SSE__ if( Z_SIMD_CHKBLOCKSIZE(n)&& Z_SIMD_CHKALIGN(in1)&& Z_SIMD_CHKALIGN(in2)&& Z_SIMD_CHKALIGN(out)&& ZEXY_TYPE_EQUAL(t_sample, float) ) { dsp_add(gt_tilde_performSSE, 4, in1, in2, out, n); } else #endif if (n&7) { dsp_add(gt_tilde_perform, 4, in1, in2, out, n); } else { dsp_add(gt_tilde_perf8, 4, in1, in2, out, n); } } static void scalargt_tilde_dsp(t_scalargt_tilde *x, t_signal **sp) { t_sample*in =sp[0]->s_vec; t_sample*out=sp[1]->s_vec; int n =sp[0]->s_n; #ifdef __SSE__ if( Z_SIMD_CHKBLOCKSIZE(n)&& Z_SIMD_CHKALIGN(in)&& Z_SIMD_CHKALIGN(out)&& ZEXY_TYPE_EQUAL(t_sample, float) ) { dsp_add(scalargt_tilde_performSSE, 4, in, &x->x_g, out, n); } else #endif if (n&7) { dsp_add(scalargt_tilde_perform, 4, in, &x->x_g, out, n); } else { dsp_add(scalargt_tilde_perf8, 4, in, &x->x_g, out, n); } } static void gt_tilde_help(t_object*x) { post("\n"HEARTSYMBOL" >~\t\t:: compare 2 signals"); } void setup_0x3e0x7e(void) { gt_tilde_class = class_new(gensym(">~"), (t_newmethod)gt_tilde_new, 0, sizeof(t_gt_tilde), 0, A_GIMME, 0); class_addmethod(gt_tilde_class, (t_method)gt_tilde_dsp, gensym("dsp"), 0); CLASS_MAINSIGNALIN(gt_tilde_class, t_gt_tilde, x_f); class_addmethod (gt_tilde_class, (t_method)gt_tilde_help, gensym("help"), A_NULL); class_sethelpsymbol(gt_tilde_class, gensym("zigbinops")); scalargt_tilde_class = class_new(gensym(">~"), 0, 0, sizeof(t_scalargt_tilde), 0, 0); CLASS_MAINSIGNALIN(scalargt_tilde_class, t_scalargt_tilde, x_f); class_addmethod(scalargt_tilde_class, (t_method)scalargt_tilde_dsp, gensym("dsp"), 0); class_addmethod (scalargt_tilde_class, (t_method)gt_tilde_help, gensym("help"), A_NULL); class_sethelpsymbol(scalargt_tilde_class, gensym("zigbinops")); zexy_register(">~"); } #ifndef ZEXY_LIBRARY void setup(void) { setup_0x3e0x7e(); } #endif