/* -*- c++ -*- */ /* * Copyright 2002,2004 Free Software Foundation, Inc. * * This file is part of GNU Radio * * GNU Radio is free software; you can redistribute it and/or modify * it under the terms of the GNU General Public License as published by * the Free Software Foundation; either version 3, or (at your option) * any later version. * * GNU Radio is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the * GNU General Public License for more details. * * You should have received a copy of the GNU General Public License * along with GNU Radio; see the file COPYING. If not, write to * the Free Software Foundation, Inc., 51 Franklin Street, * Boston, MA 02110-1301, USA. */ #ifdef HAVE_CONFIG_H #include "config.h" #endif #include #include #ifdef HAVE_SYS_RESOURCE_H #include #endif #include #include #include #define ITERATIONS 20000000 #define BLOCK_SIZE (10 * 1000) // fits in cache #define FREQ 5003.123 static double timeval_to_double (const struct timeval *tv) { return (double) tv->tv_sec + (double) tv->tv_usec * 1e-6; } static void benchmark (void test (float *x, float *y), const char *implementation_name) { #ifdef HAVE_SYS_RESOURCE_H struct rusage rusage_start; struct rusage rusage_stop; #else double clock_start; double clock_end; #endif float output[2*BLOCK_SIZE]; float *x = &output[0], *y = &output[BLOCK_SIZE]; // touch memory memset(output, 0, 2*BLOCK_SIZE*sizeof(float)); // get starting CPU usage #ifdef HAVE_SYS_RESOURCE_H if (getrusage (RUSAGE_SELF, &rusage_start) < 0){ perror ("getrusage"); exit (1); } #else clock_start = (double) clock() * (1000000. / CLOCKS_PER_SEC); #endif // do the actual work test (x, y); // get ending CPU usage #ifdef HAVE_SYS_RESOURCE_H if (getrusage (RUSAGE_SELF, &rusage_stop) < 0){ perror ("getrusage"); exit (1); } // compute results double user = timeval_to_double (&rusage_stop.ru_utime) - timeval_to_double (&rusage_start.ru_utime); double sys = timeval_to_double (&rusage_stop.ru_stime) - timeval_to_double (&rusage_start.ru_stime); double total = user + sys; #else clock_end = (double) clock () * (1000000. / CLOCKS_PER_SEC); double total = clock_end - clock_start; #endif printf ("%18s: cpu: %6.3f steps/sec: %10.3e\n", implementation_name, total, ITERATIONS / total); } // ---------------------------------------------------------------- // Don't compare the _vec with other functions since memory store's // are involved. void basic_sincos_vec (float *x, float *y) { gr_nco nco; nco.set_freq (2 * M_PI / FREQ); for (int i = 0; i < ITERATIONS/BLOCK_SIZE; i++){ for (int j = 0; j < BLOCK_SIZE; j++){ nco.sincos (&x[2*j+1], &x[2*j]); nco.step (); } } } void native_sincos_vec (float *x, float *y) { gr_nco nco; nco.set_freq (2 * M_PI / FREQ); for (int i = 0; i < ITERATIONS/BLOCK_SIZE; i++){ nco.sincos ((gr_complex*)x, BLOCK_SIZE); } } void fxpt_sincos_vec (float *x, float *y) { gr_fxpt_nco nco; nco.set_freq (2 * M_PI / FREQ); for (int i = 0; i < ITERATIONS/BLOCK_SIZE; i++){ nco.sincos ((gr_complex*)x, BLOCK_SIZE); } } // ---------------------------------------------------------------- void native_sincos (float *x, float *y) { gr_nco nco; nco.set_freq (2 * M_PI / FREQ); for (int i = 0; i < ITERATIONS; i++){ nco.sincos (x, y); nco.step (); } } void fxpt_sincos (float *x, float *y) { gr_fxpt_nco nco; nco.set_freq (2 * M_PI / FREQ); for (int i = 0; i < ITERATIONS; i++){ nco.sincos (x, y); nco.step (); } } // ---------------------------------------------------------------- void native_sin (float *x, float *y) { gr_nco nco; nco.set_freq (2 * M_PI / FREQ); for (int i = 0; i < ITERATIONS; i++){ *x = nco.sin (); nco.step (); } } void fxpt_sin (float *x, float *y) { gr_fxpt_nco nco; nco.set_freq (2 * M_PI / FREQ); for (int i = 0; i < ITERATIONS; i++){ *x = nco.sin (); nco.step (); } } // ---------------------------------------------------------------- void nop_fct (float *x, float *y) { } void nop_loop (float *x, float *y) { for (int i = 0; i < ITERATIONS; i++){ nop_fct (x, y); } } int main (int argc, char **argv) { benchmark (nop_loop, "nop loop"); benchmark (native_sin, "native sine"); benchmark (fxpt_sin, "fxpt sine"); benchmark (native_sincos, "native sin/cos"); benchmark (fxpt_sincos, "fxpt sin/cos"); benchmark (basic_sincos_vec, "basic sin/cos vec"); benchmark (native_sincos_vec, "native sin/cos vec"); benchmark (fxpt_sincos_vec, "fxpt sin/cos vec"); }