root / gnuradio-core / src / tests / benchmark_nco.cc @ 9967e2e7
History | View | Annotate | Download (4.8 kB)
| 1 | 5d69a524 | jcorgan | /* -*- c++ -*- */
|
|---|---|---|---|
| 2 | 5d69a524 | jcorgan | /*
|
| 3 | 5d69a524 | jcorgan | * Copyright 2002,2004 Free Software Foundation, Inc. |
| 4 | 5d69a524 | jcorgan | * |
| 5 | 5d69a524 | jcorgan | * This file is part of GNU Radio |
| 6 | 5d69a524 | jcorgan | * |
| 7 | 5d69a524 | jcorgan | * GNU Radio is free software; you can redistribute it and/or modify |
| 8 | 5d69a524 | jcorgan | * it under the terms of the GNU General Public License as published by |
| 9 | 937b719d | eb | * the Free Software Foundation; either version 3, or (at your option) |
| 10 | 5d69a524 | jcorgan | * any later version. |
| 11 | 5d69a524 | jcorgan | * |
| 12 | 5d69a524 | jcorgan | * GNU Radio is distributed in the hope that it will be useful, |
| 13 | 5d69a524 | jcorgan | * but WITHOUT ANY WARRANTY; without even the implied warranty of |
| 14 | 5d69a524 | jcorgan | * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the |
| 15 | 5d69a524 | jcorgan | * GNU General Public License for more details. |
| 16 | 5d69a524 | jcorgan | * |
| 17 | 5d69a524 | jcorgan | * You should have received a copy of the GNU General Public License |
| 18 | 5d69a524 | jcorgan | * along with GNU Radio; see the file COPYING. If not, write to |
| 19 | 86f5c924 | eb | * the Free Software Foundation, Inc., 51 Franklin Street, |
| 20 | 86f5c924 | eb | * Boston, MA 02110-1301, USA. |
| 21 | 5d69a524 | jcorgan | */ |
#ifdef HAVE_CONFIG_H
#include "config.h"
#endif
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <time.h>
#include <sys/time.h>
#ifdef HAVE_SYS_RESOURCE_H
#include <sys/resource.h>
#endif
#include <unistd.h>
#include <gr_nco.h>
#include <gr_fxpt_nco.h>
| 33 | 5d69a524 | jcorgan | |
// Total number of NCO steps each benchmark case performs.
#define	ITERATIONS	20000000

// Number of samples handled per pass by the *_vec cases; the vector loops
// run ITERATIONS / BLOCK_SIZE passes.
#define BLOCK_SIZE	(10 * 1000)	// fits in cache

// Every case passes 2 * M_PI / FREQ to the NCO's set_freq().
#define FREQ	5003.123
| 38 | 5d69a524 | jcorgan | |
// Convert a struct timeval into seconds expressed as a double.
//
// tv      - time value to convert; must not be null.
// returns - tv_sec plus tv_usec scaled by 1e-6.
static double
timeval_to_double (const struct timeval *tv)
{
  const double whole_seconds = (double) tv->tv_sec;
  const double fractional_seconds = (double) tv->tv_usec * 1e-6;

  return whole_seconds + fractional_seconds;
}
| 44 | 5d69a524 | jcorgan | |
| 45 | 5d69a524 | jcorgan | |
| 46 | 5d69a524 | jcorgan | static void |
| 47 | 5d69a524 | jcorgan | benchmark (void test (float *x, float *y), const char *implementation_name) |
| 48 | 5d69a524 | jcorgan | {
|
| 49 | 5d69a524 | jcorgan | #ifdef HAVE_SYS_RESOURCE_H
|
| 50 | 5d69a524 | jcorgan | struct rusage rusage_start;
|
| 51 | 5d69a524 | jcorgan | struct rusage rusage_stop;
|
| 52 | 5d69a524 | jcorgan | #else
|
| 53 | 5d69a524 | jcorgan | double clock_start;
|
| 54 | 5d69a524 | jcorgan | double clock_end;
|
| 55 | 5d69a524 | jcorgan | #endif
|
| 56 | 5d69a524 | jcorgan | float output[2*BLOCK_SIZE]; |
| 57 | 5d69a524 | jcorgan | float *x = &output[0], *y = &output[BLOCK_SIZE]; |
| 58 | 5d69a524 | jcorgan | |
| 59 | 5d69a524 | jcorgan | // touch memory
|
| 60 | 5d69a524 | jcorgan | memset(output, 0, 2*BLOCK_SIZE*sizeof(float)); |
| 61 | 5d69a524 | jcorgan | |
| 62 | 5d69a524 | jcorgan | // get starting CPU usage
|
| 63 | 5d69a524 | jcorgan | #ifdef HAVE_SYS_RESOURCE_H
|
| 64 | 5d69a524 | jcorgan | if (getrusage (RUSAGE_SELF, &rusage_start) < 0){ |
| 65 | 5d69a524 | jcorgan | perror ("getrusage");
|
| 66 | 5d69a524 | jcorgan | exit (1);
|
| 67 | 5d69a524 | jcorgan | } |
| 68 | 5d69a524 | jcorgan | #else
|
| 69 | 5d69a524 | jcorgan | clock_start = (double) clock() * (1000000. / CLOCKS_PER_SEC); |
| 70 | 5d69a524 | jcorgan | #endif
|
| 71 | 5d69a524 | jcorgan | // do the actual work
|
| 72 | 5d69a524 | jcorgan | |
| 73 | 5d69a524 | jcorgan | test (x, y); |
| 74 | 5d69a524 | jcorgan | |
| 75 | 5d69a524 | jcorgan | // get ending CPU usage
|
| 76 | 5d69a524 | jcorgan | |
| 77 | 5d69a524 | jcorgan | #ifdef HAVE_SYS_RESOURCE_H
|
| 78 | 5d69a524 | jcorgan | if (getrusage (RUSAGE_SELF, &rusage_stop) < 0){ |
| 79 | 5d69a524 | jcorgan | perror ("getrusage");
|
| 80 | 5d69a524 | jcorgan | exit (1);
|
| 81 | 5d69a524 | jcorgan | } |
| 82 | 5d69a524 | jcorgan | |
| 83 | 5d69a524 | jcorgan | // compute results
|
| 84 | 5d69a524 | jcorgan | |
| 85 | 5d69a524 | jcorgan | double user =
|
| 86 | 5d69a524 | jcorgan | timeval_to_double (&rusage_stop.ru_utime) |
| 87 | 5d69a524 | jcorgan | - timeval_to_double (&rusage_start.ru_utime); |
| 88 | 5d69a524 | jcorgan | |
| 89 | 5d69a524 | jcorgan | double sys =
|
| 90 | 5d69a524 | jcorgan | timeval_to_double (&rusage_stop.ru_stime) |
| 91 | 5d69a524 | jcorgan | - timeval_to_double (&rusage_start.ru_stime); |
| 92 | 5d69a524 | jcorgan | |
| 93 | 5d69a524 | jcorgan | double total = user + sys;
|
| 94 | 5d69a524 | jcorgan | #else
|
| 95 | 5d69a524 | jcorgan | clock_end = (double) clock () * (1000000. / CLOCKS_PER_SEC); |
| 96 | 5d69a524 | jcorgan | double total = clock_end - clock_start;
|
| 97 | 5d69a524 | jcorgan | #endif
|
| 98 | 5d69a524 | jcorgan | |
| 99 | 5d69a524 | jcorgan | printf ("%18s: cpu: %6.3f steps/sec: %10.3e\n",
|
| 100 | 5d69a524 | jcorgan | implementation_name, total, ITERATIONS / total); |
| 101 | 5d69a524 | jcorgan | } |
| 102 | 5d69a524 | jcorgan | |
| 103 | 5d69a524 | jcorgan | // ----------------------------------------------------------------
|
// Don't compare the _vec variants with the other functions, since
// memory stores are involved.
|
| 106 | 5d69a524 | jcorgan | |
| 107 | 5d69a524 | jcorgan | void basic_sincos_vec (float *x, float *y) |
| 108 | 5d69a524 | jcorgan | {
|
| 109 | 5d69a524 | jcorgan | gr_nco<float,float> nco; |
| 110 | 5d69a524 | jcorgan | |
| 111 | 5d69a524 | jcorgan | nco.set_freq (2 * M_PI / FREQ);
|
| 112 | 5d69a524 | jcorgan | |
| 113 | 5d69a524 | jcorgan | for (int i = 0; i < ITERATIONS/BLOCK_SIZE; i++){ |
| 114 | 5d69a524 | jcorgan | for (int j = 0; j < BLOCK_SIZE; j++){ |
| 115 | 5d69a524 | jcorgan | nco.sincos (&x[2*j+1], &x[2*j]); |
| 116 | 5d69a524 | jcorgan | nco.step (); |
| 117 | 5d69a524 | jcorgan | } |
| 118 | 5d69a524 | jcorgan | } |
| 119 | 5d69a524 | jcorgan | } |
| 120 | 5d69a524 | jcorgan | |
| 121 | 5d69a524 | jcorgan | void native_sincos_vec (float *x, float *y) |
| 122 | 5d69a524 | jcorgan | {
|
| 123 | 5d69a524 | jcorgan | gr_nco<float,float> nco; |
| 124 | 5d69a524 | jcorgan | |
| 125 | 5d69a524 | jcorgan | nco.set_freq (2 * M_PI / FREQ);
|
| 126 | 5d69a524 | jcorgan | |
| 127 | 5d69a524 | jcorgan | for (int i = 0; i < ITERATIONS/BLOCK_SIZE; i++){ |
| 128 | 5d69a524 | jcorgan | nco.sincos ((gr_complex*)x, BLOCK_SIZE); |
| 129 | 5d69a524 | jcorgan | } |
| 130 | 5d69a524 | jcorgan | } |
| 131 | 5d69a524 | jcorgan | |
| 132 | 5d69a524 | jcorgan | void fxpt_sincos_vec (float *x, float *y) |
| 133 | 5d69a524 | jcorgan | {
|
| 134 | 5d69a524 | jcorgan | gr_fxpt_nco nco; |
| 135 | 5d69a524 | jcorgan | |
| 136 | 5d69a524 | jcorgan | nco.set_freq (2 * M_PI / FREQ);
|
| 137 | 5d69a524 | jcorgan | |
| 138 | 5d69a524 | jcorgan | for (int i = 0; i < ITERATIONS/BLOCK_SIZE; i++){ |
| 139 | 5d69a524 | jcorgan | nco.sincos ((gr_complex*)x, BLOCK_SIZE); |
| 140 | 5d69a524 | jcorgan | } |
| 141 | 5d69a524 | jcorgan | } |
| 142 | 5d69a524 | jcorgan | |
| 143 | 5d69a524 | jcorgan | // ----------------------------------------------------------------
|
| 144 | 5d69a524 | jcorgan | |
| 145 | 5d69a524 | jcorgan | void native_sincos (float *x, float *y) |
| 146 | 5d69a524 | jcorgan | {
|
| 147 | 5d69a524 | jcorgan | gr_nco<float,float> nco; |
| 148 | 5d69a524 | jcorgan | |
| 149 | 5d69a524 | jcorgan | nco.set_freq (2 * M_PI / FREQ);
|
| 150 | 5d69a524 | jcorgan | |
| 151 | 5d69a524 | jcorgan | for (int i = 0; i < ITERATIONS; i++){ |
| 152 | 5d69a524 | jcorgan | nco.sincos (x, y); |
| 153 | 5d69a524 | jcorgan | nco.step (); |
| 154 | 5d69a524 | jcorgan | } |
| 155 | 5d69a524 | jcorgan | } |
| 156 | 5d69a524 | jcorgan | |
| 157 | 5d69a524 | jcorgan | void fxpt_sincos (float *x, float *y) |
| 158 | 5d69a524 | jcorgan | {
|
| 159 | 5d69a524 | jcorgan | gr_fxpt_nco nco; |
| 160 | 5d69a524 | jcorgan | |
| 161 | 5d69a524 | jcorgan | nco.set_freq (2 * M_PI / FREQ);
|
| 162 | 5d69a524 | jcorgan | |
| 163 | 5d69a524 | jcorgan | for (int i = 0; i < ITERATIONS; i++){ |
| 164 | 5d69a524 | jcorgan | nco.sincos (x, y); |
| 165 | 5d69a524 | jcorgan | nco.step (); |
| 166 | 5d69a524 | jcorgan | } |
| 167 | 5d69a524 | jcorgan | } |
| 168 | 5d69a524 | jcorgan | |
| 169 | 5d69a524 | jcorgan | // ----------------------------------------------------------------
|
| 170 | 5d69a524 | jcorgan | |
| 171 | 5d69a524 | jcorgan | void native_sin (float *x, float *y) |
| 172 | 5d69a524 | jcorgan | {
|
| 173 | 5d69a524 | jcorgan | gr_nco<float,float> nco; |
| 174 | 5d69a524 | jcorgan | |
| 175 | 5d69a524 | jcorgan | nco.set_freq (2 * M_PI / FREQ);
|
| 176 | 5d69a524 | jcorgan | |
| 177 | 5d69a524 | jcorgan | for (int i = 0; i < ITERATIONS; i++){ |
| 178 | 5d69a524 | jcorgan | *x = nco.sin (); |
| 179 | 5d69a524 | jcorgan | nco.step (); |
| 180 | 5d69a524 | jcorgan | } |
| 181 | 5d69a524 | jcorgan | } |
| 182 | 5d69a524 | jcorgan | |
| 183 | 5d69a524 | jcorgan | void fxpt_sin (float *x, float *y) |
| 184 | 5d69a524 | jcorgan | {
|
| 185 | 5d69a524 | jcorgan | gr_fxpt_nco nco; |
| 186 | 5d69a524 | jcorgan | |
| 187 | 5d69a524 | jcorgan | nco.set_freq (2 * M_PI / FREQ);
|
| 188 | 5d69a524 | jcorgan | |
| 189 | 5d69a524 | jcorgan | for (int i = 0; i < ITERATIONS; i++){ |
| 190 | 5d69a524 | jcorgan | *x = nco.sin (); |
| 191 | 5d69a524 | jcorgan | nco.step (); |
| 192 | 5d69a524 | jcorgan | } |
| 193 | 5d69a524 | jcorgan | } |
| 194 | 5d69a524 | jcorgan | |
| 195 | 5d69a524 | jcorgan | // ----------------------------------------------------------------
|
| 196 | 5d69a524 | jcorgan | |
// Deliberately empty routine; nop_loop() calls it as its loop body.
// Neither x nor y is read or written.
void nop_fct (float *x, float *y)
{
  (void) x;
  (void) y;
}
| 200 | 5d69a524 | jcorgan | |
| 201 | 5d69a524 | jcorgan | void nop_loop (float *x, float *y) |
| 202 | 5d69a524 | jcorgan | {
|
| 203 | 5d69a524 | jcorgan | for (int i = 0; i < ITERATIONS; i++){ |
| 204 | 5d69a524 | jcorgan | nop_fct (x, y); |
| 205 | 5d69a524 | jcorgan | } |
| 206 | 5d69a524 | jcorgan | } |
| 207 | 5d69a524 | jcorgan | |
| 208 | 5d69a524 | jcorgan | int
|
| 209 | 5d69a524 | jcorgan | main (int argc, char **argv) |
| 210 | 5d69a524 | jcorgan | {
|
| 211 | 5d69a524 | jcorgan | benchmark (nop_loop, "nop loop");
|
| 212 | 5d69a524 | jcorgan | benchmark (native_sin, "native sine");
|
| 213 | 5d69a524 | jcorgan | benchmark (fxpt_sin, "fxpt sine");
|
| 214 | 5d69a524 | jcorgan | benchmark (native_sincos, "native sin/cos");
|
| 215 | 5d69a524 | jcorgan | benchmark (fxpt_sincos, "fxpt sin/cos");
|
| 216 | 5d69a524 | jcorgan | benchmark (basic_sincos_vec, "basic sin/cos vec");
|
| 217 | 5d69a524 | jcorgan | benchmark (native_sincos_vec, "native sin/cos vec");
|
| 218 | 5d69a524 | jcorgan | benchmark (fxpt_sincos_vec, "fxpt sin/cos vec");
|
| 219 | 5d69a524 | jcorgan | } |