Statistics
| Branch: | Tag: | Revision:

root / gnuradio-core / src / tests / benchmark_nco.cc @ 9967e2e7

History | View | Annotate | Download (4.8 kB)

1 5d69a524 jcorgan
/* -*- c++ -*- */
2 5d69a524 jcorgan
/*
3 5d69a524 jcorgan
 * Copyright 2002,2004 Free Software Foundation, Inc.
4 5d69a524 jcorgan
 *
5 5d69a524 jcorgan
 * This file is part of GNU Radio
6 5d69a524 jcorgan
 *
7 5d69a524 jcorgan
 * GNU Radio is free software; you can redistribute it and/or modify
8 5d69a524 jcorgan
 * it under the terms of the GNU General Public License as published by
9 937b719d eb
 * the Free Software Foundation; either version 3, or (at your option)
10 5d69a524 jcorgan
 * any later version.
11 5d69a524 jcorgan
 *
12 5d69a524 jcorgan
 * GNU Radio is distributed in the hope that it will be useful,
13 5d69a524 jcorgan
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
14 5d69a524 jcorgan
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
15 5d69a524 jcorgan
 * GNU General Public License for more details.
16 5d69a524 jcorgan
 *
17 5d69a524 jcorgan
 * You should have received a copy of the GNU General Public License
18 5d69a524 jcorgan
 * along with GNU Radio; see the file COPYING.  If not, write to
19 86f5c924 eb
 * the Free Software Foundation, Inc., 51 Franklin Street,
20 86f5c924 eb
 * Boston, MA 02110-1301, USA.
21 5d69a524 jcorgan
 */
22 5d69a524 jcorgan
#ifdef HAVE_CONFIG_H
23 5d69a524 jcorgan
#include "config.h"
24 5d69a524 jcorgan
#endif
25 5d69a524 jcorgan
#include <stdio.h>
26 5d69a524 jcorgan
#include <sys/time.h>
27 5d69a524 jcorgan
#ifdef HAVE_SYS_RESOURCE_H
28 5d69a524 jcorgan
#include <sys/resource.h>
29 5d69a524 jcorgan
#endif
30 5d69a524 jcorgan
#include <unistd.h>
31 5d69a524 jcorgan
#include <gr_nco.h>
32 5d69a524 jcorgan
#include <gr_fxpt_nco.h>
33 5d69a524 jcorgan
34 5d69a524 jcorgan
// Total number of NCO steps each benchmarked routine is written to perform;
// also the numerator of the reported steps/sec figure.
#define ITERATIONS        20000000
35 5d69a524 jcorgan
// Number of samples produced per block by the *_vec benchmarks; they run
// ITERATIONS/BLOCK_SIZE blocks.
#define BLOCK_SIZE        (10 * 1000)        // fits in cache
36 5d69a524 jcorgan
37 5d69a524 jcorgan
// Every benchmark programs its NCO with set_freq (2 * M_PI / FREQ).
#define FREQ        5003.123
38 5d69a524 jcorgan
39 5d69a524 jcorgan
/*
 * Convert a struct timeval into a single floating-point number of seconds.
 *
 * tv: time value to convert; must not be NULL.
 * Returns tv_sec plus tv_usec scaled from microseconds to seconds.
 */
static double
timeval_to_double (const struct timeval *tv)
{
  const double whole_seconds = (double) tv->tv_sec;
  const double fractional_seconds = (double) tv->tv_usec * 1e-6;

  return whole_seconds + fractional_seconds;
}
44 5d69a524 jcorgan
45 5d69a524 jcorgan
46 5d69a524 jcorgan
static void
47 5d69a524 jcorgan
benchmark (void test (float *x, float *y), const char *implementation_name)
48 5d69a524 jcorgan
{
49 5d69a524 jcorgan
#ifdef HAVE_SYS_RESOURCE_H
50 5d69a524 jcorgan
  struct rusage        rusage_start;
51 5d69a524 jcorgan
  struct rusage        rusage_stop;
52 5d69a524 jcorgan
#else
53 5d69a524 jcorgan
  double clock_start;
54 5d69a524 jcorgan
  double clock_end;
55 5d69a524 jcorgan
#endif
56 5d69a524 jcorgan
  float output[2*BLOCK_SIZE];
57 5d69a524 jcorgan
  float *x = &output[0], *y = &output[BLOCK_SIZE];
58 5d69a524 jcorgan
59 5d69a524 jcorgan
  // touch memory
60 5d69a524 jcorgan
  memset(output, 0, 2*BLOCK_SIZE*sizeof(float));
61 5d69a524 jcorgan
62 5d69a524 jcorgan
  // get starting CPU usage
63 5d69a524 jcorgan
#ifdef HAVE_SYS_RESOURCE_H
64 5d69a524 jcorgan
  if (getrusage (RUSAGE_SELF, &rusage_start) < 0){
65 5d69a524 jcorgan
    perror ("getrusage");
66 5d69a524 jcorgan
    exit (1);
67 5d69a524 jcorgan
  }
68 5d69a524 jcorgan
#else
69 5d69a524 jcorgan
  clock_start = (double) clock() * (1000000. / CLOCKS_PER_SEC);
70 5d69a524 jcorgan
#endif
71 5d69a524 jcorgan
  // do the actual work
72 5d69a524 jcorgan
73 5d69a524 jcorgan
  test (x, y);
74 5d69a524 jcorgan
75 5d69a524 jcorgan
  // get ending CPU usage
76 5d69a524 jcorgan
77 5d69a524 jcorgan
#ifdef HAVE_SYS_RESOURCE_H
78 5d69a524 jcorgan
  if (getrusage (RUSAGE_SELF, &rusage_stop) < 0){
79 5d69a524 jcorgan
    perror ("getrusage");
80 5d69a524 jcorgan
    exit (1);
81 5d69a524 jcorgan
  }
82 5d69a524 jcorgan
83 5d69a524 jcorgan
  // compute results
84 5d69a524 jcorgan
85 5d69a524 jcorgan
  double user =
86 5d69a524 jcorgan
    timeval_to_double (&rusage_stop.ru_utime)
87 5d69a524 jcorgan
    - timeval_to_double (&rusage_start.ru_utime);
88 5d69a524 jcorgan
89 5d69a524 jcorgan
  double sys =
90 5d69a524 jcorgan
    timeval_to_double (&rusage_stop.ru_stime)
91 5d69a524 jcorgan
    - timeval_to_double (&rusage_start.ru_stime);
92 5d69a524 jcorgan
93 5d69a524 jcorgan
  double total = user + sys;
94 5d69a524 jcorgan
#else
95 5d69a524 jcorgan
  clock_end = (double) clock () * (1000000. / CLOCKS_PER_SEC);
96 5d69a524 jcorgan
  double total = clock_end - clock_start;
97 5d69a524 jcorgan
#endif
98 5d69a524 jcorgan
99 5d69a524 jcorgan
  printf ("%18s:  cpu: %6.3f  steps/sec: %10.3e\n",
100 5d69a524 jcorgan
          implementation_name, total, ITERATIONS / total);
101 5d69a524 jcorgan
}
102 5d69a524 jcorgan
103 5d69a524 jcorgan
// ----------------------------------------------------------------
104 5d69a524 jcorgan
// Don't compare the _vec with other functions since memory stores
105 5d69a524 jcorgan
// are involved.
106 5d69a524 jcorgan
107 5d69a524 jcorgan
void basic_sincos_vec (float *x, float *y)
108 5d69a524 jcorgan
{
109 5d69a524 jcorgan
  gr_nco<float,float>        nco;
110 5d69a524 jcorgan
111 5d69a524 jcorgan
  nco.set_freq (2 * M_PI / FREQ);
112 5d69a524 jcorgan
113 5d69a524 jcorgan
  for (int i = 0; i < ITERATIONS/BLOCK_SIZE; i++){
114 5d69a524 jcorgan
    for (int j = 0; j < BLOCK_SIZE; j++){
115 5d69a524 jcorgan
      nco.sincos (&x[2*j+1], &x[2*j]);
116 5d69a524 jcorgan
      nco.step ();
117 5d69a524 jcorgan
    }
118 5d69a524 jcorgan
  }
119 5d69a524 jcorgan
}
120 5d69a524 jcorgan
121 5d69a524 jcorgan
void native_sincos_vec (float *x, float *y)
122 5d69a524 jcorgan
{
123 5d69a524 jcorgan
  gr_nco<float,float>        nco;
124 5d69a524 jcorgan
125 5d69a524 jcorgan
  nco.set_freq (2 * M_PI / FREQ);
126 5d69a524 jcorgan
 
127 5d69a524 jcorgan
  for (int i = 0; i < ITERATIONS/BLOCK_SIZE; i++){
128 5d69a524 jcorgan
    nco.sincos ((gr_complex*)x, BLOCK_SIZE);
129 5d69a524 jcorgan
  }
130 5d69a524 jcorgan
}
131 5d69a524 jcorgan
132 5d69a524 jcorgan
void fxpt_sincos_vec (float *x, float *y)
133 5d69a524 jcorgan
{
134 5d69a524 jcorgan
  gr_fxpt_nco        nco;
135 5d69a524 jcorgan
  
136 5d69a524 jcorgan
  nco.set_freq (2 * M_PI / FREQ);
137 5d69a524 jcorgan
  
138 5d69a524 jcorgan
  for (int i = 0; i < ITERATIONS/BLOCK_SIZE; i++){
139 5d69a524 jcorgan
    nco.sincos ((gr_complex*)x, BLOCK_SIZE);
140 5d69a524 jcorgan
  }
141 5d69a524 jcorgan
}
142 5d69a524 jcorgan
143 5d69a524 jcorgan
// ----------------------------------------------------------------
144 5d69a524 jcorgan
145 5d69a524 jcorgan
void native_sincos (float *x, float *y)
146 5d69a524 jcorgan
{
147 5d69a524 jcorgan
  gr_nco<float,float>        nco;
148 5d69a524 jcorgan
149 5d69a524 jcorgan
  nco.set_freq (2 * M_PI / FREQ);
150 5d69a524 jcorgan
151 5d69a524 jcorgan
  for (int i = 0; i < ITERATIONS; i++){
152 5d69a524 jcorgan
    nco.sincos (x, y);
153 5d69a524 jcorgan
    nco.step ();
154 5d69a524 jcorgan
  }
155 5d69a524 jcorgan
}
156 5d69a524 jcorgan
157 5d69a524 jcorgan
void fxpt_sincos (float *x, float *y)
158 5d69a524 jcorgan
{
159 5d69a524 jcorgan
  gr_fxpt_nco        nco;
160 5d69a524 jcorgan
161 5d69a524 jcorgan
  nco.set_freq (2 * M_PI / FREQ);
162 5d69a524 jcorgan
163 5d69a524 jcorgan
  for (int i = 0; i < ITERATIONS; i++){
164 5d69a524 jcorgan
    nco.sincos (x, y);
165 5d69a524 jcorgan
    nco.step ();
166 5d69a524 jcorgan
  }
167 5d69a524 jcorgan
}
168 5d69a524 jcorgan
169 5d69a524 jcorgan
// ----------------------------------------------------------------
170 5d69a524 jcorgan
171 5d69a524 jcorgan
void native_sin (float *x, float *y)
172 5d69a524 jcorgan
{
173 5d69a524 jcorgan
  gr_nco<float,float>        nco;
174 5d69a524 jcorgan
175 5d69a524 jcorgan
  nco.set_freq (2 * M_PI / FREQ);
176 5d69a524 jcorgan
177 5d69a524 jcorgan
  for (int i = 0; i < ITERATIONS; i++){
178 5d69a524 jcorgan
    *x = nco.sin ();
179 5d69a524 jcorgan
    nco.step ();
180 5d69a524 jcorgan
  }
181 5d69a524 jcorgan
}
182 5d69a524 jcorgan
183 5d69a524 jcorgan
void fxpt_sin (float *x, float *y)
184 5d69a524 jcorgan
{
185 5d69a524 jcorgan
  gr_fxpt_nco        nco;
186 5d69a524 jcorgan
187 5d69a524 jcorgan
  nco.set_freq (2 * M_PI / FREQ);
188 5d69a524 jcorgan
189 5d69a524 jcorgan
  for (int i = 0; i < ITERATIONS; i++){
190 5d69a524 jcorgan
    *x = nco.sin ();
191 5d69a524 jcorgan
    nco.step ();
192 5d69a524 jcorgan
  }
193 5d69a524 jcorgan
}
194 5d69a524 jcorgan
195 5d69a524 jcorgan
// ----------------------------------------------------------------
196 5d69a524 jcorgan
197 5d69a524 jcorgan
/*
 * Deliberately empty routine with the same signature as the benchmarked
 * functions.  Neither argument is read or written.
 */
void nop_fct (float *x, float *y)
{
  (void) x;
  (void) y;
}
200 5d69a524 jcorgan
201 5d69a524 jcorgan
void nop_loop (float *x, float *y)
202 5d69a524 jcorgan
{
203 5d69a524 jcorgan
  for (int i = 0; i < ITERATIONS; i++){
204 5d69a524 jcorgan
    nop_fct (x, y);
205 5d69a524 jcorgan
  }
206 5d69a524 jcorgan
}
207 5d69a524 jcorgan
208 5d69a524 jcorgan
int
209 5d69a524 jcorgan
main (int argc, char **argv)
210 5d69a524 jcorgan
{
211 5d69a524 jcorgan
  benchmark (nop_loop, "nop loop");
212 5d69a524 jcorgan
  benchmark (native_sin, "native sine");
213 5d69a524 jcorgan
  benchmark (fxpt_sin, "fxpt sine");
214 5d69a524 jcorgan
  benchmark (native_sincos, "native sin/cos");
215 5d69a524 jcorgan
  benchmark (fxpt_sincos, "fxpt sin/cos");
216 5d69a524 jcorgan
  benchmark (basic_sincos_vec, "basic sin/cos vec");
217 5d69a524 jcorgan
  benchmark (native_sincos_vec, "native sin/cos vec");
218 5d69a524 jcorgan
  benchmark (fxpt_sincos_vec, "fxpt sin/cos vec");
219 5d69a524 jcorgan
}