about summary refs log tree commit diff
path: root/benchtests/bench-skeleton.c
blob: 7359184ba8f4d7da1b64e896df668386f75bd1c3 (plain) (blame)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
/* Skeleton for benchmark programs.
   Copyright (C) 2013 Free Software Foundation, Inc.
   This file is part of the GNU C Library.

   The GNU C Library is free software; you can redistribute it and/or
   modify it under the terms of the GNU Lesser General Public
   License as published by the Free Software Foundation; either
   version 2.1 of the License, or (at your option) any later version.

   The GNU C Library is distributed in the hope that it will be useful,
   but WITHOUT ANY WARRANTY; without even the implied warranty of
   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
   Lesser General Public License for more details.

   You should have received a copy of the GNU Lesser General Public
   License along with the GNU C Library; if not, see
   <http://www.gnu.org/licenses/>.  */

#include <string.h>
#include <stdint.h>
#include <stdio.h>
#include <time.h>
#include <inttypes.h>

/* Evaluate to nonzero when timespec A is later than timespec B.  The seconds
   fields decide unless they are equal, in which case the nanoseconds fields
   are compared.  Each argument may be evaluated more than once.  */
#define TIMESPEC_AFTER(a, b) \
  (((a).tv_sec != (b).tv_sec) \
   ? ((a).tv_sec > (b).tv_sec) \
   : ((a).tv_nsec > (b).tv_nsec))
/* Benchmark driver.  For each variant V in [0, NUM_VARIANTS), repeatedly time
   batches of BENCH_FUNC (V, I) calls for every sample I in
   [0, NUM_SAMPLES (V)) until roughly DURATION seconds of wall-clock time have
   passed, then print one summary line for the variant.

   NUM_VARIANTS, NUM_SAMPLES, BENCH_FUNC, VARIANT and DURATION are not defined
   in this file; presumably the benchmark that includes this skeleton provides
   them.

   ARGC and ARGV are unused.  Returns 0 on success and 1 if a required clock
   cannot be queried.  */
int
main (int argc, char **argv)
{
  unsigned long i, k;
  struct timespec start, end, runtime;

  memset (&runtime, 0, sizeof (runtime));
  memset (&start, 0, sizeof (start));
  memset (&end, 0, sizeof (end));

  /* Without a usable CPU-time clock no measurement is possible, so fail
     early instead of spinning for DURATION seconds and printing garbage.  */
  if (clock_getres (CLOCK_PROCESS_CPUTIME_ID, &start) != 0)
    {
      perror ("clock_getres");
      return 1;
    }

  /* Measure 1000 times the resolution of the clock.  So for a 1ns resolution
     clock, we measure 1000 iterations of the function call at a time.
     Measurements close to the minimum clock resolution won't make much sense,
     but it's better than having nothing at all.  */
  unsigned long iters = 1000 * start.tv_nsec;

  /* A zero batch size would time empty loops and divide by zero when the
     per-iteration figures are printed.  */
  if (iters == 0)
    {
      fprintf (stderr, "clock_getres: unusable clock resolution\n");
      return 1;
    }

  for (int v = 0; v < NUM_VARIANTS; v++)
    {
      /* Run for approximately DURATION seconds.  RUNTIME holds the
         wall-clock deadline for this variant.  */
      if (clock_gettime (CLOCK_MONOTONIC_RAW, &runtime) != 0)
        {
          perror ("clock_gettime");
          return 1;
        }
      runtime.tv_sec += DURATION;

      double d_total_i = 0;
      uint64_t total = 0, max = 0, min = 0x7fffffffffffffff;
      int deadline_passed = 0;

      while (!deadline_passed)
        {
          for (i = 0; i < NUM_SAMPLES (v); i++)
            {
              clock_gettime (CLOCK_PROCESS_CPUTIME_ID, &start);
              for (k = 0; k < iters; k++)
                BENCH_FUNC (v, i);
              clock_gettime (CLOCK_PROCESS_CPUTIME_ID, &end);

              /* Elapsed CPU time for this batch, in nanoseconds.  */
              uint64_t cur = (end.tv_nsec - start.tv_nsec
                              + ((end.tv_sec - start.tv_sec)
                                 * (uint64_t) 1000000000));

              if (cur > max)
                max = cur;

              if (cur < min)
                min = cur;

              total += cur;

              d_total_i += iters;
            }

          struct timespec curtime;

          memset (&curtime, 0, sizeof (curtime));
          /* If this call failed silently CURTIME would stay zero and the
             deadline would never be reached, so treat failure as fatal.  */
          if (clock_gettime (CLOCK_MONOTONIC_RAW, &curtime) != 0)
            {
              perror ("clock_gettime");
              return 1;
            }
          deadline_passed = TIMESPEC_AFTER (curtime, runtime);
        }

      /* TOTAL is in nanoseconds; MAX and MIN are per-batch times, so divide
         by the batch size to report them per iteration.  */
      double d_total_s = total * 1e-9;
      double d_iters = iters;

      printf ("%s: ITERS:%g: TOTAL:%gs, MAX:%gns, MIN:%gns, %g iter/s\n",
              VARIANT (v),
              d_total_i, d_total_s, max / d_iters, min / d_iters,
              d_total_i / d_total_s);
    }

  return 0;
}