| /* |
| * Test null syscall performance |
| * |
| * Copyright (C) 2009-2015 Anton Blanchard, IBM |
| * |
| * This program is free software; you can redistribute it and/or |
| * modify it under the terms of the GNU General Public License |
| * as published by the Free Software Foundation; either version |
| * 2 of the License, or (at your option) any later version. |
| */ |
| |
| #define NR_LOOPS 10000000 |
| |
| #include <string.h> |
| #include <stdio.h> |
| #include <stdlib.h> |
| #include <unistd.h> |
| #include <time.h> |
| #include <sys/types.h> |
| #include <sys/time.h> |
| #include <signal.h> |
| |
/*
 * Flag written by the SIGALRM handler and polled by the soak loop.
 * sig_atomic_t is the only object type ISO C guarantees can be safely
 * written from an asynchronous signal handler.
 */
static volatile sig_atomic_t soak_done;
/* Fastest CPU clock seen in /proc/cpuinfo (MHz value scaled by 1000000). */
unsigned long long clock_frequency;
/* Value parsed from the "timebase" line of /proc/cpuinfo; 0 if not found. */
unsigned long long timebase_frequency;
/* clock_frequency / timebase_frequency: scales timebase ticks to CPU cycles. */
double timebase_multiplier;
| |
/*
 * Execute the "mftb" instruction and return the value it places in a
 * general-purpose register.
 */
static inline unsigned long mftb(void)
{
	unsigned long tb;

	__asm__ __volatile__("mftb %0" : "=r" (tb));
	return tb;
}
| |
| static void sigalrm_handler(int unused) |
| { |
| soak_done = 1; |
| } |
| |
| /* |
| * Use a timer instead of busy looping on clock_gettime() so we don't |
| * pollute profiles with glibc and VDSO hits. |
| */ |
| static void cpu_soak_usecs(unsigned long usecs) |
| { |
| struct itimerval val; |
| |
| memset(&val, 0, sizeof(val)); |
| val.it_value.tv_usec = usecs; |
| |
| signal(SIGALRM, sigalrm_handler); |
| setitimer(ITIMER_REAL, &val, NULL); |
| |
| while (1) { |
| if (soak_done) |
| break; |
| } |
| |
| signal(SIGALRM, SIG_DFL); |
| } |
| |
| /* |
| * This only works with recent kernels where cpufreq modifies |
| * /proc/cpuinfo dynamically. |
| */ |
| static void get_proc_frequency(void) |
| { |
| FILE *f; |
| char line[128]; |
| char *p, *end; |
| unsigned long v; |
| double d; |
| char *override; |
| |
| /* Try to get out of low power/low frequency mode */ |
| cpu_soak_usecs(0.25 * 1000000); |
| |
| f = fopen("/proc/cpuinfo", "r"); |
| if (f == NULL) |
| return; |
| |
| timebase_frequency = 0; |
| |
| while (fgets(line, sizeof(line), f) != NULL) { |
| if (strncmp(line, "timebase", 8) == 0) { |
| p = strchr(line, ':'); |
| if (p != NULL) { |
| v = strtoull(p + 1, &end, 0); |
| if (end != p + 1) |
| timebase_frequency = v; |
| } |
| } |
| |
| if (((strncmp(line, "clock", 5) == 0) || |
| (strncmp(line, "cpu MHz", 7) == 0))) { |
| p = strchr(line, ':'); |
| if (p != NULL) { |
| d = strtod(p + 1, &end); |
| if (end != p + 1) { |
| /* Find fastest clock frequency */ |
| if ((d * 1000000ULL) > clock_frequency) |
| clock_frequency = d * 1000000ULL; |
| } |
| } |
| } |
| } |
| |
| fclose(f); |
| |
| override = getenv("FREQUENCY"); |
| if (override) |
| clock_frequency = strtoull(override, NULL, 10); |
| |
| if (timebase_frequency) |
| timebase_multiplier = (double)clock_frequency |
| / timebase_frequency; |
| else |
| timebase_multiplier = 1; |
| } |
| |
/* Call getppid() @nr times in a row, discarding every result. */
static void do_null_syscall(unsigned long nr)
{
	unsigned long remaining = nr;

	while (remaining > 0) {
		getppid();
		remaining--;
	}
}
| |
/* Expands to nothing; defined without a trailing line continuation. */
#define TIME(A, STR)
| int main(void) |
| { |
| unsigned long tb_start, tb_now; |
| struct timespec tv_start, tv_now; |
| unsigned long long elapsed_ns, elapsed_tb; |
| |
| get_proc_frequency(); |
| |
| clock_gettime(CLOCK_MONOTONIC, &tv_start); |
| tb_start = mftb(); |
| |
| do_null_syscall(NR_LOOPS); |
| |
| clock_gettime(CLOCK_MONOTONIC, &tv_now); |
| tb_now = mftb(); |
| |
| elapsed_ns = (tv_now.tv_sec - tv_start.tv_sec) * 1000000000ULL + |
| (tv_now.tv_nsec - tv_start.tv_nsec); |
| elapsed_tb = tb_now - tb_start; |
| |
| printf("%10.2f ns %10.2f cycles\n", (float)elapsed_ns / NR_LOOPS, |
| (float)elapsed_tb * timebase_multiplier / NR_LOOPS); |
| |
| return 0; |
| } |