mirror of
https://mirrors.bfsu.edu.cn/git/linux.git
synced 2025-01-09 15:24:32 +08:00
a1ea0ca8a6
gettid() is 10% lighter than getppid(), use it for null_syscall selftest. Signed-off-by: Christophe Leroy <christophe.leroy@csgroup.eu> Signed-off-by: Michael Ellerman <mpe@ellerman.id.au> Link: https://lore.kernel.org/r/0ad62673d3e063f848e7c99d719bb966efd433e8.1622809833.git.christophe.leroy@csgroup.eu
155 lines
2.9 KiB
C
155 lines
2.9 KiB
C
// SPDX-License-Identifier: GPL-2.0-or-later
|
|
/*
 * Test null syscall performance
 *
 * Copyright (C) 2009-2015 Anton Blanchard, IBM
 */
|
|
|
|
#define NR_LOOPS 10000000
|
|
|
|
#include <string.h>
|
|
#include <stdio.h>
|
|
#include <stdlib.h>
|
|
#include <unistd.h>
|
|
#include <time.h>
|
|
#include <sys/types.h>
|
|
#include <sys/time.h>
|
|
#include <sys/syscall.h>
|
|
#include <signal.h>
|
|
|
|
/*
 * Set to 1 by the SIGALRM handler to end the busy-wait soak loop.
 * sig_atomic_t is the only object type the C standard guarantees can be
 * written safely from an asynchronous signal handler.
 */
static volatile sig_atomic_t soak_done;

/* Highest CPU clock found in /proc/cpuinfo (or $FREQUENCY), in Hz. */
unsigned long long clock_frequency;

/* Value of the "timebase" line in /proc/cpuinfo; 0 when not found. */
unsigned long long timebase_frequency;

/* clock_frequency / timebase_frequency: scales timebase ticks to cycles. */
double timebase_multiplier;
|
|
|
|
static inline unsigned long mftb(void)
|
|
{
|
|
unsigned long low;
|
|
|
|
asm volatile("mftb %0" : "=r" (low));
|
|
|
|
return low;
|
|
}
|
|
|
|
static void sigalrm_handler(int unused)
|
|
{
|
|
soak_done = 1;
|
|
}
|
|
|
|
/*
|
|
* Use a timer instead of busy looping on clock_gettime() so we don't
|
|
* pollute profiles with glibc and VDSO hits.
|
|
*/
|
|
static void cpu_soak_usecs(unsigned long usecs)
|
|
{
|
|
struct itimerval val;
|
|
|
|
memset(&val, 0, sizeof(val));
|
|
val.it_value.tv_usec = usecs;
|
|
|
|
signal(SIGALRM, sigalrm_handler);
|
|
setitimer(ITIMER_REAL, &val, NULL);
|
|
|
|
while (1) {
|
|
if (soak_done)
|
|
break;
|
|
}
|
|
|
|
signal(SIGALRM, SIG_DFL);
|
|
}
|
|
|
|
/*
|
|
* This only works with recent kernels where cpufreq modifies
|
|
* /proc/cpuinfo dynamically.
|
|
*/
|
|
static void get_proc_frequency(void)
|
|
{
|
|
FILE *f;
|
|
char line[128];
|
|
char *p, *end;
|
|
unsigned long v;
|
|
double d;
|
|
char *override;
|
|
|
|
/* Try to get out of low power/low frequency mode */
|
|
cpu_soak_usecs(0.25 * 1000000);
|
|
|
|
f = fopen("/proc/cpuinfo", "r");
|
|
if (f == NULL)
|
|
return;
|
|
|
|
timebase_frequency = 0;
|
|
|
|
while (fgets(line, sizeof(line), f) != NULL) {
|
|
if (strncmp(line, "timebase", 8) == 0) {
|
|
p = strchr(line, ':');
|
|
if (p != NULL) {
|
|
v = strtoull(p + 1, &end, 0);
|
|
if (end != p + 1)
|
|
timebase_frequency = v;
|
|
}
|
|
}
|
|
|
|
if (((strncmp(line, "clock", 5) == 0) ||
|
|
(strncmp(line, "cpu MHz", 7) == 0))) {
|
|
p = strchr(line, ':');
|
|
if (p != NULL) {
|
|
d = strtod(p + 1, &end);
|
|
if (end != p + 1) {
|
|
/* Find fastest clock frequency */
|
|
if ((d * 1000000ULL) > clock_frequency)
|
|
clock_frequency = d * 1000000ULL;
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
fclose(f);
|
|
|
|
override = getenv("FREQUENCY");
|
|
if (override)
|
|
clock_frequency = strtoull(override, NULL, 10);
|
|
|
|
if (timebase_frequency)
|
|
timebase_multiplier = (double)clock_frequency
|
|
/ timebase_frequency;
|
|
else
|
|
timebase_multiplier = 1;
|
|
}
|
|
|
|
/*
 * Issue @nr back-to-back gettid system calls through syscall(), so each
 * iteration is a real kernel entry. The return values are discarded.
 */
static void do_null_syscall(unsigned long nr)
{
	unsigned long i;

	for (i = 0; i < nr; i++)
		syscall(__NR_gettid);
}
|
|
|
|
/*
 * Expands to nothing and is not referenced in this file. The trailing
 * line-continuation backslash was dropped so the macro can no longer
 * swallow whatever line happens to follow it.
 */
#define TIME(A, STR)
|
|
|
|
int main(void)
|
|
{
|
|
unsigned long tb_start, tb_now;
|
|
struct timespec tv_start, tv_now;
|
|
unsigned long long elapsed_ns, elapsed_tb;
|
|
|
|
get_proc_frequency();
|
|
|
|
clock_gettime(CLOCK_MONOTONIC, &tv_start);
|
|
tb_start = mftb();
|
|
|
|
do_null_syscall(NR_LOOPS);
|
|
|
|
clock_gettime(CLOCK_MONOTONIC, &tv_now);
|
|
tb_now = mftb();
|
|
|
|
elapsed_ns = (tv_now.tv_sec - tv_start.tv_sec) * 1000000000ULL +
|
|
(tv_now.tv_nsec - tv_start.tv_nsec);
|
|
elapsed_tb = tb_now - tb_start;
|
|
|
|
printf("%10.2f ns %10.2f cycles\n", (float)elapsed_ns / NR_LOOPS,
|
|
(float)elapsed_tb * timebase_multiplier / NR_LOOPS);
|
|
|
|
return 0;
|
|
}
|