1 /* 2 * Copyright 2008 Google Inc. All Rights Reserved. 3 * Author: md@google.com (Michael Davidson) 4 * 5 * Based on time-warp-test.c, which is: 6 * Copyright (C) 2005, Ingo Molnar 7 */ 8 #define _GNU_SOURCE 9 10 #include <errno.h> 11 #include <pthread.h> 12 #include <getopt.h> 13 #include <sched.h> 14 #include <signal.h> 15 #include <stdarg.h> 16 #include <stdint.h> 17 #include <inttypes.h> 18 #include <stdio.h> 19 #include <stdlib.h> 20 #include <string.h> 21 #include <sys/time.h> 22 #include <time.h> 23 24 #include "cpuset.h" 25 #include "spinlock.h" 26 #include "threads.h" 27 #include "logging.h" 28 29 30 char *program = ""; 31 long duration = 0; 32 long threshold = 0; 33 int verbose = 0; 34 35 const char optstring[] = "c:d:ht:v"; 36 37 struct option options[] = { 38 { "cpus", required_argument, 0, 'c' }, 39 { "duration", required_argument, 0, 'd' }, 40 { "help", no_argument, 0, 'h' }, 41 { "threshold", required_argument, 0, 't' }, 42 { "verbose", no_argument, 0, 'v' }, 43 { 0, 0, 0, 0 } 44 }; 45 46 47 void usage(void) 48 { 49 printf("usage: %s [-hv] [-c <cpu_set>] [-d duration] [-t threshold] " 50 "tsc|gtod|clock", program); 51 } 52 53 54 const char help_text[] = 55 "check time sources for monotonicity across multiple CPUs\n" 56 " -c,--cpus set of cpus to test (default: all)\n" 57 " -d,--duration test duration in seconds (default: infinite)\n" 58 " -t,--threshold error threshold (default: 0)\n" 59 " -v,--verbose verbose output\n" 60 " tsc test the TSC\n" 61 " gtod test gettimeofday()\n" 62 " clock test CLOCK_MONOTONIC\n"; 63 64 65 void help(void) 66 { 67 usage(); 68 printf("%s", help_text); 69 } 70 71 72 /* 73 * get the TSC as 64 bit value with CPU clock frequency resolution 74 */ 75 #if defined(__x86_64__) 76 static inline uint64_t rdtsc(void) 77 { 78 uint32_t tsc_lo, tsc_hi; 79 __asm__ __volatile__("rdtsc" : "=a" (tsc_lo), "=d" (tsc_hi)); 80 return ((uint64_t)tsc_hi << 32) | tsc_lo; 81 } 82 #elif defined(__i386__) 83 static inline uint64_t rdtsc(void) 84 { 85 uint64_t tsc; 86 __asm__ __volatile__("rdtsc" : "=A" (tsc)); 87 return tsc; 88 } 89 #else 90 #error "rdtsc() not implemented for this architecture" 91 #endif 92 93 94 static inline uint64_t rdtsc_mfence(void) 95 { 96 __asm__ __volatile__("mfence" ::: "memory"); 97 return rdtsc(); 98 } 99 100 101 static inline uint64_t rdtsc_lfence(void) 102 { 103 __asm__ __volatile__("lfence" ::: "memory"); 104 return rdtsc(); 105 } 106 107 108 /* 109 * get result from gettimeofday() as a 64 bit value 110 * with microsecond resolution 111 */ 112 static inline uint64_t rdgtod(void) 113 { 114 struct timeval tv; 115 116 gettimeofday(&tv, NULL); 117 return (uint64_t)tv.tv_sec * 1000000 + tv.tv_usec; 118 } 119 120 121 /* 122 * get result from clock_gettime(CLOCK_MONOTONIC) as a 64 bit value 123 * with nanosecond resolution 124 */ 125 static inline uint64_t rdclock(void) 126 { 127 struct timespec ts; 128 129 clock_gettime(CLOCK_MONOTONIC, &ts); 130 return (uint64_t)ts.tv_sec * 1000000000 + ts.tv_nsec; 131 } 132 133 134 /* 135 * test data 136 */ 137 typedef struct test_info { 138 const char *name; /* test name */ 139 void (*func)(struct test_info *); /* the test */ 140 spinlock_t lock; 141 uint64_t last; /* last time value */ 142 long loops; /* # of test loop iterations */ 143 long warps; /* # of backward time jumps */ 144 int64_t worst; /* worst backward time jump */ 145 uint64_t start; /* test start time */ 146 int done; /* flag to stop test */ 147 } test_info_t; 148 149 150 void show_warps(struct test_info *test) 151 { 152 INFO("new %s-warp maximum: %9"PRId64, test->name, test->worst); 153 } 154 155 156 #define DEFINE_TEST(_name) \ 157 \ 158 void _name##_test(struct test_info *test) \ 159 { \ 160 uint64_t t0, t1; \ 161 int64_t delta; \ 162 \ 163 spin_lock(&test->lock); \ 164 t1 = rd##_name(); \ 165 t0 = test->last; \ 166 test->last = rd##_name(); \ 167 test->loops++; \ 168 spin_unlock(&test->lock); \ 169 \ 170 delta = t1 - t0; \ 171 if (delta < 0 && delta < -threshold) { \ 172 spin_lock(&test->lock); \ 173 ++test->warps; \ 174 if (delta < test->worst) { \ 175 test->worst = delta; \ 176 show_warps(test); \ 177 } \ 178 spin_unlock(&test->lock); \ 179 } \ 180 if (!((unsigned long)t0 & 31)) \ 181 asm volatile ("rep; nop"); \ 182 } \ 183 \ 184 struct test_info _name##_test_info = { \ 185 .name = #_name, \ 186 .func = _name##_test, \ 187 } 188 189 DEFINE_TEST(tsc); 190 DEFINE_TEST(tsc_lfence); 191 DEFINE_TEST(tsc_mfence); 192 DEFINE_TEST(gtod); 193 DEFINE_TEST(clock); 194 195 struct test_info *tests[] = { 196 &tsc_test_info, 197 &tsc_lfence_test_info, 198 &tsc_mfence_test_info, 199 >od_test_info, 200 &clock_test_info, 201 NULL 202 }; 203 204 205 void show_progress(struct test_info *test) 206 { 207 static int count; 208 const char progress[] = "\\|/-"; 209 uint64_t elapsed = rdgtod() - test->start; 210 211 printf(" | %.2f us, %s-warps:%ld %c\r", 212 (double)elapsed/(double)test->loops, 213 test->name, 214 test->warps, 215 progress[++count & 3]); 216 fflush(stdout); 217 } 218 219 220 void *test_loop(void *arg) 221 { 222 struct test_info *test = arg; 223 224 while (! test->done) 225 (*test->func)(test); 226 227 return NULL; 228 } 229 230 231 int run_test(cpu_set_t *cpus, long duration, struct test_info *test) 232 { 233 int errs; 234 int ncpus; 235 int nthreads; 236 struct timespec ts = { .tv_sec = 0, .tv_nsec = 200000000 }; 237 struct timespec *timeout = (verbose || duration) ? &ts : NULL; 238 sigset_t signals; 239 240 /* 241 * Make sure that SIG_INT is blocked so we can 242 * wait for it in the main test loop below. 243 */ 244 sigemptyset(&signals); 245 sigaddset(&signals, SIGINT); 246 sigprocmask(SIG_BLOCK, &signals, NULL); 247 248 /* 249 * test start time 250 */ 251 test->start = rdgtod(); 252 253 /* 254 * create the threads 255 */ 256 ncpus = count_cpus(cpus); 257 nthreads = create_per_cpu_threads(cpus, test_loop, test); 258 if (nthreads != ncpus) { 259 ERROR(0, "failed to create threads: expected %d, got %d", 260 ncpus, nthreads); 261 if (nthreads) { 262 test->done = 1; 263 join_threads(); 264 } 265 return 1; 266 } 267 268 if (duration) { 269 INFO("running %s test on %d cpus for %ld seconds", 270 test->name, ncpus, duration); 271 } else { 272 INFO("running %s test on %d cpus", test->name, ncpus); 273 } 274 275 /* 276 * wait for a signal 277 */ 278 while (sigtimedwait(&signals, NULL, timeout) < 0) { 279 if (duration && rdgtod() > test->start + duration * 1000000) 280 break; 281 282 if (verbose) 283 show_progress(test); 284 } 285 286 /* 287 * tell the test threads that we are done and wait for them to exit 288 */ 289 test->done = 1; 290 291 join_threads(); 292 293 errs = (test->warps != 0); 294 295 if (!errs) 296 printf("PASS:\n"); 297 else 298 printf("FAIL: %s-worst-warp=%"PRId64"\n", 299 test->name, test->worst); 300 301 return errs; 302 } 303 304 305 int 306 main(int argc, char *argv[]) 307 { 308 int c; 309 cpu_set_t cpus; 310 int errs; 311 int i; 312 test_info_t *test; 313 const char *testname; 314 extern int opterr; 315 extern int optind; 316 extern char *optarg; 317 318 if ((program = strrchr(argv[0], '/')) != NULL) 319 ++program; 320 else 321 program = argv[0]; 322 set_program_name(program); 323 324 /* 325 * default to checking all cpus 326 */ 327 for (c = 0; c < CPU_SETSIZE; c++) { 328 CPU_SET(c, &cpus); 329 } 330 331 opterr = 0; 332 errs = 0; 333 while ((c = getopt_long(argc, argv, optstring, options, NULL)) != EOF) { 334 switch (c) { 335 case 'c': 336 if (parse_cpu_set(optarg, &cpus) != 0) 337 ++errs; 338 break; 339 case 'd': 340 duration = strtol(optarg, NULL, 0); 341 break; 342 case 'h': 343 help(); 344 exit(0); 345 case 't': 346 threshold = strtol(optarg, NULL, 0); 347 break; 348 case 'v': 349 ++verbose; 350 break; 351 default: 352 ERROR(0, "unknown option '%c'", c); 353 ++errs; 354 break; 355 } 356 } 357 358 if (errs || optind != argc-1) { 359 usage(); 360 exit(1); 361 } 362 363 testname = argv[optind]; 364 for (i = 0; (test = tests[i]) != NULL; i++) { 365 if (strcmp(testname, test->name) == 0) 366 break; 367 } 368 369 if (!test) { 370 ERROR(0, "unknown test '%s'\n", testname); 371 usage(); 372 exit(1); 373 } 374 375 /* 376 * limit the set of CPUs to the ones that are currently available 377 * (Note that on some kernel versions sched_setaffinity() will fail 378 * if you specify CPUs that are not currently online so we ignore 379 * the return value and hope for the best) 380 */ 381 sched_setaffinity(0, sizeof cpus, &cpus); 382 if (sched_getaffinity(0, sizeof cpus, &cpus) < 0) { 383 ERROR(errno, "sched_getaffinity() failed"); 384 exit(1); 385 } 386 387 return run_test(&cpus, duration, test); 388 } 389