1 /*
2 * Copyright (c) 2004, Bull S.A.. All rights reserved.
3 * Created by: Sebastien Decugis
4
5 * This program is free software; you can redistribute it and/or modify it
6 * under the terms of version 2 of the GNU General Public License as
7 * published by the Free Software Foundation.
8 *
9 * This program is distributed in the hope that it would be useful, but
10 * WITHOUT ANY WARRANTY; without even the implied warranty of
11 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
12 *
13 * You should have received a copy of the GNU General Public License along
14 * with this program; if not, write the Free Software Foundation, Inc.,
15 * 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA.
16
17 * This scalability sample aims to test the following assertion:
18 * -> The fork() duration does not depend on the # of processes in the system
19
20 * The steps are:
21 * -> Create processes until failure
22 * -> wait for each created process starting before creating the next one.
23 * -> processes are destroyed once we have reached the max processes in the system.
24
25 * The test fails if the fork duration tends to grow with the # of processes.
26 */
27
28 /********************************************************************************************/
29 /****************************** standard includes *****************************************/
30 /********************************************************************************************/
31 #include <pthread.h>
32 #include <stdarg.h>
33 #include <stdio.h>
34 #include <stdlib.h>
35 #include <string.h>
36 #include <unistd.h>
37
38 #include <sys/wait.h>
39 #include <errno.h>
40
41 #include <time.h>
42 #include <semaphore.h>
43 #include <fcntl.h>
44 #include <math.h>
45
46 /********************************************************************************************/
47 /****************************** Test framework *****************************************/
48 /********************************************************************************************/
49 #include "testfrmw.h"
50 #include "testfrmw.c"
51 /* This header is responsible for defining the following macros:
52 * UNRESOLVED(ret, descr);
53 * where descr is a description of the error and ret is an int (error code for example)
54 * FAILED(descr);
55 * where descr is a short text saying why the test has failed.
56 * PASSED();
57 * No parameter.
58 *
59 * Both three macros shall terminate the calling process.
60 * The testcase shall not terminate in any other maneer.
61 *
62 * The other file defines the functions
63 * void output_init()
64 * void output(char * string, ...)
65 *
66 * Those may be used to output information.
67 */
68
69 /********************************************************************************************/
70 /********************************** Configuration ******************************************/
71 /********************************************************************************************/
72 #ifndef SCALABILITY_FACTOR
73 #define SCALABILITY_FACTOR 1
74 #endif
75 #ifndef VERBOSE
76 #define VERBOSE 1
77 #endif
78
79 #define RESOLUTION (5 * SCALABILITY_FACTOR)
80
81 #ifdef PLOT_OUTPUT
82 #undef VERBOSE
83 #define VERBOSE 0
84 #endif
85
86 /********************************************************************************************/
87 /*********************************** Test *****************************************/
88 /********************************************************************************************/
89
90 /* The next structure is used to save the tests measures */
91
92 typedef struct __mes_t {
93 int nprocess;
94 long _data; /* As we store µsec values, a long type should be enough. */
95
96 struct __mes_t *next;
97 } mes_t;
98
99 /* Forward declaration */
100 int parse_measure(mes_t * measures);
101
102 sem_t *sem_synchro;
103 sem_t *sem_ending;
104
main(int argc,char * argv[])105 int main(int argc, char *argv[])
106 {
107 int ret, status;
108 pid_t pidctl;
109 pid_t *pr;
110
111 int nprocesses, i;
112
113 struct timespec ts_ref, ts_fin;
114
115 mes_t sentinel;
116 mes_t *m_cur, *m_tmp;
117
118 long CHILD_MAX = sysconf(_SC_CHILD_MAX);
119 long my_max = 1000 * SCALABILITY_FACTOR;
120
121 /* Initialize the measure list */
122 m_cur = &sentinel;
123 m_cur->next = NULL;
124
125 /* Initialize output routine */
126 output_init();
127
128 if (CHILD_MAX > 0)
129 my_max = CHILD_MAX;
130
131 pr = (pid_t *) calloc(1 + my_max, sizeof(pid_t));
132
133 if (pr == NULL) {
134 UNRESOLVED(errno, "Not enough memory for process IDs storage");
135 }
136 #if VERBOSE > 1
137 output("CHILD_MAX: %d\n", CHILD_MAX);
138
139 #endif
140
141 #ifdef PLOT_OUTPUT
142 output("# COLUMNS 2 #Process Duration\n");
143
144 #endif
145
146 /* Initilaize the semaphores */
147 sem_synchro = sem_open("/fork_scal_sync", O_CREAT, O_RDWR, 0);
148
149 if (sem_synchro == SEM_FAILED) {
150 UNRESOLVED(errno, "Failed to open a named semaphore\n");
151 }
152
153 sem_unlink("/fork_scal_sync");
154
155 sem_ending = sem_open("/fork_scal_end", O_CREAT, O_RDWR, 0);
156
157 if (sem_ending == SEM_FAILED) {
158 UNRESOLVED(errno, "Failed to open a named semaphore\n");
159 }
160
161 sem_unlink("/fork_scal_end");
162
163 nprocesses = 0;
164 m_cur = &sentinel;
165
166 while (1) { /* we will break */
167 /* read clock */
168 ret = clock_gettime(CLOCK_REALTIME, &ts_ref);
169
170 if (ret != 0) {
171 UNRESOLVED(errno, "Unable to read clock");
172 }
173
174 /* create a new child */
175 pr[nprocesses] = fork();
176
177 if (pr[nprocesses] == -1) {
178 if (errno == EAGAIN || errno == ENOMEM)
179 break;
180
181 FAILED
182 ("Failed to fork and received an unexpected error");
183 /* Post the semaphore so running processes will terminate */
184
185 do {
186 ret = sem_post(sem_ending);
187 } while (ret != 0 && errno == EINTR);
188
189 if (ret != 0)
190 output
191 ("Failed to post the semaphore on termination: error %d\n",
192 errno);
193
194 }
195
196 if (pr[nprocesses] == 0) {
197 /* Child */
198 /* Post the synchro semaphore */
199
200 do {
201 ret = sem_post(sem_synchro);
202 } while ((ret != 0) && (errno == EINTR));
203
204 if (ret != 0) {
205 /* In this case the test will hang... */
206 UNRESOLVED(errno,
207 "Failed post the sync semaphore");
208 }
209
210 /* Wait the end semaphore */
211 do {
212 ret = sem_wait(sem_ending);
213 } while ((ret != 0) && (errno == EINTR));
214
215 if (ret != 0) {
216 UNRESOLVED(errno,
217 "Failed wait for the end semaphore");
218 }
219
220 /* Cascade-post the end semaphore */
221 do {
222 ret = sem_post(sem_ending);
223 } while ((ret != 0) && (errno == EINTR));
224
225 if (ret != 0) {
226 UNRESOLVED(errno,
227 "Failed post the end semaphore");
228 }
229
230 /* Exit */
231 exit(PTS_PASS);
232 }
233
234 /* Parent */
235 nprocesses++;
236
237 /* FAILED if nprocesses > CHILD_MAX */
238 if (nprocesses > my_max) {
239 errno = 0;
240
241 if (CHILD_MAX > 0) {
242 #if VERBOSE > 0
243 output
244 ("WARNING! We were able to create more than CHILD_MAX processes\n");
245 #endif
246
247 }
248
249 break;
250 }
251
252 /* wait for the semaphore */
253 do {
254 ret = sem_wait(sem_synchro);
255 } while ((ret == -1) && (errno == EINTR));
256
257 if (ret == -1) {
258 sem_post(sem_ending);
259 UNRESOLVED(errno,
260 "Failed to wait for the sync semaphore");
261 }
262
263 /* read clock */
264 ret = clock_gettime(CLOCK_REALTIME, &ts_fin);
265
266 if (ret != 0) {
267 UNRESOLVED(errno, "Unable to read clock");
268 }
269
270 /* add to the measure list if nprocesses % resolution == 0 */
271 if (((nprocesses % RESOLUTION) == 0) && (nprocesses != 0)) {
272 /* Create an empty new element */
273 m_tmp = malloc(sizeof(mes_t));
274
275 if (m_tmp == NULL) {
276 sem_post(sem_ending);
277 UNRESOLVED(errno,
278 "Unable to alloc memory for measure saving");
279 }
280
281 m_tmp->nprocess = nprocesses;
282 m_tmp->next = NULL;
283 m_tmp->_data = 0;
284 m_cur->next = m_tmp;
285
286 m_cur = m_cur->next;
287
288 m_cur->_data =
289 ((ts_fin.tv_sec - ts_ref.tv_sec) * 1000000) +
290 ((ts_fin.tv_nsec - ts_ref.tv_nsec) / 1000);
291
292 #if VERBOSE > 5
293 output("Added the following measure: n=%i, v=%li\n",
294 nprocesses, m_cur->_data);
295 #endif
296
297 }
298
299 }
300 #if VERBOSE > 3
301
302 if (errno)
303 output
304 ("Could not create anymore processes. Current count is %i\n",
305 nprocesses);
306 else
307 output
308 ("Should not create anymore processes. Current count is %i\n",
309 nprocesses);
310
311 #endif
312
313 /* Unblock every created children: post once, then cascade signaling */
314
315 do {
316 ret = sem_post(sem_ending);
317 }
318 while ((ret != 0) && (errno == EINTR));
319
320 if (ret != 0) {
321 UNRESOLVED(errno, "Failed post the end semaphore");
322 }
323 #if VERBOSE > 3
324 output("Waiting children termination\n");
325
326 #endif
327
328 for (i = 0; i < nprocesses; i++) {
329 pidctl = waitpid(pr[i], &status, 0);
330
331 if (pidctl != pr[i]) {
332 UNRESOLVED(errno, "Waitpid returned the wrong PID");
333 }
334
335 if ((!WIFEXITED(status)) || (WEXITSTATUS(status) != PTS_PASS)) {
336 FAILED("Child exited abnormally");
337 }
338
339 }
340
341 /* Free some memory before result parsing */
342 free(pr);
343
344 /* Compute the results */
345 ret = parse_measure(&sentinel);
346
347 /* Free the resources and output the results */
348
349 #if VERBOSE > 5
350 output("Dump : \n");
351
352 output(" nproc | dur \n");
353
354 #endif
355 while (sentinel.next != NULL) {
356 m_cur = sentinel.next;
357 #if (VERBOSE > 5) || defined(PLOT_OUTPUT)
358 output("%8.8i %1.1li.%6.6li\n", m_cur->nprocess,
359 m_cur->_data / 1000000, m_cur->_data % 1000000);
360
361 #endif
362 sentinel.next = m_cur->next;
363
364 free(m_cur);
365 }
366
367 if (ret != 0) {
368 FAILED
369 ("The function is not scalable, add verbosity for more information");
370 }
371 #if VERBOSE > 0
372 output("-----\n");
373
374 output("All test data destroyed\n");
375
376 output("Test PASSED\n");
377
378 #endif
379
380 PASSED;
381 }
382
383 /***
384 * The next function will seek for the better model for each series of measurements.
385 *
386 * The tested models are: -- X = # threads; Y = latency
387 * -> Y = a; -- Error is r1 = avg((Y - Yavg)²);
388 * -> Y = aX + b; -- Error is r2 = avg((Y -aX -b)²);
389 * -- where a = avg ((X - Xavg)(Y - Yavg)) / avg((X - Xavg)²)
390 * -- Note: We will call _q = sum((X - Xavg) * (Y - Yavg));
391 * -- and _d = sum((X - Xavg)²);
392 * -- and b = Yavg - a * Xavg
393 * -> Y = c * X^a;-- Same as previous, but with log(Y) = a log(X) + b; and b = log(c). Error is r3
394 * -> Y = exp(aX + b); -- log(Y) = aX + b. Error is r4
395 *
396 * We compute each error factor (r1, r2, r3, r4) then search which is the smallest (with ponderation).
397 * The function returns 0 when r1 is the best for all cases (latency is constant) and !0 otherwise.
398 */
399
400 struct row {
401 long X; /* the X values -- copied from function argument */
402 long Y; /* the Y values -- copied from function argument */
403 long _x; /* Value X - Xavg */
404 long _y; /* Value Y - Yavg */
405 double LnX; /* Natural logarithm of X values */
406 double LnY; /* Natural logarithm of Y values */
407 double _lnx; /* Value LnX - LnXavg */
408 double _lny; /* Value LnY - LnYavg */
409 };
410
parse_measure(mes_t * measures)411 int parse_measure(mes_t * measures)
412 {
413 int ret, r;
414
415 mes_t *cur;
416
417 double Xavg, Yavg;
418 double LnXavg, LnYavg;
419
420 int N;
421
422 double r1, r2, r3, r4;
423
424 /* Some more intermediate vars */
425 long double _q[3];
426 long double _d[3];
427
428 long double t; /* temp value */
429
430 struct row *Table = NULL;
431
432 /* This array contains the last element of each serie */
433 int array_max;
434
435 /* Initialize the datas */
436
437 array_max = -1; /* means no data */
438 Xavg = 0.0;
439 LnXavg = 0.0;
440 Yavg = 0.0;
441 LnYavg = 0.0;
442 r1 = 0.0;
443 r2 = 0.0;
444 r3 = 0.0;
445 r4 = 0.0;
446 _q[0] = 0.0;
447 _q[1] = 0.0;
448 _q[2] = 0.0;
449 _d[0] = 0.0;
450 _d[1] = 0.0;
451 _d[2] = 0.0;
452
453 N = 0;
454 cur = measures;
455
456 #if VERBOSE > 1
457 output("Data analysis starting\n");
458 #endif
459
460 /* We start with reading the list to find:
461 * -> number of elements, to assign an array.
462 * -> average values
463 */
464
465 while (cur->next != NULL) {
466 cur = cur->next;
467
468 N++;
469
470 if (cur->_data != 0) {
471 array_max = N;
472 Xavg += (double)cur->nprocess;
473 LnXavg += log((double)cur->nprocess);
474 Yavg += (double)cur->_data;
475 LnYavg += log((double)cur->_data);
476 }
477 }
478
479 /* We have the sum; we can divide to obtain the average values */
480 if (array_max != -1) {
481 Xavg /= array_max;
482 LnXavg /= array_max;
483 Yavg /= array_max;
484 LnYavg /= array_max;
485 }
486 #if VERBOSE > 1
487 output(" Found %d rows\n", N);
488
489 #endif
490
491 /* We will now alloc the array ... */
492
493 Table = calloc(N, sizeof(struct row));
494
495 if (Table == NULL) {
496 UNRESOLVED(errno, "Unable to alloc space for results parsing");
497 }
498
499 /* ... and fill it */
500 N = 0;
501
502 cur = measures;
503
504 while (cur->next != NULL) {
505 cur = cur->next;
506
507 Table[N].X = (long)cur->nprocess;
508 Table[N].LnX = log((double)cur->nprocess);
509
510 if (array_max > N) {
511 Table[N]._x = Table[N].X - Xavg;
512 Table[N]._lnx = Table[N].LnX - LnXavg;
513 Table[N].Y = cur->_data;
514 Table[N]._y = Table[N].Y - Yavg;
515 Table[N].LnY = log((double)cur->_data);
516 Table[N]._lny = Table[N].LnY - LnYavg;
517 }
518
519 N++;
520 }
521
522 /* We won't need the list anymore -- we'll work with the array which should be faster. */
523 #if VERBOSE > 1
524 output(" Data was stored in an array.\n");
525
526 #endif
527
528 /* We need to read the full array at least twice to compute all the error factors */
529
530 /* In the first pass, we'll compute:
531 * -> r1 for each scenar.
532 * -> "a" factor for linear (0), power (1) and exponential (2) approximations -- with using the _d and _q vars.
533 */
534 #if VERBOSE > 1
535 output("Starting first pass...\n");
536
537 #endif
538 for (r = 0; r < array_max; r++) {
539 r1 += ((double)Table[r]._y / array_max) * (double)Table[r]._y;
540
541 _q[0] += Table[r]._y * Table[r]._x;
542 _d[0] += Table[r]._x * Table[r]._x;
543
544 _q[1] += Table[r]._lny * Table[r]._lnx;
545 _d[1] += Table[r]._lnx * Table[r]._lnx;
546
547 _q[2] += Table[r]._lny * Table[r]._x;
548 _d[2] += Table[r]._x * Table[r]._x;
549 }
550
551 /* First pass is terminated; a2 = _q[0]/_d[0]; a3 = _q[1]/_d[1]; a4 = _q[2]/_d[2] */
552
553 /* In the first pass, we'll compute:
554 * -> r2, r3, r4 for each scenar.
555 */
556
557 #if VERBOSE > 1
558 output("Starting second pass...\n");
559
560 #endif
561 for (r = 0; r < array_max; r++) {
562 /* r2 = avg((y - ax -b)²); t = (y - ax - b) = (y - yavg) - a (x - xavg); */
563 t = (Table[r]._y - ((_q[0] * Table[r]._x) / _d[0]));
564 r2 += t * t / array_max;
565
566 /* r3 = avg((y - c.x^a) ²);
567 t = y - c * x ^ a
568 = y - log (LnYavg - (_q[1]/_d[1]) * LnXavg) * x ^ (_q[1]/_d[1])
569 */
570 t = (Table[r].Y - (logl(LnYavg - (_q[1] / _d[1]) * LnXavg)
571 * powl(Table[r].X, (_q[1] / _d[1]))
572 ));
573 r3 += t * t / array_max;
574
575 /* r4 = avg((y - exp(ax+b))²);
576 t = y - exp(ax+b)
577 = y - exp(_q[2]/_d[2] * x + (LnYavg - (_q[2]/_d[2] * Xavg)));
578 = y - exp(_q[2]/_d[2] * (x - Xavg) + LnYavg);
579 */
580 t = (Table[r].Y - expl((_q[2] / _d[2]) * Table[r]._x + LnYavg));
581 r4 += t * t / array_max;
582
583 }
584
585 #if VERBOSE > 1
586 output("All computing terminated.\n");
587
588 #endif
589 ret = 0;
590
591 #if VERBOSE > 1
592 output(" # of data: %i\n", array_max);
593
594 output(" Model: Y = k\n");
595
596 output(" k = %g\n", Yavg);
597
598 output(" Divergence %g\n", r1);
599
600 output(" Model: Y = a * X + b\n");
601
602 output(" a = %Lg\n", _q[0] / _d[0]);
603
604 output(" b = %Lg\n", Yavg - ((_q[0] / _d[0]) * Xavg));
605
606 output(" Divergence %g\n", r2);
607
608 output(" Model: Y = c * X ^ a\n");
609
610 output(" a = %Lg\n", _q[1] / _d[1]);
611
612 output(" c = %Lg\n", logl(LnYavg - (_q[1] / _d[1]) * LnXavg));
613
614 output(" Divergence %g\n", r2);
615
616 output(" Model: Y = exp(a * X + b)\n");
617
618 output(" a = %Lg\n", _q[2] / _d[2]);
619
620 output(" b = %Lg\n", LnYavg - ((_q[2] / _d[2]) * Xavg));
621
622 output(" Divergence %g\n", r2);
623
624 #endif
625
626 if (array_max != -1) {
627 /* Compare r1 to other values, with some ponderations */
628
629 if ((r1 > 1.1 * r2) || (r1 > 1.2 * r3) || (r1 > 1.3 * r4))
630 ret++;
631
632 #if VERBOSE > 1
633 else
634 output(" Sanction: OK\n");
635
636 #endif
637
638 }
639
640 /* We need to free the array */
641 free(Table);
642
643 /* We're done */
644 return ret;
645 }
646