From: Stelian Pop Date: Thu, 18 Jun 2009 09:50:54 +0000 (+0000) Subject: Use sys_clone under Linux to share I/O contexts between dump processes. X-Git-Tag: release_0_4b42~2 X-Git-Url: https://git.wh0rd.org/?p=dump.git;a=commitdiff_plain;h=b8db960b14856a2ab86e044b2ffa53612d2aa489 Use sys_clone under Linux to share I/O contexts between dump processes. --- diff --git a/CHANGES b/CHANGES index 4b117b2..b0d3831 100644 --- a/CHANGES +++ b/CHANGES @@ -1,4 +1,4 @@ -$Id: CHANGES,v 1.299 2009/06/18 09:42:11 stelian Exp $ +$Id: CHANGES,v 1.300 2009/06/18 09:50:54 stelian Exp $ Changes between versions 0.4b41 and 0.4b42 (released xxxxxxxxxxxxxxx) ===================================================================== @@ -70,6 +70,12 @@ Changes between versions 0.4b41 and 0.4b42 (released xxxxxxxxxxxxxxx) that -P and -A were both allowed in the same invocation (RedHat bug #490627). Thanks to Adam Tkac for the patch. +17. Use sys_clone under Linux to share I/O contexts between dump + processes, thus drastically increasing the performance of dump + under CFQ (which is the default I/O scheduler used in a number of + distributions). Thanks to Jeff Moyer for the + patch. + Changes between versions 0.4b40 and 0.4b41 (released January 2, 2006) ===================================================================== diff --git a/dump/tape.c b/dump/tape.c index 3e41622..edcf5d6 100644 --- a/dump/tape.c +++ b/dump/tape.c @@ -37,7 +37,7 @@ #ifndef lint static const char rcsid[] = - "$Id: tape.c,v 1.90 2008/06/04 19:27:48 stelian Exp $"; + "$Id: tape.c,v 1.91 2009/06/18 09:50:54 stelian Exp $"; #endif /* not lint */ #include @@ -187,6 +187,41 @@ static sigjmp_buf jmpbuf; /* where to jump to if we are ready when the */ static int gtperr = 0; #endif +/* + * Determine if we can use Linux' clone system call. If so, call it + * with the CLONE_IO flag so that all processes will share the same I/O + * context, allowing the I/O schedulers to make better scheduling decisions. 
+ */ +#ifdef __linux__ +/* first, pull in the header files that define sys_clone and CLONE_IO */ +#include <syscall.h> +#define _GNU_SOURCE +#include <sched.h> +#include <unistd.h> +#undef _GNU_SOURCE + +/* If either is not present, fall back on the fork behaviour */ +#if ! defined(SYS_clone) || ! defined (CLONE_IO) +#define fork_clone_io fork +#else /* SYS_clone */ +/* CLONE_IO is available, determine which version of sys_clone to use */ +#include <linux/version.h> +/* + * Kernel 2.5.49 introduced two extra parameters to the clone system call. + * Neither is useful in our case, so this is easy to handle. + */ +#if LINUX_VERSION_CODE >= KERNEL_VERSION(2,5,49) +/* clone_flags, child_stack, parent_tidptr, child_tidptr */ +#define CLONE_ARGS SIGCHLD|CLONE_IO, 0, NULL, NULL +#else +#define CLONE_ARGS SIGCHLD|CLONE_IO, 0 +#endif /* LINUX_VERSION_CODE */ +pid_t fork_clone_io(void); +#endif /* SYS_clone */ +#else /* __linux__ not defined */ +#define fork_clone_io fork +#endif /* __linux__ */ + int alloctape(void) { @@ -755,6 +790,16 @@ rollforward(void) #endif } +#ifdef __linux__ +#if defined(SYS_clone) && defined(CLONE_IO) +pid_t +fork_clone_io(void) +{ + return syscall(SYS_clone, CLONE_ARGS); +} +#endif +#endif + /* * We implement taking and restoring checkpoints on the tape level. * When each tape is opened, a new process is created by forking; this @@ -801,7 +846,7 @@ restore_check_point: /* * All signals are inherited... */ - childpid = fork(); + childpid = fork_clone_io(); if (childpid < 0) { msg("Context save fork fails in parent %d\n", parentpid); Exit(X_ABORT); @@ -1017,7 +1062,7 @@ enslave(void) } if (socketpair(AF_UNIX, SOCK_STREAM, 0, cmd) < 0 || - (slaves[i].pid = fork()) < 0) + (slaves[i].pid = fork_clone_io()) < 0) quit("too many slaves, %d (recompile smaller): %s\n", i, strerror(errno));