9ff72da471
This patch implements a new posix_spawn{p} implementation for Linux. The main difference is it uses the clone syscall directly with CLONE_VM and CLONE_VFORK flags and a direct allocated stack. The new stack and start function solves most the vfork limitation (possible parent clobber due stack spilling). The remaning issue are related to signal handling: 1. That no signal handlers must run in child context, to avoid corrupt parent's state. 2. Child must synchronize with parent to enforce stack deallocation and to possible return execv issues. The first one is solved by blocking all signals in child, even NPTL-internal ones (SIGCANCEL and SIGSETXID). The second issue is done by a stack allocation in parent and a synchronization with using a pipe or waitpid (in case or error). The pipe has the advantage of allowing the child signal an exec error (checked with new tst-spawn2 test). There is an inherent race condition in pipe2 usage for architectures that do not support the syscall directly. In such cases the a pipe plus fctnl is used instead and it may lead to file descriptor leak in parent (as decribed by fcntl documentation). The child process stack is allocate with a mmap with MAP_STACK flag using default architecture stack size. Although it is slower than use a stack buffer from parent, it allows some slack for the compatibility code to run scripts with no shebang (which may use a buffer with size depending of argument list count). Performance should be similar to the vfork default posix implementation and way faster than fork path (vfork on mostly linux ports are basically clone with CLONE_VM plus CLONE_VFORK). The only difference is the syscalls required for the stack allocation/deallocation. It fixes BZ#10354, BZ#14750, and BZ#18433. Tested on i386, x86_64, powerpc64le, and aarch64. [BZ #14750] [BZ #10354] [BZ #18433] * include/sched.h (__clone): Add hidden prototype. (__clone2): Likewise. * include/unistd.h (__dup): Likewise. * posix/Makefile (tests): Add tst-spawn2. * posix/tst-spawn2.c: New file. * sysdeps/posix/dup.c (__dup): Add hidden definition. * sysdeps/unix/sysv/linux/aarch64/clone.S (__clone): Likewise. * sysdeps/unix/sysv/linux/alpha/clone.S (__clone): Likewise. * sysdeps/unix/sysv/linux/arm/clone.S (__clone): Likewise. * sysdeps/unix/sysv/linux/hppa/clone.S (__clone): Likewise. * sysdeps/unix/sysv/linux/i386/clone.S (__clone): Likewise. * sysdeps/unix/sysv/linux/ia64/clone2.S (__clone): Likewise. * sysdeps/unix/sysv/linux/m68k/clone.S (__clone): Likewise. * sysdeps/unix/sysv/linux/microblaze/clone.S (__clone): Likewise. * sysdeps/unix/sysv/linux/mips/clone.S (__clone): Likewise. * sysdeps/unix/sysv/linux/nios2/clone.S (__clone): Likewise. * sysdeps/unix/sysv/linux/powerpc/powerpc32/clone.S (__clone): Likewise. * sysdeps/unix/sysv/linux/powerpc/powerpc64/clone.S (__clone): Likewise. * sysdeps/unix/sysv/linux/s390/s390-32/clone.S (__clone): Likewise. * sysdeps/unix/sysv/linux/s390/s390-64/clone.S (__clone): Likewise. * sysdeps/unix/sysv/linux/sh/clone.S (__clone): Likewise. * sysdeps/unix/sysv/linux/sparc/sparc32/clone.S (__clone): Likewise. * sysdeps/unix/sysv/linux/sparc/sparc64/clone.S (__clone): Likewise. * sysdeps/unix/sysv/linux/tile/clone.S (__clone): Likewise. * sysdeps/unix/sysv/linux/x86_64/clone.S (__clone): Likewise. * sysdeps/unix/sysv/linux/nptl-signals.h (____nptl_is_internal_signal): New function. * sysdeps/unix/sysv/linux/spawni.c: New file.
188 lines
7.1 KiB
C
188 lines
7.1 KiB
C
#ifndef _UNISTD_H
|
|
# include <posix/unistd.h>
|
|
|
|
# ifndef _ISOMAC
|
|
__BEGIN_DECLS
|
|
|
|
libc_hidden_proto (_exit, __noreturn__)
|
|
rtld_hidden_proto (_exit, __noreturn__)
|
|
libc_hidden_proto (alarm)
|
|
libc_hidden_proto (confstr)
|
|
libc_hidden_proto (execl)
|
|
libc_hidden_proto (execle)
|
|
libc_hidden_proto (execlp)
|
|
libc_hidden_proto (execvp)
|
|
libc_hidden_proto (getpid)
|
|
libc_hidden_proto (getsid)
|
|
libc_hidden_proto (getdomainname)
|
|
extern __typeof (getlogin_r) __getlogin_r __nonnull ((1));
|
|
libc_hidden_proto (__getlogin_r)
|
|
libc_hidden_proto (getlogin_r)
|
|
libc_hidden_proto (seteuid)
|
|
libc_hidden_proto (setegid)
|
|
libc_hidden_proto (tcgetpgrp)
|
|
libc_hidden_proto (readlinkat)
|
|
|
|
/* Now define the internal interfaces. */
|
|
extern int __access (const char *__name, int __type);
|
|
extern int __euidaccess (const char *__name, int __type);
|
|
extern __off64_t __lseek64 (int __fd, __off64_t __offset, int __whence);
|
|
extern __off_t __lseek (int __fd, __off_t __offset, int __whence);
|
|
libc_hidden_proto (__lseek)
|
|
extern __off_t __libc_lseek (int __fd, __off_t __offset, int __whence);
|
|
extern __off64_t __libc_lseek64 (int __fd, __off64_t __offset, int __whence);
|
|
extern ssize_t __pread (int __fd, void *__buf, size_t __nbytes,
|
|
__off_t __offset);
|
|
extern ssize_t __libc_pread (int __fd, void *__buf, size_t __nbytes,
|
|
__off_t __offset);
|
|
extern ssize_t __pread64 (int __fd, void *__buf, size_t __nbytes,
|
|
__off64_t __offset);
|
|
extern ssize_t __libc_pread64 (int __fd, void *__buf, size_t __nbytes,
|
|
__off64_t __offset);
|
|
extern ssize_t __pwrite (int __fd, const void *__buf, size_t __n,
|
|
__off_t __offset);
|
|
extern ssize_t __libc_pwrite (int __fd, const void *__buf, size_t __n,
|
|
__off_t __offset);
|
|
extern ssize_t __pwrite64 (int __fd, const void *__buf, size_t __n,
|
|
__off64_t __offset);
|
|
libc_hidden_proto (__pwrite64)
|
|
extern ssize_t __libc_pwrite64 (int __fd, const void *__buf, size_t __n,
|
|
__off64_t __offset) attribute_hidden;
|
|
extern ssize_t __libc_read (int __fd, void *__buf, size_t __n);
|
|
libc_hidden_proto (__libc_read)
|
|
extern ssize_t __libc_write (int __fd, const void *__buf, size_t __n);
|
|
libc_hidden_proto (__libc_write)
|
|
extern int __pipe (int __pipedes[2]);
|
|
libc_hidden_proto (__pipe)
|
|
extern int __pipe2 (int __pipedes[2], int __flags);
|
|
extern unsigned int __sleep (unsigned int __seconds);
|
|
extern int __chown (const char *__file,
|
|
__uid_t __owner, __gid_t __group);
|
|
libc_hidden_proto (__chown)
|
|
extern int __fchown (int __fd,
|
|
__uid_t __owner, __gid_t __group);
|
|
extern int __lchown (const char *__file, __uid_t __owner,
|
|
__gid_t __group);
|
|
extern int __chdir (const char *__path);
|
|
extern int __fchdir (int __fd);
|
|
extern char *__getcwd (char *__buf, size_t __size);
|
|
extern int __rmdir (const char *__path);
|
|
extern int __execvpe (const char *file, char *const argv[],
|
|
char *const envp[]);
|
|
|
|
/* Get the canonical absolute name of the named directory, and put it in SIZE
|
|
bytes of BUF. Returns NULL if the directory couldn't be determined or
|
|
SIZE was too small. If successful, returns BUF. In GNU, if BUF is
|
|
NULL, an array is allocated with `malloc'; the array is SIZE bytes long,
|
|
unless SIZE <= 0, in which case it is as big as necessary. */
|
|
|
|
char *__canonicalize_directory_name_internal (const char *__thisdir,
|
|
char *__buf,
|
|
size_t __size) attribute_hidden;
|
|
|
|
extern int __dup (int __fd);
|
|
libc_hidden_proto (__dup)
|
|
extern int __dup2 (int __fd, int __fd2);
|
|
libc_hidden_proto (__dup2)
|
|
extern int __dup3 (int __fd, int __fd2, int flags);
|
|
libc_hidden_proto (__dup3)
|
|
extern int __execve (const char *__path, char *const __argv[],
|
|
char *const __envp[]);
|
|
extern long int __pathconf (const char *__path, int __name);
|
|
extern long int __fpathconf (int __fd, int __name);
|
|
extern long int __sysconf (int __name);
|
|
libc_hidden_proto (__sysconf)
|
|
extern __pid_t __getpid (void);
|
|
libc_hidden_proto (__getpid)
|
|
extern __pid_t __getppid (void);
|
|
extern __pid_t __setsid (void);
|
|
extern __uid_t __getuid (void);
|
|
extern __uid_t __geteuid (void);
|
|
extern __gid_t __getgid (void);
|
|
extern __gid_t __getegid (void);
|
|
extern int __getgroups (int __size, __gid_t __list[]);
|
|
libc_hidden_proto (__getpgid)
|
|
extern int __group_member (__gid_t __gid);
|
|
extern int __setuid (__uid_t __uid);
|
|
extern int __setreuid (__uid_t __ruid, __uid_t __euid);
|
|
extern int __setgid (__gid_t __gid);
|
|
extern int __setpgid (__pid_t __pid, __pid_t __pgid);
|
|
libc_hidden_proto (__setpgid)
|
|
extern int __setregid (__gid_t __rgid, __gid_t __egid);
|
|
extern int __getresuid (__uid_t *__ruid, __uid_t *__euid, __uid_t *__suid);
|
|
extern int __getresgid (__gid_t *__rgid, __gid_t *__egid, __gid_t *__sgid);
|
|
extern int __setresuid (__uid_t __ruid, __uid_t __euid, __uid_t __suid);
|
|
extern int __setresgid (__gid_t __rgid, __gid_t __egid, __gid_t __sgid);
|
|
libc_hidden_proto (__getresuid)
|
|
libc_hidden_proto (__getresgid)
|
|
libc_hidden_proto (__setresuid)
|
|
libc_hidden_proto (__setresgid)
|
|
extern __pid_t __vfork (void);
|
|
libc_hidden_proto (__vfork)
|
|
extern int __ttyname_r (int __fd, char *__buf, size_t __buflen);
|
|
extern int __isatty (int __fd);
|
|
extern int __link (const char *__from, const char *__to);
|
|
extern int __symlink (const char *__from, const char *__to);
|
|
extern ssize_t __readlink (const char *__path, char *__buf, size_t __len);
|
|
extern int __unlink (const char *__name);
|
|
extern int __gethostname (char *__name, size_t __len);
|
|
extern int __profil (unsigned short int *__sample_buffer, size_t __size,
|
|
size_t __offset, unsigned int __scale);
|
|
extern int __getdtablesize (void);
|
|
extern int __brk (void *__addr);
|
|
extern int __close (int __fd);
|
|
libc_hidden_proto (__close)
|
|
extern int __libc_close (int __fd);
|
|
extern ssize_t __read (int __fd, void *__buf, size_t __nbytes);
|
|
libc_hidden_proto (__read)
|
|
extern ssize_t __write (int __fd, const void *__buf, size_t __n);
|
|
libc_hidden_proto (__write)
|
|
extern __pid_t __fork (void);
|
|
libc_hidden_proto (__fork)
|
|
extern int __getpagesize (void) __attribute__ ((__const__));
|
|
libc_hidden_proto (__getpagesize)
|
|
extern int __ftruncate (int __fd, __off_t __length);
|
|
extern int __ftruncate64 (int __fd, __off64_t __length);
|
|
extern int __truncate (const char *path, __off_t __length);
|
|
extern void *__sbrk (intptr_t __delta);
|
|
libc_hidden_proto (__sbrk)
|
|
|
|
|
|
/* This variable is set nonzero at startup if the process's effective
|
|
IDs differ from its real IDs, or it is otherwise indicated that
|
|
extra security should be used. When this is set the dynamic linker
|
|
and some functions contained in the C library ignore various
|
|
environment variables that normally affect them. */
|
|
extern int __libc_enable_secure attribute_relro;
|
|
extern int __libc_enable_secure_decided;
|
|
rtld_hidden_proto (__libc_enable_secure)
|
|
|
|
|
|
/* Various internal function. */
|
|
extern void __libc_check_standard_fds (void) attribute_hidden;
|
|
|
|
|
|
/* Internal name for fork function. */
|
|
extern __pid_t __libc_fork (void);
|
|
|
|
/* Suspend the process until a signal arrives.
|
|
This always returns -1 and sets `errno' to EINTR. */
|
|
extern int __libc_pause (void);
|
|
/* Not cancelable variant. */
|
|
extern int __pause_nocancel (void) attribute_hidden;
|
|
|
|
extern int __have_pipe2 attribute_hidden;
|
|
extern int __have_dup3 attribute_hidden;
|
|
|
|
extern int __getlogin_r_loginuid (char *name, size_t namesize)
|
|
attribute_hidden;
|
|
|
|
# if IS_IN (rtld)
|
|
# include <dl-unistd.h>
|
|
# endif
|
|
|
|
__END_DECLS
|
|
# endif
|
|
|
|
#endif
|