mirror of
				https://git.kernel.org/pub/scm/linux/kernel/git/chenhuacai/linux-loongson
				synced 2025-10-26 16:56:07 +00:00 
			
		
		
		
	 ed8cae8ba0
			
		
	
	
		ed8cae8ba0
		
	
	
	
	
		
			
			This patch introduces the new syscall pipe2 which is like pipe but it also
takes an additional parameter which takes a flag value.  This patch implements
the handling of O_CLOEXEC for the flag.  I did not add support for the new
syscall for the architectures which have a special sys_pipe implementation.  I
think the maintainers of those archs have the chance to go with the unified
implementation but that's up to them.
The implementation introduces do_pipe_flags.  I did that instead of changing
all callers of do_pipe because some of the callers are written in assembler.
I would probably screw up changing the assembly code.  To avoid breaking code
do_pipe is now a small wrapper around do_pipe_flags.  Once all callers are
changed over to do_pipe_flags the old do_pipe function can be removed.
The following test must be adjusted for architectures other than x86 and
x86-64 and in case the syscall numbers changed.
~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
#include <fcntl.h>
#include <stdio.h>
#include <unistd.h>
#include <sys/syscall.h>
#ifndef __NR_pipe2
# ifdef __x86_64__
#  define __NR_pipe2 293
# elif defined __i386__
#  define __NR_pipe2 331
# else
#  error "need __NR_pipe2"
# endif
#endif
int
main (void)
{
  int fd[2];
  if (syscall (__NR_pipe2, fd, 0) != 0)
    {
      puts ("pipe2(0) failed");
      return 1;
    }
  for (int i = 0; i < 2; ++i)
    {
      int coe = fcntl (fd[i], F_GETFD);
      if (coe == -1)
        {
          puts ("fcntl failed");
          return 1;
        }
      if (coe & FD_CLOEXEC)
        {
          printf ("pipe2(0) set close-on-exit for fd[%d]\n", i);
          return 1;
        }
    }
  close (fd[0]);
  close (fd[1]);
  if (syscall (__NR_pipe2, fd, O_CLOEXEC) != 0)
    {
      puts ("pipe2(O_CLOEXEC) failed");
      return 1;
    }
  for (int i = 0; i < 2; ++i)
    {
      int coe = fcntl (fd[i], F_GETFD);
      if (coe == -1)
        {
          puts ("fcntl failed");
          return 1;
        }
      if ((coe & FD_CLOEXEC) == 0)
        {
          printf ("pipe2(O_CLOEXEC) does not set close-on-exit for fd[%d]\n", i);
          return 1;
        }
    }
  close (fd[0]);
  close (fd[1]);
  puts ("OK");
  return 0;
}
~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
Signed-off-by: Ulrich Drepper <drepper@redhat.com>
Acked-by: Davide Libenzi <davidel@xmailserver.org>
Cc: Michael Kerrisk <mtk.manpages@googlemail.com>
Cc: <linux-arch@vger.kernel.org>
Signed-off-by: Andrew Morton <akpm@linux-foundation.org>
Signed-off-by: Linus Torvalds <torvalds@linux-foundation.org>
		
	
			
		
			
				
	
	
		
			287 lines
		
	
	
		
			6.9 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
			
		
		
	
	
			287 lines
		
	
	
		
			6.9 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
| /*
 | |
|  * This file contains various system calls that have different calling
 | |
|  * conventions on different platforms.
 | |
|  *
 | |
|  * Copyright (C) 1999-2000, 2002-2003, 2005 Hewlett-Packard Co
 | |
|  *	David Mosberger-Tang <davidm@hpl.hp.com>
 | |
|  */
 | |
| #include <linux/errno.h>
 | |
| #include <linux/fs.h>
 | |
| #include <linux/mm.h>
 | |
| #include <linux/mman.h>
 | |
| #include <linux/sched.h>
 | |
| #include <linux/shm.h>
 | |
| #include <linux/file.h>		/* doh, must come after sched.h... */
 | |
| #include <linux/smp.h>
 | |
| #include <linux/syscalls.h>
 | |
| #include <linux/highuid.h>
 | |
| #include <linux/hugetlb.h>
 | |
| 
 | |
| #include <asm/shmparam.h>
 | |
| #include <asm/uaccess.h>
 | |
| 
 | |
| unsigned long
 | |
| arch_get_unmapped_area (struct file *filp, unsigned long addr, unsigned long len,
 | |
| 			unsigned long pgoff, unsigned long flags)
 | |
| {
 | |
| 	long map_shared = (flags & MAP_SHARED);
 | |
| 	unsigned long start_addr, align_mask = PAGE_SIZE - 1;
 | |
| 	struct mm_struct *mm = current->mm;
 | |
| 	struct vm_area_struct *vma;
 | |
| 
 | |
| 	if (len > RGN_MAP_LIMIT)
 | |
| 		return -ENOMEM;
 | |
| 
 | |
| 	/* handle fixed mapping: prevent overlap with huge pages */
 | |
| 	if (flags & MAP_FIXED) {
 | |
| 		if (is_hugepage_only_range(mm, addr, len))
 | |
| 			return -EINVAL;
 | |
| 		return addr;
 | |
| 	}
 | |
| 
 | |
| #ifdef CONFIG_HUGETLB_PAGE
 | |
| 	if (REGION_NUMBER(addr) == RGN_HPAGE)
 | |
| 		addr = 0;
 | |
| #endif
 | |
| 	if (!addr)
 | |
| 		addr = mm->free_area_cache;
 | |
| 
 | |
| 	if (map_shared && (TASK_SIZE > 0xfffffffful))
 | |
| 		/*
 | |
| 		 * For 64-bit tasks, align shared segments to 1MB to avoid potential
 | |
| 		 * performance penalty due to virtual aliasing (see ASDM).  For 32-bit
 | |
| 		 * tasks, we prefer to avoid exhausting the address space too quickly by
 | |
| 		 * limiting alignment to a single page.
 | |
| 		 */
 | |
| 		align_mask = SHMLBA - 1;
 | |
| 
 | |
|   full_search:
 | |
| 	start_addr = addr = (addr + align_mask) & ~align_mask;
 | |
| 
 | |
| 	for (vma = find_vma(mm, addr); ; vma = vma->vm_next) {
 | |
| 		/* At this point:  (!vma || addr < vma->vm_end). */
 | |
| 		if (TASK_SIZE - len < addr || RGN_MAP_LIMIT - len < REGION_OFFSET(addr)) {
 | |
| 			if (start_addr != TASK_UNMAPPED_BASE) {
 | |
| 				/* Start a new search --- just in case we missed some holes.  */
 | |
| 				addr = TASK_UNMAPPED_BASE;
 | |
| 				goto full_search;
 | |
| 			}
 | |
| 			return -ENOMEM;
 | |
| 		}
 | |
| 		if (!vma || addr + len <= vma->vm_start) {
 | |
| 			/* Remember the address where we stopped this search:  */
 | |
| 			mm->free_area_cache = addr + len;
 | |
| 			return addr;
 | |
| 		}
 | |
| 		addr = (vma->vm_end + align_mask) & ~align_mask;
 | |
| 	}
 | |
| }
 | |
| 
 | |
| asmlinkage long
 | |
| ia64_getpriority (int which, int who)
 | |
| {
 | |
| 	long prio;
 | |
| 
 | |
| 	prio = sys_getpriority(which, who);
 | |
| 	if (prio >= 0) {
 | |
| 		force_successful_syscall_return();
 | |
| 		prio = 20 - prio;
 | |
| 	}
 | |
| 	return prio;
 | |
| }
 | |
| 
 | |
| /* XXX obsolete, but leave it here until the old libc is gone... */
 | |
| asmlinkage unsigned long
 | |
| sys_getpagesize (void)
 | |
| {
 | |
| 	return PAGE_SIZE;
 | |
| }
 | |
| 
 | |
| asmlinkage unsigned long
 | |
| ia64_brk (unsigned long brk)
 | |
| {
 | |
| 	unsigned long rlim, retval, newbrk, oldbrk;
 | |
| 	struct mm_struct *mm = current->mm;
 | |
| 
 | |
| 	/*
 | |
| 	 * Most of this replicates the code in sys_brk() except for an additional safety
 | |
| 	 * check and the clearing of r8.  However, we can't call sys_brk() because we need
 | |
| 	 * to acquire the mmap_sem before we can do the test...
 | |
| 	 */
 | |
| 	down_write(&mm->mmap_sem);
 | |
| 
 | |
| 	if (brk < mm->end_code)
 | |
| 		goto out;
 | |
| 	newbrk = PAGE_ALIGN(brk);
 | |
| 	oldbrk = PAGE_ALIGN(mm->brk);
 | |
| 	if (oldbrk == newbrk)
 | |
| 		goto set_brk;
 | |
| 
 | |
| 	/* Always allow shrinking brk. */
 | |
| 	if (brk <= mm->brk) {
 | |
| 		if (!do_munmap(mm, newbrk, oldbrk-newbrk))
 | |
| 			goto set_brk;
 | |
| 		goto out;
 | |
| 	}
 | |
| 
 | |
| 	/* Check against unimplemented/unmapped addresses: */
 | |
| 	if ((newbrk - oldbrk) > RGN_MAP_LIMIT || REGION_OFFSET(newbrk) > RGN_MAP_LIMIT)
 | |
| 		goto out;
 | |
| 
 | |
| 	/* Check against rlimit.. */
 | |
| 	rlim = current->signal->rlim[RLIMIT_DATA].rlim_cur;
 | |
| 	if (rlim < RLIM_INFINITY && brk - mm->start_data > rlim)
 | |
| 		goto out;
 | |
| 
 | |
| 	/* Check against existing mmap mappings. */
 | |
| 	if (find_vma_intersection(mm, oldbrk, newbrk+PAGE_SIZE))
 | |
| 		goto out;
 | |
| 
 | |
| 	/* Ok, looks good - let it rip. */
 | |
| 	if (do_brk(oldbrk, newbrk-oldbrk) != oldbrk)
 | |
| 		goto out;
 | |
| set_brk:
 | |
| 	mm->brk = brk;
 | |
| out:
 | |
| 	retval = mm->brk;
 | |
| 	up_write(&mm->mmap_sem);
 | |
| 	force_successful_syscall_return();
 | |
| 	return retval;
 | |
| }
 | |
| 
 | |
| /*
 | |
|  * On IA-64, we return the two file descriptors in ret0 and ret1 (r8
 | |
|  * and r9) as this is faster than doing a copy_to_user().
 | |
|  */
 | |
| asmlinkage long
 | |
| sys_pipe (void)
 | |
| {
 | |
| 	struct pt_regs *regs = task_pt_regs(current);
 | |
| 	int fd[2];
 | |
| 	int retval;
 | |
| 
 | |
| 	retval = do_pipe_flags(fd, 0);
 | |
| 	if (retval)
 | |
| 		goto out;
 | |
| 	retval = fd[0];
 | |
| 	regs->r9 = fd[1];
 | |
|   out:
 | |
| 	return retval;
 | |
| }
 | |
| 
 | |
| int ia64_mmap_check(unsigned long addr, unsigned long len,
 | |
| 		unsigned long flags)
 | |
| {
 | |
| 	unsigned long roff;
 | |
| 
 | |
| 	/*
 | |
| 	 * Don't permit mappings into unmapped space, the virtual page table
 | |
| 	 * of a region, or across a region boundary.  Note: RGN_MAP_LIMIT is
 | |
| 	 * equal to 2^n-PAGE_SIZE (for some integer n <= 61) and len > 0.
 | |
| 	 */
 | |
| 	roff = REGION_OFFSET(addr);
 | |
| 	if ((len > RGN_MAP_LIMIT) || (roff > (RGN_MAP_LIMIT - len)))
 | |
| 		return -EINVAL;
 | |
| 	return 0;
 | |
| }
 | |
| 
 | |
| static inline unsigned long
 | |
| do_mmap2 (unsigned long addr, unsigned long len, int prot, int flags, int fd, unsigned long pgoff)
 | |
| {
 | |
| 	struct file *file = NULL;
 | |
| 
 | |
| 	flags &= ~(MAP_EXECUTABLE | MAP_DENYWRITE);
 | |
| 	if (!(flags & MAP_ANONYMOUS)) {
 | |
| 		file = fget(fd);
 | |
| 		if (!file)
 | |
| 			return -EBADF;
 | |
| 
 | |
| 		if (!file->f_op || !file->f_op->mmap) {
 | |
| 			addr = -ENODEV;
 | |
| 			goto out;
 | |
| 		}
 | |
| 	}
 | |
| 
 | |
| 	/* Careful about overflows.. */
 | |
| 	len = PAGE_ALIGN(len);
 | |
| 	if (!len || len > TASK_SIZE) {
 | |
| 		addr = -EINVAL;
 | |
| 		goto out;
 | |
| 	}
 | |
| 
 | |
| 	down_write(¤t->mm->mmap_sem);
 | |
| 	addr = do_mmap_pgoff(file, addr, len, prot, flags, pgoff);
 | |
| 	up_write(¤t->mm->mmap_sem);
 | |
| 
 | |
| out:	if (file)
 | |
| 		fput(file);
 | |
| 	return addr;
 | |
| }
 | |
| 
 | |
| /*
 | |
|  * mmap2() is like mmap() except that the offset is expressed in units
 | |
|  * of PAGE_SIZE (instead of bytes).  This allows to mmap2() (pieces
 | |
|  * of) files that are larger than the address space of the CPU.
 | |
|  */
 | |
| asmlinkage unsigned long
 | |
| sys_mmap2 (unsigned long addr, unsigned long len, int prot, int flags, int fd, long pgoff)
 | |
| {
 | |
| 	addr = do_mmap2(addr, len, prot, flags, fd, pgoff);
 | |
| 	if (!IS_ERR((void *) addr))
 | |
| 		force_successful_syscall_return();
 | |
| 	return addr;
 | |
| }
 | |
| 
 | |
| asmlinkage unsigned long
 | |
| sys_mmap (unsigned long addr, unsigned long len, int prot, int flags, int fd, long off)
 | |
| {
 | |
| 	if (offset_in_page(off) != 0)
 | |
| 		return -EINVAL;
 | |
| 
 | |
| 	addr = do_mmap2(addr, len, prot, flags, fd, off >> PAGE_SHIFT);
 | |
| 	if (!IS_ERR((void *) addr))
 | |
| 		force_successful_syscall_return();
 | |
| 	return addr;
 | |
| }
 | |
| 
 | |
| asmlinkage unsigned long
 | |
| ia64_mremap (unsigned long addr, unsigned long old_len, unsigned long new_len, unsigned long flags,
 | |
| 	     unsigned long new_addr)
 | |
| {
 | |
| 	extern unsigned long do_mremap (unsigned long addr,
 | |
| 					unsigned long old_len,
 | |
| 					unsigned long new_len,
 | |
| 					unsigned long flags,
 | |
| 					unsigned long new_addr);
 | |
| 
 | |
| 	down_write(¤t->mm->mmap_sem);
 | |
| 	{
 | |
| 		addr = do_mremap(addr, old_len, new_len, flags, new_addr);
 | |
| 	}
 | |
| 	up_write(¤t->mm->mmap_sem);
 | |
| 
 | |
| 	if (IS_ERR((void *) addr))
 | |
| 		return addr;
 | |
| 
 | |
| 	force_successful_syscall_return();
 | |
| 	return addr;
 | |
| }
 | |
| 
 | |
| #ifndef CONFIG_PCI
 | |
| 
 | |
| asmlinkage long
 | |
| sys_pciconfig_read (unsigned long bus, unsigned long dfn, unsigned long off, unsigned long len,
 | |
| 		    void *buf)
 | |
| {
 | |
| 	return -ENOSYS;
 | |
| }
 | |
| 
 | |
| asmlinkage long
 | |
| sys_pciconfig_write (unsigned long bus, unsigned long dfn, unsigned long off, unsigned long len,
 | |
| 		     void *buf)
 | |
| {
 | |
| 	return -ENOSYS;
 | |
| }
 | |
| 
 | |
| #endif /* CONFIG_PCI */
 |