* [PATCH 08/18] flag parameters: epoll_create
@ 2008-05-05 3:42 Ulrich Drepper
2008-05-05 4:52 ` Davide Libenzi
2008-05-06 21:06 ` Matthew Helsley
0 siblings, 2 replies; 6+ messages in thread
From: Ulrich Drepper @ 2008-05-05 3:42 UTC (permalink / raw)
To: linux-kernel, netdev; +Cc: akpm, davidel, mtk.manpages, torvalds
This patch adds the new epoll_create2 syscall. It extends the old epoll_create
syscall by one parameter which is meant to hold a flag value. In this
patch the only flag supported is EPOLL_CLOEXEC, which causes the close-on-exec
flag for the returned file descriptor to be set.
A new flag EPOLL_CLOEXEC is used instead of reusing O_CLOEXEC to prevent
exhaustion of the int bit field in case we need more flags.
The following test must be adjusted for architectures other than x86 and
x86-64 and in case the syscall numbers changed.
~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
#include <fcntl.h>
#include <stdio.h>
#include <time.h>
#include <unistd.h>
#include <sys/syscall.h>
/* Fall back to the syscall numbers assigned by this patch when the installed
   headers do not define __NR_epoll_create2.  Only x86-64 and i386 are
   covered; any other architecture stops the build until a number is
   supplied.  */
#ifndef __NR_epoll_create2
# ifdef __x86_64__
# define __NR_epoll_create2 291
# elif defined __i386__
# define __NR_epoll_create2 329
# else
# error "need __NR_epoll_create2"
# endif
#endif
/* Flag bit passed to epoll_create2 to request close-on-exec; same value as
   the definition this patch adds to include/linux/eventpoll.h.  */
#define EPOLL_CLOEXEC (1 << 0)
/* Smoke test for the epoll_create2 syscall.

   Creates an epoll descriptor with no flags and verifies FD_CLOEXEC is
   clear, then creates one with EPOLL_CLOEXEC and verifies FD_CLOEXEC is
   set.  Prints "OK" and returns 0 when both checks pass; otherwise prints
   a diagnostic naming the failed step and returns 1.  */
int
main (void)
{
  /* Case 1: no flags -- the descriptor must not be close-on-exec.  */
  int fd = syscall (__NR_epoll_create2, 1, 0);
  if (fd == -1)
    {
      puts ("epoll_create2(0) failed");
      return 1;
    }
  int coe = fcntl (fd, F_GETFD);
  if (coe == -1)
    {
      puts ("fcntl failed");
      return 1;
    }
  if (coe & FD_CLOEXEC)
    {
      puts ("epoll_create2(0) set close-on-exec flag");
      return 1;
    }
  close (fd);

  /* Case 2: EPOLL_CLOEXEC -- the descriptor must be close-on-exec.  */
  fd = syscall (__NR_epoll_create2, 1, EPOLL_CLOEXEC);
  if (fd == -1)
    {
      puts ("epoll_create2(EPOLL_CLOEXEC) failed");
      return 1;
    }
  coe = fcntl (fd, F_GETFD);
  if (coe == -1)
    {
      puts ("fcntl failed");
      return 1;
    }
  if ((coe & FD_CLOEXEC) == 0)
    {
      /* Reached when the flag is missing, so report it as not set.  */
      puts ("epoll_create2(EPOLL_CLOEXEC) did not set close-on-exec flag");
      return 1;
    }
  close (fd);

  puts ("OK");
  return 0;
}
~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
arch/x86/ia32/ia32entry.S | 1 +
arch/x86/kernel/syscall_table_32.S | 1 +
fs/eventpoll.c | 20 ++++++++++++++++++--
include/asm-x86/unistd_32.h | 1 +
include/asm-x86/unistd_64.h | 2 ++
include/linux/eventpoll.h | 2 ++
include/linux/syscalls.h | 1 +
7 files changed, 26 insertions(+), 2 deletions(-)
Signed-off-by: Ulrich Drepper <drepper@redhat.com>
diff --git a/arch/x86/ia32/ia32entry.S b/arch/x86/ia32/ia32entry.S
index b5e329d..37e4992 100644
--- a/arch/x86/ia32/ia32entry.S
+++ b/arch/x86/ia32/ia32entry.S
@@ -733,4 +733,5 @@ ia32_sys_call_table:
.quad compat_sys_timerfd_gettime
.quad compat_sys_signalfd4
.quad sys_eventfd2
+ .quad sys_epoll_create2
ia32_syscall_end:
diff --git a/arch/x86/kernel/syscall_table_32.S b/arch/x86/kernel/syscall_table_32.S
index adff556..f59aba5 100644
--- a/arch/x86/kernel/syscall_table_32.S
+++ b/arch/x86/kernel/syscall_table_32.S
@@ -328,3 +328,4 @@ ENTRY(sys_call_table)
.long sys_timerfd_gettime
.long sys_signalfd4
.long sys_eventfd2
+ .long sys_epoll_create2
diff --git a/fs/eventpoll.c b/fs/eventpoll.c
index 990c01d..7714e91 100644
--- a/fs/eventpoll.c
+++ b/fs/eventpoll.c
@@ -33,6 +33,7 @@
#include <linux/bitops.h>
#include <linux/mutex.h>
#include <linux/anon_inodes.h>
+#include <linux/flagsremap.h>
#include <asm/uaccess.h>
#include <asm/system.h>
#include <asm/io.h>
@@ -1040,16 +1041,26 @@ retry:
return res;
}
+static const struct flags_rmap epoll_file_flags_remap[] = {
+ { EPOLL_CLOEXEC, O_CLOEXEC }
+};
+
/*
* It opens an eventpoll file descriptor. The "size" parameter is there
* for historical reasons, when epoll was using an hash instead of an
* RB tree. With the current implementation, the "size" parameter is ignored
* (besides sanity checks).
*/
-asmlinkage long sys_epoll_create(int size)
+asmlinkage long sys_epoll_create2(int size, int flags)
{
int error, fd = -1;
struct eventpoll *ep;
+ int fflags;
+
+ if (flags_remap(epoll_file_flags_remap,
+ ARRAY_SIZE(epoll_file_flags_remap),
+ flags, &fflags))
+ return -EINVAL;
DNPRINTK(3, (KERN_INFO "[%p] eventpoll: sys_epoll_create(%d)\n",
current, size));
@@ -1068,7 +1079,7 @@ asmlinkage long sys_epoll_create(int size)
* Creates all the items needed to setup an eventpoll file. That is,
* a file structure and a free file descriptor.
*/
- fd = anon_inode_getfd("[eventpoll]", &eventpoll_fops, ep, 0);
+ fd = anon_inode_getfd("[eventpoll]", &eventpoll_fops, ep, fflags);
if (fd < 0)
ep_free(ep);
@@ -1079,6 +1090,11 @@ error_return:
return fd;
}
+asmlinkage long sys_epoll_create(int size)
+{
+ return sys_epoll_create2(size, 0);
+}
+
/*
* The following function implements the controller interface for
* the eventpoll file that enables the insertion/removal/change of
diff --git a/include/linux/eventpoll.h b/include/linux/eventpoll.h
index cf79853..ca3a6e8 100644
--- a/include/linux/eventpoll.h
+++ b/include/linux/eventpoll.h
@@ -16,6 +16,8 @@
#include <linux/types.h>
+/* Flags for epoll_create2. */
+#define EPOLL_CLOEXEC (1 << 0)
/* Valid opcodes to issue to sys_epoll_ctl() */
#define EPOLL_CTL_ADD 1
diff --git a/include/asm-x86/unistd_32.h b/include/asm-x86/unistd_32.h
index 8317d94..b3daf50 100644
--- a/include/asm-x86/unistd_32.h
+++ b/include/asm-x86/unistd_32.h
@@ -334,6 +334,7 @@
#define __NR_timerfd_gettime 326
#define __NR_signalfd4 327
#define __NR_eventfd2 328
+#define __NR_epoll_create2 329
#ifdef __KERNEL__
diff --git a/include/asm-x86/unistd_64.h b/include/asm-x86/unistd_64.h
index fe26e36..5ef6778 100644
--- a/include/asm-x86/unistd_64.h
+++ b/include/asm-x86/unistd_64.h
@@ -645,6 +645,8 @@ __SYSCALL(__NR_fallocate, sys_fallocate)
__SYSCALL(__NR_signalfd4, sys_signalfd4)
#define __NR_eventfd2 290
__SYSCALL(__NR_eventfd2, sys_eventfd2)
+#define __NR_epoll_create2 291
+__SYSCALL(__NR_epoll_create2, sys_epoll_create2)
#ifndef __NO_STUBS
diff --git a/include/linux/syscalls.h b/include/linux/syscalls.h
index 0522f36..aeb2df8 100644
--- a/include/linux/syscalls.h
+++ b/include/linux/syscalls.h
@@ -430,6 +430,7 @@ asmlinkage long sys_poll(struct pollfd __user *ufds, unsigned int nfds,
asmlinkage long sys_select(int n, fd_set __user *inp, fd_set __user *outp,
fd_set __user *exp, struct timeval __user *tvp);
asmlinkage long sys_epoll_create(int size);
+asmlinkage long sys_epoll_create2(int size, int flags);
asmlinkage long sys_epoll_ctl(int epfd, int op, int fd,
struct epoll_event __user *event);
asmlinkage long sys_epoll_wait(int epfd, struct epoll_event __user *events,
^ permalink raw reply related [flat|nested] 6+ messages in thread* Re: [PATCH 08/18] flag parameters: epoll_create
2008-05-05 3:42 [PATCH 08/18] flag parameters: epoll_create Ulrich Drepper
@ 2008-05-05 4:52 ` Davide Libenzi
2008-05-06 21:06 ` Matthew Helsley
1 sibling, 0 replies; 6+ messages in thread
From: Davide Libenzi @ 2008-05-05 4:52 UTC (permalink / raw)
To: Ulrich Drepper
Cc: Linux Kernel Mailing List, netdev, Andrew Morton, mtk.manpages,
Linus Torvalds
On Sun, 4 May 2008, Ulrich Drepper wrote:
> This patch adds the new epoll_create2 syscall. It extends the old epoll_create
> syscall by one parameter which is meant to hold a flag value. In this
> patch the only flag support is EPOLL_CLOEXEC which causes the close-on-exec
> flag for the returned file descriptor to be set.
>
> A new flag EPOLL_CLOEXEC is used instead of reusing O_CLOEXEC to prevent
> exhaustion of the int bit field in case we need more flags.
>
> The following test must be adjusted for architectures other than x86 and
> x86-64 and in case the syscall numbers changed.
> Signed-off-by: Ulrich Drepper <drepper@redhat.com>
Acked-by: Davide Libenzi <davidel@xmailserver.org>
- Davide
^ permalink raw reply [flat|nested] 6+ messages in thread
* Re: [PATCH 08/18] flag parameters: epoll_create
2008-05-05 3:42 [PATCH 08/18] flag parameters: epoll_create Ulrich Drepper
2008-05-05 4:52 ` Davide Libenzi
@ 2008-05-06 21:06 ` Matthew Helsley
2008-05-06 22:41 ` Davide Libenzi
1 sibling, 1 reply; 6+ messages in thread
From: Matthew Helsley @ 2008-05-06 21:06 UTC (permalink / raw)
To: Ulrich Drepper
Cc: linux-kernel, netdev, akpm, davidel, mtk.manpages, torvalds
On Sun, 2008-05-04 at 23:42 -0400, Ulrich Drepper wrote:
> This patch adds the new epoll_create2 syscall. It extends the old epoll_create
> syscall by one parameter which is meant to hold a flag value. In this
> patch the only flag support is EPOLL_CLOEXEC which causes the close-on-exec
> flag for the returned file descriptor to be set.
Davide, Ulrich,
A minor question: Why did you choose to pass the seemingly useless
"size" parameter into the new epoll_create2 system call? I did some
googling for previous threads with this series and couldn't find a
discussion on why you chose to keep it.
Cheers,
-Matt Helsley
^ permalink raw reply [flat|nested] 6+ messages in thread
* Re: [PATCH 08/18] flag parameters: epoll_create
2008-05-06 21:06 ` Matthew Helsley
@ 2008-05-06 22:41 ` Davide Libenzi
2008-05-06 23:10 ` Michael Kerrisk
0 siblings, 1 reply; 6+ messages in thread
From: Davide Libenzi @ 2008-05-06 22:41 UTC (permalink / raw)
To: Matthew Helsley
Cc: Ulrich Drepper, Linux Kernel Mailing List, netdev, Andrew Morton,
mtk.manpages, Linus Torvalds
On Tue, 6 May 2008, Matthew Helsley wrote:
>
> On Sun, 2008-05-04 at 23:42 -0400, Ulrich Drepper wrote:
> > This patch adds the new epoll_create2 syscall. It extends the old epoll_create
> > syscall by one parameter which is meant to hold a flag value. In this
> > patch the only flag support is EPOLL_CLOEXEC which causes the close-on-exec
> > flag for the returned file descriptor to be set.
>
> Davide, Ulrich,
>
> A minor question: Why did you choose to pass the seemingly useless
> "size" parameter into the new epoll_create2 system call? I did some
> googling for previous threads with this series and couldn't find a
> discussion on why you chose to keep it.
The very first implementations were using a hash, and that was a size
hint.
- Davide
^ permalink raw reply [flat|nested] 6+ messages in thread
* Re: [PATCH 08/18] flag parameters: epoll_create
2008-05-06 22:41 ` Davide Libenzi
@ 2008-05-06 23:10 ` Michael Kerrisk
2008-05-06 23:20 ` Davide Libenzi
0 siblings, 1 reply; 6+ messages in thread
From: Michael Kerrisk @ 2008-05-06 23:10 UTC (permalink / raw)
To: Davide Libenzi
Cc: Matthew Helsley, Ulrich Drepper, Linux Kernel Mailing List,
netdev, Andrew Morton, mtk.manpages, Linus Torvalds
On Wed, May 7, 2008 at 12:41 AM, Davide Libenzi <davidel@xmailserver.org> wrote:
>
> On Tue, 6 May 2008, Matthew Helsley wrote:
>
> >
> > On Sun, 2008-05-04 at 23:42 -0400, Ulrich Drepper wrote:
> > > This patch adds the new epoll_create2 syscall. It extends the old epoll_create
> > > syscall by one parameter which is meant to hold a flag value. In this
> > > patch the only flag support is EPOLL_CLOEXEC which causes the close-on-exec
> > > flag for the returned file descriptor to be set.
> >
> > Davide, Ulrich,
> >
> > A minor question: Why did you choose to pass the seemingly useless
> > "size" parameter into the new epoll_create2 system call? I did some
> > googling for previous threads with this series and couldn't find a
> > discussion on why you chose to keep it.
>
> The very first implementations were using an hash, and that was a size
> hint.
So, why not simply remove this argument in the new API, since it is now useless?
^ permalink raw reply [flat|nested] 6+ messages in thread
* Re: [PATCH 08/18] flag parameters: epoll_create
2008-05-06 23:10 ` Michael Kerrisk
@ 2008-05-06 23:20 ` Davide Libenzi
0 siblings, 0 replies; 6+ messages in thread
From: Davide Libenzi @ 2008-05-06 23:20 UTC (permalink / raw)
To: Michael Kerrisk
Cc: Matthew Helsley, Ulrich Drepper, Linux Kernel Mailing List,
netdev, Andrew Morton, mtk.manpages, Linus Torvalds
On Wed, 7 May 2008, Michael Kerrisk wrote:
> On Wed, May 7, 2008 at 12:41 AM, Davide Libenzi <davidel@xmailserver.org> wrote:
> >
> > On Tue, 6 May 2008, Matthew Helsley wrote:
> >
> > >
> > > On Sun, 2008-05-04 at 23:42 -0400, Ulrich Drepper wrote:
> > > > This patch adds the new epoll_create2 syscall. It extends the old epoll_create
> > > > syscall by one parameter which is meant to hold a flag value. In this
> > > > patch the only flag support is EPOLL_CLOEXEC which causes the close-on-exec
> > > > flag for the returned file descriptor to be set.
> > >
> > > Davide, Ulrich,
> > >
> > > A minor question: Why did you choose to pass the seemingly useless
> > > "size" parameter into the new epoll_create2 system call? I did some
> > > googling for previous threads with this series and couldn't find a
> > > discussion on why you chose to keep it.
> >
> > The very first implementations were using an hash, and that was a size
> > hint.
>
> So, why not simply remove this argument in the new API, since it is now useless?
I'm more than OK with that.
- Davide
^ permalink raw reply [flat|nested] 6+ messages in thread
end of thread, other threads:[~2008-05-06 23:20 UTC | newest]
Thread overview: 6+ messages (download: mbox.gz follow: Atom feed
-- links below jump to the message on this page --
2008-05-05 3:42 [PATCH 08/18] flag parameters: epoll_create Ulrich Drepper
2008-05-05 4:52 ` Davide Libenzi
2008-05-06 21:06 ` Matthew Helsley
2008-05-06 22:41 ` Davide Libenzi
2008-05-06 23:10 ` Michael Kerrisk
2008-05-06 23:20 ` Davide Libenzi
This is an external index of several public inboxes,
see mirroring instructions on how to clone and mirror
all data and code used by this external index.