From: Manfred Spraul <manfred@colorfullife.com>
To: Ingo Molnar <mingo@elte.hu>
Cc: linux-kernel@vger.kernel.org
Subject: Re: [RFC] O(1) proc_pid_readdir
Date: Sat, 22 Mar 2003 17:02:47 +0100 [thread overview]
Message-ID: <3E7C8927.5030808@colorfullife.com> (raw)
In-Reply-To: <Pine.LNX.4.44.0303162203590.11399-100000@localhost.localdomain>
[-- Attachment #1: Type: text/plain, Size: 2715 bytes --]
Ingo Molnar wrote:
>On Sun, 16 Mar 2003, Manfred Spraul wrote:
>
>
>
>>Below is a proposal to get rid of the quadratic behaviour of
>>proc_pid_readir(): Instead of storing the task number in f_pos and
>>walking tasks by tasklist order, the pid is stored in f_pos and the
>>tasks are walked by (hash-mangled) pid order.
>>
>>
>
>have you seen my "procfs/procps threading performance speedup" patch? It
>does something like this.
>
>
The implementation is flawed:
>+static int get_pid_list(int index, int *pids, struct file *filp)
> {
>- struct task_struct *p;
>- int nr_pids = 0;
>+ int nr_pids = 0, pid = 0, pid_cursor = (int)filp->private_data;
>+ struct task_struct *g = NULL, *p = NULL;
>
>- index--;
> read_lock(&tasklist_lock);
>- for_each_process(p) {
>- int pid = p->pid;
>- if (!pid)
>- continue;
>+ if (pid_cursor) {
>+ p = find_task_by_pid(pid_cursor);
>+ g = p->group_leader;
>+ }
>+ if (!p) {
>+ g = p = &init_task;
>+ index--;
>+ } else
>+ index = 0;
>+
>+ goto inside;
>+
>+ __do_each_thread(g, p) {
> if (--index >= 0)
> continue;
>- pids[nr_pids] = pid;
>+ pid = p->pid;
>+ if (!pid)
>+ BUG();
>+ if (p->tgid != p->pid)
>+ pids[nr_pids] = -pid;
>+ else
>+ pids[nr_pids] = pid;
> nr_pids++;
> if (nr_pids >= PROC_MAXPIDS)
>- break;
>- }
>+ goto out;
>+inside:
>+ ;
>+ } while_each_thread(g, p);
>+out:
>+ filp->private_data = (void *)pid;
> read_unlock(&tasklist_lock);
>+
> return nr_pids;
> }
>
>
get_pid_list stores up to 20 pids in an array, and the last pid in the
array is stored in filp->private_data, for the next call.
> int proc_pid_readdir(struct file * filp, void * dirent, filldir_t filldir)
> {
>- unsigned int pid_array[PROC_MAXPIDS];
>+ int pid_array[PROC_MAXPIDS];
> char buf[PROC_NUMBUF];
> unsigned int nr = filp->f_pos - FIRST_PROCESS_ENTRY;
> unsigned int nr_pids, i;
>@@ -1192,14 +1217,16 @@ int proc_pid_readdir(struct file * filp,
> nr++;
> }
>
>- nr_pids = get_pid_list(nr, pid_array);
>+ nr_pids = get_pid_list(nr, pid_array, filp);
>
> for (i = 0; i < nr_pids; i++) {
>- int pid = pid_array[i];
>+ int pid = abs(pid_array[i]);
> ino_t ino = fake_ino(pid,PROC_PID_INO);
> unsigned long j = PROC_NUMBUF;
>
> do buf[--j] = '0' + (pid % 10); while (pid/=10);
>+ if (pid_array[i] < 0)
>+ buf[--j] = '.';
>
> if (filldir(dirent, buf+j, PROC_NUMBUF-j, filp->f_pos, ino, DT_DIR) < 0)
> break;
>
>
But: proc_pid_readdir() doesn't use all 20 pids: It may return early if
the user space buffer is full. Then your patch skips a few threads.
Attached is my test app:
./getdents /proc 0 24 returns just 3 threads,
./getdents /proc 0 4000 returns (probably) all: 66 threads or processes.
--
Manfred
[-- Attachment #2: getdents.cpp --]
[-- Type: text/plain, Size: 2182 bytes --]
/*
* gendents.cpp: getdents tester.
*
* Copyright (C) 1999, 2001, 2003 by Manfred Spraul.
* All rights reserved except the rights granted by the GPL.
*
* Redistribution of this file is permitted under the terms of the GNU
* General Public License (GPL) version 2 or later.
* $Header: /pub/home/manfred/cvs-tree/getdents/getdents.cpp,v 1.2 2003/03/22 16:01:34 manfred Exp $
*/
#include <stdio.h>
#include <stdlib.h>
#include <unistd.h>
#include <linux/types.h>
#include <linux/dirent.h>
#include <linux/unistd.h>
#include <sys/types.h>
#include <sys/stat.h>
#include <fcntl.h>
#include <errno.h>
#define BUFSZ 131072
unsigned char entries[BUFSZ];
#define _syscall3(type,name,type1,arg1,type2,arg2,type3,arg3) \
type name(type1 arg1,type2 arg2,type3 arg3) \
{ \
long __res; \
__asm__ volatile ("int $0x80" \
: "=a" (__res) \
: "0" (__NR_##name),"b" ((long)(arg1)),"c" ((long)(arg2)), \
"d" ((long)(arg3))); \
__syscall_return(type,__res); \
}
_syscall3(int, getdents, uint, fd, struct dirent *, dirp, uint, count);
static void hexdump(unsigned char* array, int len)
{
int i;
for(i=0;i<len;i++) {
if ((i%16) == 0)
printf("\n%03x:", i);
if((i%16)==8)
printf(":");
printf("%02x ",(unsigned)array[i]);
}
printf("\n");
}
int main(int argc, char **argv)
{
int fd, retval, bufsz;
printf("GETDENTS <dir> <offset> [<bufsz>]\n");
if (argc < 3 || argc > 4)
return 1;
fd = open(argv[1],O_RDONLY);
if (fd < 0) {
printf("open failed, errno %d.\n", errno);
return 2;
}
if (argc == 4)
bufsz = atoi(argv[3]);
else
bufsz = BUFSZ;
lseek(fd, atoi(argv[2]), SEEK_SET);
for(;;) {
int offset = 0;
retval = getdents(fd, (struct dirent *)entries, bufsz);
printf("retval is %d.\n", retval);
if (retval <= 0)
break;
while (offset < retval) {
struct dirent *walk = (struct dirent *)(&entries[offset]);
// printf("dirent: %lxh.\n", (unsigned long)walk);
// printf("dirent->d_ino = %ld.\n", walk->d_ino);
// printf("dirent->d_off = %ld.\n", walk->d_off);
// printf("dirent->d_reclen = %ld.\n", walk->d_reclen);
printf("dirent->d_name = '%s'@%ld\n", walk->d_name, walk->d_off);
offset += walk->d_reclen;
}
}
return 0;
}
prev parent reply other threads:[~2003-03-22 15:55 UTC|newest]
Thread overview: 15+ messages / expand[flat|nested] mbox.gz Atom feed top
2003-03-16 15:52 [RFC] O(1) proc_pid_readdir Manfred Spraul
2003-03-16 20:10 ` William Lee Irwin III
2003-03-16 21:05 ` Ingo Molnar
2003-03-16 21:24 ` Manfred Spraul
2003-03-16 21:35 ` William Lee Irwin III
2003-03-16 21:45 ` Manfred Spraul
2003-03-17 6:22 ` Ingo Molnar
2003-03-17 7:03 ` William Lee Irwin III
2003-03-17 18:17 ` Manfred Spraul
2003-03-18 0:14 ` William Lee Irwin III
2003-03-18 0:48 ` William Lee Irwin III
2003-03-18 1:22 ` William Lee Irwin III
2003-03-18 9:25 ` William Lee Irwin III
2003-03-17 6:19 ` Ingo Molnar
2003-03-22 16:02 ` Manfred Spraul [this message]
Reply instructions:
You may reply publicly to this message via plain-text email
using any one of the following methods:
* Save the following mbox file, import it into your mail client,
and reply-to-all from there: mbox
Avoid top-posting and favor interleaved quoting:
https://en.wikipedia.org/wiki/Posting_style#Interleaved_style
* Reply using the --to, --cc, and --in-reply-to
switches of git-send-email(1):
git send-email \
--in-reply-to=3E7C8927.5030808@colorfullife.com \
--to=manfred@colorfullife.com \
--cc=linux-kernel@vger.kernel.org \
--cc=mingo@elte.hu \
/path/to/YOUR_REPLY
https://kernel.org/pub/software/scm/git/docs/git-send-email.html
* If your mail client supports setting the In-Reply-To header
via mailto: links, try the mailto: link
Be sure your reply has a Subject: header at the top and a blank line
before the message body.
This is a public inbox, see mirroring instructions
for how to clone and mirror all data and code used for this inbox