From: Janani Venkataraman <jananive@linux.vnet.ibm.com>
To: Pavel Emelyanov <xemul@parallels.com>
Cc: amwang@redhat.com, procps@freelists.org, oleg@redhat.com,
rdunlap@xenotime.net, tarundsk@linux.vnet.ibm.com,
aravinda@linux.vnet.ibm.com, hch@lst.de, mhiramat@redhat.com,
jeremy.fitzhardinge@citrix.com, suzuki@linux.vnet.ibm.com,
coreutils@gnu.org, kosaki.motohiro@jp.fujitsu.com,
adobriyan@gmail.com, util-linux@vger.kernel.org,
james.hogan@imgtec.com, roland@hack.frob.com,
ananth@linux.vnet.ibm.com, gorcunov@openvz.org,
avagin@openvz.org, linux-kernel@vger.kernel.org,
eparis@redhat.com, d.hatayama@jp.fujitsu.com,
andi@firstfloor.org, tj@kernel.org, akpm@linux-foundation.org,
torvalds@linux-foundation.org
Subject: Re: [PATCH 04/33] Hold threads
Date: Fri, 18 Apr 2014 19:34:37 +0530 [thread overview]
Message-ID: <535130F5.3030700@linux.vnet.ibm.com> (raw)
In-Reply-To: <532B3B00.6080201@parallels.com>
[-- Attachment #1: Type: text/plain, Size: 6087 bytes --]
On 03/21/2014 12:31 AM, Pavel Emelyanov wrote:
> On 03/20/2014 01:39 PM, Janani Venkataraman wrote:
>> Getting number of threads and their respective IDs through /proc/pid/stat and
>> /proc/pid/task.
>>
>> The threads are then seized and interrupted. After the dump is taken they are
>> detached.
>>
>> Signed-off-by: Janani Venkataraman <jananive@linux.vnet.ibm.com>
>> ---
>> +/* Gets the Thread IDS and siezes them */
>> +int seize_threads(int pid)
>> +{
>> + char filename[40];
>> + DIR *dir;
>> + int ct = 0, ret = 0, tmp_tid;
>> + struct dirent *entry;
>> + char state;
>> +
>> + ret = get_thread_count(pid);
>> + if (ret == -1)
>> + return -1;
>> +
>> + cp.thread_count = ret;
>> + cp.t_id = calloc(cp.thread_count, sizeof(int));
>> + if (!cp.t_id) {
>> + status = errno;
>> + gencore_log("Could not allocate memory for thread_ids.\n");
>> + return -1;
>> + }
>> +
>> + snprintf(filename, 40, "/proc/%d/task", pid);
>> + dir = opendir(filename);
>> +
>> + while ((entry = readdir(dir))) {
> This simple loop is not enough -- threads may appear and disappear while
> you do the readdir and seize, so you should scan it several times to
> make sure you caught all the threads.
>
> You can look at how this is done in CRIU in cr-dump,c:collect_threads().
>
If new threads are created after a gencore has been issued for the
process, we need to ensure that those threads are captured and
seized as well. Hence we read /proc/pid/task repeatedly until no
new threads are found.
Each pass does a readdir over the directory; any thread that is not
already recorded is seized, interrupted and inserted at its sorted
position in cp.t_id. The scan is repeated until a pass finds no new threads.
Signed-off-by: Suzuki K. Poulose <suzuki@in.ibm.com>
Signed-off-by: Janani Venkataraman <jananive@linux.vnet.ibm.com>
---
src/coredump.c | 161 +++++++++++++++++++++++++++++++++++++++++---------------
1 file changed, 117 insertions(+), 44 deletions(-)
diff --git a/src/coredump.c b/src/coredump.c
index 49af7b3..2247ba2 100644
--- a/src/coredump.c
+++ b/src/coredump.c
@@ -93,68 +93,141 @@ void init_core(void)
memset(&cp, 0, sizeof(struct core_proc));
}
-/* Gets the Thread IDS and siezes them */
-int seize_threads(int pid)
+/* Check if a particular TID is already added to cp.t_id */
+int search(int pid, int n)
{
- char filename[40];
- DIR *dir;
- int ct = 0, ret = 0, tmp_tid;
- struct dirent *entry;
- char state;
+ int first, last, middle;
+
+ first = 0;
+ last = n - 1;
+
+ while( first <= last ) {
+
+ middle = (first + last)/2;
+
+ if ( cp.t_id[middle] < pid )
+ first = middle + 1;
+ else if ( cp.t_id[middle] == pid )
+ return 1;
+ else
+ last = middle - 1;
+ }
- ret = get_thread_count(pid);
- if (ret == -1)
- return -1;
+ return 0;
+}
- cp.thread_count = ret;
- cp.t_id = calloc(cp.thread_count, sizeof(int));
- if (!cp.t_id) {
- status = errno;
- gencore_log("Could not allocate memory for thread_ids.\n");
- return -1;
+/* Insert a TID to cp.t_id */
+void insert (int tid, int n)
+{
+ int i, j, flag = 0;
+
+ for (i = 0; (i < n) && (tid > cp.t_id[i]); i++);
+
+ j = i;
+ while (j < n) {
+ cp.t_id[j + 1] = cp.t_id[j];
+ j++;
}
+ cp.t_id[i] = tid;
+}
+
+/*
+ * Read the directory /proc/pid/task again and again
+ * till we find no new threads.
+ */
+int scan_threads(int pid)
+{
+ DIR *dir;
+ struct dirent *entry;
+ int tmp_tid, ret = 0, k = 0;
+ char state;
+ char filename[40];
+
snprintf(filename, 40, "/proc/%d/task", pid);
+
dir = opendir(filename);
while ((entry = readdir(dir))) {
if (entry->d_type == DT_DIR && entry->d_name[0] != '.') {
tmp_tid = atoi(entry->d_name);
- ret = ptrace(PTRACE_SEIZE, tmp_tid, 0, 0);
- if (ret) {
- state = get_thread_status(tmp_tid);
- if (state == 'Z')
- goto assign;
- status = errno;
- gencore_log("Could not seize thread: %d\n",
- tmp_tid);
- break;
- }
- ret = ptrace(PTRACE_INTERRUPT, tmp_tid, 0, 0);
- if (ret) {
- state = get_thread_status(tmp_tid);
- if (state == 'Z')
- goto assign;
- status = errno;
- gencore_log("Could not interrupt thread: %d\n",
- tmp_tid);
- break;
- }
-assign:
- /* If a new thread, is created after we fetch the thread_count,
- * we may encounter a buffer overflow situation in the cp_tid.
- * Hence we check this case and re-allocate memory if required.
+ /*
+ * Search for the thread, if not present, seize, interrupt
+ * and insert it in cp.t_id.
*/
- cp.t_id[ct++] = tmp_tid;
+ if (!search(tmp_tid, cp.thread_count)) {
+
+ k++;
+
+ ret = ptrace(PTRACE_SEIZE, tmp_tid, 0, 0);
+ if (ret) {
+ state = get_thread_status(tmp_tid);
+ if (state == 'Z')
+ goto assign;
+ status = errno;
+ gencore_log("Could not seize thread: %d\n",
+ tmp_tid);
+ break;
+ }
+
+ ret = ptrace(PTRACE_INTERRUPT, tmp_tid, 0, 0);
+ if (ret) {
+ state = get_thread_status(tmp_tid);
+ if (state == 'Z')
+ goto assign;
+ status = errno;
+ gencore_log("Could not interrupt thread: %d\n",
+ tmp_tid);
+ break;
+ }
+assign:
+ cp.t_id = (char *) realloc(cp.t_id, (cp.thread_count + 1) * sizeof(int));
+ if (!cp.t_id) {
+ status = errno;
+ gencore_log("Could not allocate memory for thread_ids.\n");
+ return -1;
+ }
+
+ insert(tmp_tid, cp.thread_count);
+ cp.thread_count ++;
+ }
}
}
- /* Reassigning based on successful seizes */
- cp.thread_count = ct;
-
closedir(dir);
+ if (!k)
+ return 1;
+
+ return ret;
+}
+
+/* Gets the Thread IDS and siezes them */
+int seize_threads(int pid)
+{
+ int ret = 0;
+
+ cp.thread_count = 0;
+ cp.t_id = calloc(cp.thread_count, sizeof(int));
+ if (!cp.t_id) {
+ status = errno;
+ gencore_log("Could not allocate memory for thread_ids.\n");
+ return -1;
+ }
+
+ /*
+ * Read the directory /proc/pid/task again and again
+ * till we find no new threads.
+ */
+
+ do {
+ ret = scan_threads(pid);
+ } while (ret == 0);
+
/* Successful seize and interrupt on all threads makes ret = 0 */
+ if (ret == 1)
+ return 0;
+
return ret;
}
Thanks.
Janani
[-- Attachment #2: Type: text/html, Size: 6968 bytes --]
next prev parent reply other threads:[~2014-04-18 14:04 UTC|newest]
Thread overview: 44+ messages / expand[flat|nested] mbox.gz Atom feed top
2014-03-20 9:39 [PATCH 00/33] [RFC] Non disruptive application core dump infrastructure Janani Venkataraman
2014-03-20 9:39 ` [PATCH 01/33] Configure and Make files Janani Venkataraman
2014-03-20 9:39 ` [PATCH 02/33] Validity of arguments Janani Venkataraman
2014-03-20 9:39 ` [PATCH 03/33] Process Status Janani Venkataraman
2014-03-20 9:39 ` [PATCH 04/33] Hold threads Janani Venkataraman
2014-03-20 19:01 ` Pavel Emelyanov
2014-03-25 6:58 ` Janani Venkataraman
2014-04-18 14:04 ` Janani Venkataraman [this message]
2014-03-20 9:39 ` [PATCH 05/33] Fetching Memory maps Janani Venkataraman
2014-03-20 9:39 ` [PATCH 06/33] Check ELF class Janani Venkataraman
2014-03-20 9:39 ` [PATCH 07/33] Do elf_coredump Janani Venkataraman
2014-03-20 9:40 ` [PATCH 08/33] Fills elf header Janani Venkataraman
2014-03-20 9:40 ` [PATCH 09/33] Adding notes infrastructure Janani Venkataraman
2014-03-20 9:40 ` [PATCH 10/33] Populates PRPS info Janani Venkataraman
2014-03-20 9:40 ` [PATCH 11/33] Populate AUXV Janani Venkataraman
2014-03-20 9:40 ` [PATCH 12/33] Fetch File maps Janani Venkataraman
2014-03-20 9:41 ` [PATCH 13/33] Fetching thread specific Notes Janani Venkataraman
2014-03-20 9:41 ` [PATCH 14/33] Populating Program Headers Janani Venkataraman
2014-03-20 9:41 ` [PATCH 15/33] Updating Offset Janani Venkataraman
2014-03-20 9:41 ` [PATCH 16/33] Writing to core file Janani Venkataraman
2014-03-20 9:41 ` [PATCH 17/33] Daemonizing the Process Janani Venkataraman
2014-03-20 9:41 ` [PATCH 18/33] Socket operations Janani Venkataraman
2014-03-20 9:41 ` [PATCH 19/33] Block till request Janani Venkataraman
2014-03-20 9:41 ` [PATCH 20/33] Handling Requests Janani Venkataraman
2014-03-20 9:41 ` [PATCH 21/33] Get Clients PID Janani Venkataraman
2014-03-20 9:41 ` [PATCH 22/33] Dump the task Janani Venkataraman
2014-03-20 9:42 ` [PATCH 23/33] Handling SIG TERM of the daemon Janani Venkataraman
2014-03-20 9:42 ` [PATCH 24/33] Handling SIG TERM of the child Janani Venkataraman
2014-03-20 9:42 ` [PATCH 25/33] Systemd Socket ID retrieval Janani Venkataraman
2014-03-20 9:42 ` [PATCH 26/33] [libgencore] Setting up Connection Janani Venkataraman
2014-03-20 9:42 ` [PATCH 27/33] [libgencore] Request for dump Janani Venkataraman
2014-03-20 9:43 ` [PATCH 28/33] Man pages Janani Venkataraman
2014-03-20 9:43 ` [PATCH 29/33] Automake files for the doc folder Janani Venkataraman
2014-03-20 9:43 ` [PATCH 30/33] README, COPYING, Changelog Janani Venkataraman
2014-03-20 9:43 ` [PATCH 31/33] Spec file Janani Venkataraman
2014-03-20 9:43 ` [PATCH 32/33] Socket and Service files Janani Venkataraman
2014-03-20 9:44 ` [PATCH 33/33] Support check Janani Venkataraman
2014-03-20 10:24 ` [PATCH 00/33] [RFC] Non disruptive application core dump infrastructure Pádraig Brady
2014-03-21 8:17 ` Karel Zak
2014-03-21 15:02 ` Phillip Susi
2014-03-24 9:43 ` Janani Venkataraman
2014-03-24 13:54 ` Phillip Susi
2014-07-03 12:59 ` Suzuki K. Poulose
2014-03-24 9:38 ` Janani Venkataraman
Reply instructions:
You may reply publicly to this message via plain-text email
using any one of the following methods:
* Save the following mbox file, import it into your mail client,
and reply-to-all from there: mbox
Avoid top-posting and favor interleaved quoting:
https://en.wikipedia.org/wiki/Posting_style#Interleaved_style
* Reply using the --to, --cc, and --in-reply-to
switches of git-send-email(1):
git send-email \
--in-reply-to=535130F5.3030700@linux.vnet.ibm.com \
--to=jananive@linux.vnet.ibm.com \
--cc=adobriyan@gmail.com \
--cc=akpm@linux-foundation.org \
--cc=amwang@redhat.com \
--cc=ananth@linux.vnet.ibm.com \
--cc=andi@firstfloor.org \
--cc=aravinda@linux.vnet.ibm.com \
--cc=avagin@openvz.org \
--cc=coreutils@gnu.org \
--cc=d.hatayama@jp.fujitsu.com \
--cc=eparis@redhat.com \
--cc=gorcunov@openvz.org \
--cc=hch@lst.de \
--cc=james.hogan@imgtec.com \
--cc=jeremy.fitzhardinge@citrix.com \
--cc=kosaki.motohiro@jp.fujitsu.com \
--cc=linux-kernel@vger.kernel.org \
--cc=mhiramat@redhat.com \
--cc=oleg@redhat.com \
--cc=procps@freelists.org \
--cc=rdunlap@xenotime.net \
--cc=roland@hack.frob.com \
--cc=suzuki@linux.vnet.ibm.com \
--cc=tarundsk@linux.vnet.ibm.com \
--cc=tj@kernel.org \
--cc=torvalds@linux-foundation.org \
--cc=util-linux@vger.kernel.org \
--cc=xemul@parallels.com \
/path/to/YOUR_REPLY
https://kernel.org/pub/software/scm/git/docs/git-send-email.html
* If your mail client supports setting the In-Reply-To header
via mailto: links, try the mailto: link
Be sure your reply has a Subject: header at the top and a blank line
before the message body.
This is an external index of several public inboxes,
see mirroring instructions on how to clone and mirror
all data and code used by this external index.