git.vger.kernel.org archive mirror
 help / color / mirror / Atom feed
From: Ramsay Jones <ramsay@ramsayjones.plus.com>
To: David Turner <dturner@twopensource.com>,
	git@vger.kernel.org, pclouds@gmail.com
Subject: Re: [PATCH] index-helper: use watchman to avoid refreshing index with lstat()
Date: Fri, 13 May 2016 21:17:49 +0100	[thread overview]
Message-ID: <5736366D.6080706@ramsayjones.plus.com> (raw)
In-Reply-To: <1463164054-15342-1-git-send-email-dturner@twopensource.com>



On 13/05/16 19:27, David Turner wrote:
> From: Nguyễn Thái Ngọc Duy <pclouds@gmail.com>
[snip]

> +
> +static void reply_to_poke(int client_fd, const char *pid_buf)
> +{
> +	char *capabilities;
> +	struct strbuf sb = STRBUF_INIT;
> +
> +#ifdef USE_WATCHMAN
> +	pid_t client_pid = strtoull(pid_buf, NULL, 10);
> +
> +	prepare_index(client_pid);
> +#endif
> +	capabilities = strchr(pid_buf, ' ');

So, if the pid is *not* followed by a space, strchr() finds nothing
and capabilities will be NULL here, and ...

> +
> +	if (!strcmp(capabilities, " watchman"))

... we segfault here.

> +#ifdef USE_WATCHMAN
> +		packet_buf_write(&sb, "OK watchman");
> +#else
> +		packet_buf_write(&sb, "NAK watchman");
> +#endif
> +	else
> +		packet_buf_write(&sb, "OK");
> +	if (write_in_full(client_fd, sb.buf, sb.len) != sb.len)
> +		warning(_("client write failed"));
> +}
> +
>  static void loop(int fd, int idle_in_seconds)
>  {
>  	assert(idle_in_seconds < INT_MAX / 1000);
> @@ -252,11 +341,15 @@ static void loop(int fd, int idle_in_seconds)
>  			buf[bytes_read] = 0;
>  			if (!strcmp(buf, "refresh")) {
>  				refresh();
> -			} else if (!strcmp(buf, "poke")) {
> -				/*
> -				 * Just a poke to keep us
> -				 * alive, nothing to do.
> -				 */
> +			} else if (starts_with(buf, "poke")) {
> +				if (buf[4] == ' ') {
> +					reply_to_poke(client_fd, buf + 5);
> +				} else {
> +					/*
> +					 * Just a poke to keep us
> +					 * alive, nothing to do.
> +					 */
> +				}
>  			} else {
>  				warning("BUG: Bogus command %s", buf);
>  			}
> diff --git a/read-cache.c b/read-cache.c
> index 1719f5a..8ec4be3 100644
> --- a/read-cache.c
> +++ b/read-cache.c
> @@ -1235,7 +1235,7 @@ int refresh_index(struct index_state *istate, unsigned int flags,
>  		if (!new) {
>  			const char *fmt;
>  
> -			if (really && cache_errno == EINVAL) {
> +			if (really || cache_errno == EINVAL) {
>  				/* If we are doing --really-refresh that
>  				 * means the index is not valid anymore.
>  				 */
> @@ -1375,11 +1375,75 @@ static int verify_hdr(const struct cache_header *hdr, unsigned long size)
>  	return 0;
>  }
>  
> +static struct untracked_cache_dir *find_untracked_cache_dir(
> +	struct untracked_cache *uc, struct untracked_cache_dir *ucd,
> +	const char *name)
> +{
> +	int component_len;
> +	const char *end;
> +	struct untracked_cache_dir *dir;
> +
> +	if (!*name)
> +		return ucd;
> +
> +	end = strchr(name, '/');
> +	if (end)
> +		component_len = end - name;
> +	else
> +		component_len = strlen(name);
> +
> +	dir = lookup_untracked(uc, ucd, name, component_len);
> +	if (dir)
> +		return find_untracked_cache_dir(uc, dir, name + component_len + 1);
> +
> +	return NULL;
> +}
> +
>  static void mark_no_watchman(size_t pos, void *data)
>  {
>  	struct index_state *istate = data;
> +	struct cache_entry *ce = istate->cache[pos];
> +	struct strbuf sb = STRBUF_INIT;
> +	char *c;
> +	struct untracked_cache_dir *dir;
> +
>  	assert(pos < istate->cache_nr);
> -	istate->cache[pos]->ce_flags |= CE_WATCHMAN_DIRTY;
> +	ce->ce_flags |= CE_WATCHMAN_DIRTY;
> +
> +	if (!istate->untracked || !istate->untracked->root)
> +		return;
> +
> +	strbuf_add(&sb, ce->name, ce_namelen(ce));
> +
> +	for (c = sb.buf + sb.len - 1; c > sb.buf; c--) {
> +		if (*c == '/') {
> +			strbuf_setlen(&sb, c - sb.buf);
> +			break;
> +		}
> +	}
> +
> +	if (c == sb.buf)
> +		strbuf_setlen(&sb, 0);
> +
> +	dir = find_untracked_cache_dir(istate->untracked,
> +				       istate->untracked->root, sb.buf);
> +	if (dir)
> +		dir->valid = 0;
> +
> +	strbuf_release(&sb);
> +}
> +
> +static int mark_untracked_invalid(struct string_list_item *item, void *uc)
> +{
> +	struct untracked_cache *untracked = uc;
> +	struct untracked_cache_dir *dir;
> +
> +	dir = find_untracked_cache_dir(untracked, untracked->root,
> +				       item->string);
> +	if (dir)
> +		dir->valid = 0;
> +
> +	return 0;
>  }
>  
>  static int read_watchman_ext(struct index_state *istate, const void *data,
> @@ -1409,10 +1473,24 @@ static int read_watchman_ext(struct index_state *istate, const void *data,
>  	ewah_each_bit(bitmap, mark_no_watchman, istate);
>  	ewah_free(bitmap);
>  
> -	/*
> -	 * TODO: update the untracked cache from the untracked data in this
> -	 * extension.
> -	 */
> +	if (istate->untracked && istate->untracked->root) {
> +		int i;
> +		const char *untracked;
> +
> +		untracked = (const char *)data + len + 8 + bitmap_size;
> +		for (i = 0; i < untracked_nr; ++i) {
> +			int len = strlen(untracked);
> +			string_list_append(&istate->untracked->invalid_untracked,
> +					   untracked);
> +			untracked += len + 1;
> +		}
> +
> +		for_each_string_list(&istate->untracked->invalid_untracked,
> +			 mark_untracked_invalid, istate->untracked);
> +
> +		if (untracked_nr)
> +			istate->cache_changed |= WATCHMAN_CHANGED;
> +	}
>  	return 0;
>  }
>  
> @@ -1645,29 +1723,88 @@ static void post_read_index_from(struct index_state *istate)
>  	tweak_untracked_cache(istate);
>  }
>  
> +/* in ms */
> +#define WATCHMAN_TIMEOUT 1000
> +
> +static int poke_and_wait_for_reply(int fd)
> +{
> +	int ret = -1;
> +	struct pollfd pollfd;
> +	int bytes_read;
> +	char reply_buf[4096];
> +	const char *requested_capabilities = "";
> +
> +#ifdef USE_WATCHMAN
> +	requested_capabilities = "watchman";
> +#endif
> +
> +	if (fd < 0)
> +		return -1;
> +
> +	if (packet_write_gently(fd, "poke %d %s", getpid(), requested_capabilities))

So, adding the empty capabilities (and, more importantly, the
separating space) is not so much 'doesn't hurt' as
'prevents a core-dump!' ;-)

> +		return -1;
> +	if (packet_flush_gently(fd))
> +		return -1;

And yes, I'd forgotten about the 'maybe sometime in the future, we
could buffer the packets' ...

ATB,
Ramsay Jones

  reply	other threads:[~2016-05-13 20:17 UTC|newest]

Thread overview: 33+ messages / expand[flat|nested]  mbox.gz  Atom feed  top
2016-05-12 20:19 [PATCH v10 00/20] index-helper/watchman David Turner
2016-05-12 20:19 ` [PATCH v10 01/20] read-cache.c: fix constness of verify_hdr() David Turner
2016-05-12 20:19 ` [PATCH v10 02/20] read-cache: allow to keep mmap'd memory after reading David Turner
2016-05-12 20:19 ` [PATCH v10 03/20] pkt-line: add gentle version of packet_write David Turner
2016-05-12 21:14   ` Junio C Hamano
2016-05-12 20:19 ` [PATCH v10 04/20] index-helper: new daemon for caching index and related stuff David Turner
2016-05-12 20:20 ` [PATCH v10 05/20] index-helper: add --strict David Turner
2016-05-12 20:20 ` [PATCH v10 06/20] daemonize(): set a flag before exiting the main process David Turner
2016-05-12 20:20 ` [PATCH v10 07/20] index-helper: add --detach David Turner
2016-05-12 20:20 ` [PATCH v10 08/20] index-helper: log warnings David Turner
2016-05-12 20:20 ` [PATCH v10 09/20] read-cache: add watchman 'WAMA' extension David Turner
2016-05-12 20:20 ` [PATCH v10 10/20] watchman: support watchman to reduce index refresh cost David Turner
2016-05-12 20:20 ` [PATCH v10 11/20] index-helper: use watchman to avoid refreshing index with lstat() David Turner
2016-05-12 23:10   ` Ramsay Jones
2016-05-13 17:47     ` David Turner
2016-05-13 18:27     ` [PATCH] " David Turner
2016-05-13 20:17       ` Ramsay Jones [this message]
2016-05-13 21:16         ` [PATCH v10 ter] " David Turner
2016-05-12 20:20 ` [PATCH v10 12/20] update-index: enable/disable watchman support David Turner
2016-05-12 20:20 ` [PATCH v10 13/20] unpack-trees: preserve index extensions David Turner
2016-05-12 20:20 ` [PATCH v10 14/20] watchman: add a config option to enable the extension David Turner
2016-05-12 20:20 ` [PATCH v10 15/20] index-helper: kill mode David Turner
2016-05-12 20:20 ` [PATCH v10 16/20] index-helper: don't run if already running David Turner
2016-05-12 20:20 ` [PATCH v10 17/20] index-helper: autorun mode David Turner
2016-05-12 20:20 ` [PATCH v10 18/20] index-helper: optionally automatically run David Turner
2016-05-12 20:20 ` [PATCH v10 19/20] trace: measure where the time is spent in the index-heavy operations David Turner
2016-05-12 20:20 ` [PATCH v10 20/20] untracked-cache: config option David Turner
2016-05-15  9:43   ` Duy Nguyen
2016-05-16 18:03     ` David Turner
2016-05-14 13:14 ` [PATCH v10 00/20] index-helper/watchman Dennis Kaarsemaker
2016-05-19 19:08 ` David Turner
2016-05-19 20:11   ` Junio C Hamano
2016-05-19 20:30     ` David Turner

Reply instructions:

You may reply publicly to this message via plain-text email
using any one of the following methods:

* Save the following mbox file, import it into your mail client,
  and reply-to-all from there: mbox

  Avoid top-posting and favor interleaved quoting:
  https://en.wikipedia.org/wiki/Posting_style#Interleaved_style

* Reply using the --to, --cc, and --in-reply-to
  switches of git-send-email(1):

  git send-email \
    --in-reply-to=5736366D.6080706@ramsayjones.plus.com \
    --to=ramsay@ramsayjones.plus.com \
    --cc=dturner@twopensource.com \
    --cc=git@vger.kernel.org \
    --cc=pclouds@gmail.com \
    /path/to/YOUR_REPLY

  https://kernel.org/pub/software/scm/git/docs/git-send-email.html

* If your mail client supports setting the In-Reply-To header
  via mailto: links, try the mailto: link

  Be sure your reply has a Subject: header at the top and a blank line
  before the message body.
This is a public inbox, see mirroring instructions
for how to clone and mirror all data and code used for this inbox;
as well as URLs for NNTP newsgroup(s).