From: Anthony Liguori <anthony@codemonkey.ws>
To: Avi Kivity <avi@redhat.com>
Cc: qemu-devel@nongnu.org, kvm@vger.kernel.org
Subject: Re: [Qemu-devel] [PATCH 11/23] memory: add ioeventfd support
Date: Mon, 25 Jul 2011 14:08:20 -0500 [thread overview]
Message-ID: <4E2DBF24.20803@codemonkey.ws> (raw)
In-Reply-To: <1311602584-23409-12-git-send-email-avi@redhat.com>
On 07/25/2011 09:02 AM, Avi Kivity wrote:
> As with the rest of the memory API, the caller associates an eventfd
> with an address, and the memory API takes care of registering or
> unregistering when the address is made visible or invisible to the
> guest.
>
> Signed-off-by: Avi Kivity<avi@redhat.com>
> ---
> memory.c | 230 ++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++
> memory.h | 20 ++++++
> 2 files changed, 250 insertions(+), 0 deletions(-)
>
> diff --git a/memory.c b/memory.c
> index e4446a0..a5cde0c 100644
> --- a/memory.c
> +++ b/memory.c
> @@ -15,6 +15,7 @@
> #include "exec-memory.h"
> #include "ioport.h"
> #include "bitops.h"
> +#include "kvm.h"
> #include<assert.h>
>
> typedef struct AddrRange AddrRange;
> @@ -64,6 +65,50 @@ struct CoalescedMemoryRange {
> QTAILQ_ENTRY(CoalescedMemoryRange) link;
> };
>
> +struct MemoryRegionIoeventfd {
> + AddrRange addr;
> + bool match_data;
> + uint64_t data;
> + int fd;
> +};
> +
> +static bool memory_region_ioeventfd_before(MemoryRegionIoeventfd a,
> + MemoryRegionIoeventfd b)
> +{
> + if (a.addr.start< b.addr.start) {
> + return true;
> + } else if (a.addr.start> b.addr.start) {
> + return false;
> + } else if (a.addr.size< b.addr.size) {
> + return true;
> + } else if (a.addr.size> b.addr.size) {
> + return false;
> + } else if (a.match_data< b.match_data) {
> + return true;
> + } else if (a.match_data> b.match_data) {
> + return false;
> + } else if (a.match_data) {
> + if (a.data< b.data) {
> + return true;
> + } else if (a.data> b.data) {
> + return false;
> + }
> + }
> + if (a.fd< b.fd) {
> + return true;
> + } else if (a.fd> b.fd) {
> + return false;
> + }
> + return false;
> +}
> +
> +static bool memory_region_ioeventfd_equal(MemoryRegionIoeventfd a,
> + MemoryRegionIoeventfd b)
> +{
> + return !memory_region_ioeventfd_before(a, b)
> +&& !memory_region_ioeventfd_before(b, a);
> +}
> +
> typedef struct FlatRange FlatRange;
> typedef struct FlatView FlatView;
>
> @@ -92,6 +137,8 @@ struct AddressSpace {
> const AddressSpaceOps *ops;
> MemoryRegion *root;
> FlatView current_map;
> + int ioeventfd_nb;
> + MemoryRegionIoeventfd *ioeventfds;
> };
>
> struct AddressSpaceOps {
> @@ -99,6 +146,8 @@ struct AddressSpaceOps {
> void (*range_del)(AddressSpace *as, FlatRange *fr);
> void (*log_start)(AddressSpace *as, FlatRange *fr);
> void (*log_stop)(AddressSpace *as, FlatRange *fr);
> + void (*ioeventfd_add)(AddressSpace *as, MemoryRegionIoeventfd *fd);
> + void (*ioeventfd_del)(AddressSpace *as, MemoryRegionIoeventfd *fd);
> };
>
> #define FOR_EACH_FLAT_RANGE(var, view) \
> @@ -201,11 +250,37 @@ static void as_memory_log_stop(AddressSpace *as, FlatRange *fr)
> cpu_physical_log_stop(fr->addr.start, fr->addr.size);
> }
>
> +static void as_memory_ioeventfd_add(AddressSpace *as, MemoryRegionIoeventfd *fd)
> +{
> + int r;
> +
> + if (!fd->match_data || fd->addr.size != 4) {
> + abort();
> + }
> +
> + r = kvm_set_ioeventfd_mmio_long(fd->fd, fd->addr.start, fd->data, true);
> + if (r< 0) {
> + abort();
> + }
asserts would be friendlier.
I really dislike baking ioeventfd into this API. There is only one user
of ioeventfd in the tree.
I worry that by having things like ioeventfd in the API, we're making it
too difficult to side-step the API, which prevents future optimizations.
I'd prefer virtio-pci to have ugliness in it where it circumvented the
layering vs. having such a device-specific thing in generic code.
Regards,
Anthony Liguori
> +}
> +
> +static void as_memory_ioeventfd_del(AddressSpace *as, MemoryRegionIoeventfd *fd)
> +{
> + int r;
> +
> + r = kvm_set_ioeventfd_mmio_long(fd->fd, fd->addr.start, fd->data, false);
> + if (r< 0) {
> + abort();
> + }
> +}
> +
> static const AddressSpaceOps address_space_ops_memory = {
> .range_add = as_memory_range_add,
> .range_del = as_memory_range_del,
> .log_start = as_memory_log_start,
> .log_stop = as_memory_log_stop,
> + .ioeventfd_add = as_memory_ioeventfd_add,
> + .ioeventfd_del = as_memory_ioeventfd_del,
> };
>
> static AddressSpace address_space_memory = {
> @@ -281,9 +356,35 @@ static void as_io_range_del(AddressSpace *as, FlatRange *fr)
> isa_unassign_ioport(fr->addr.start, fr->addr.size);
> }
>
> +static void as_io_ioeventfd_add(AddressSpace *as, MemoryRegionIoeventfd *fd)
> +{
> + int r;
> +
> + if (!fd->match_data || fd->addr.size != 2) {
> + abort();
> + }
> +
> + r = kvm_set_ioeventfd_pio_word(fd->fd, fd->addr.start, fd->data, true);
> + if (r< 0) {
> + abort();
> + }
> +}
> +
> +static void as_io_ioeventfd_del(AddressSpace *as, MemoryRegionIoeventfd *fd)
> +{
> + int r;
> +
> + r = kvm_set_ioeventfd_pio_word(fd->fd, fd->addr.start, fd->data, false);
> + if (r< 0) {
> + abort();
> + }
> +}
> +
> static const AddressSpaceOps address_space_ops_io = {
> .range_add = as_io_range_add,
> .range_del = as_io_range_del,
> + .ioeventfd_add = as_io_ioeventfd_add,
> + .ioeventfd_del = as_io_ioeventfd_del,
> };
>
> static AddressSpace address_space_io = {
> @@ -382,6 +483,69 @@ static FlatView generate_memory_topology(MemoryRegion *mr)
> return view;
> }
>
> +static void address_space_add_del_ioeventfds(AddressSpace *as,
> + MemoryRegionIoeventfd *fds_new,
> + unsigned fds_new_nb,
> + MemoryRegionIoeventfd *fds_old,
> + unsigned fds_old_nb)
> +{
> + unsigned iold, inew;
> +
> + /* Generate a symmetric difference of the old and new fd sets, adding
> + * and deleting as necessary.
> + */
> +
> + iold = inew = 0;
> + while (iold< fds_old_nb || inew< fds_new_nb) {
> + if (iold< fds_old_nb
> +&& (inew == fds_new_nb
> + || memory_region_ioeventfd_before(fds_old[iold],
> + fds_new[inew]))) {
> + as->ops->ioeventfd_del(as,&fds_old[iold]);
> + ++iold;
> + } else if (inew< fds_new_nb
> +&& (iold == fds_old_nb
> + || memory_region_ioeventfd_before(fds_new[inew],
> + fds_old[iold]))) {
> + as->ops->ioeventfd_add(as,&fds_new[inew]);
> + ++inew;
> + } else {
> + ++iold;
> + ++inew;
> + }
> + }
> +}
> +
> +static void address_space_update_ioeventfds(AddressSpace *as)
> +{
> + FlatRange *fr;
> + unsigned ioeventfd_nb = 0;
> + MemoryRegionIoeventfd *ioeventfds = NULL;
> + AddrRange tmp;
> + unsigned i;
> +
> + FOR_EACH_FLAT_RANGE(fr,&as->current_map) {
> + for (i = 0; i< fr->mr->ioeventfd_nb; ++i) {
> + tmp = addrrange_shift(fr->mr->ioeventfds[i].addr,
> + fr->addr.start - fr->offset_in_region);
> + if (addrrange_intersects(fr->addr, tmp)) {
> + ++ioeventfd_nb;
> + ioeventfds = qemu_realloc(ioeventfds,
> + ioeventfd_nb * sizeof(*ioeventfds));
> + ioeventfds[ioeventfd_nb-1] = fr->mr->ioeventfds[i];
> + ioeventfds[ioeventfd_nb-1].addr = tmp;
> + }
> + }
> + }
> +
> + address_space_add_del_ioeventfds(as, ioeventfds, ioeventfd_nb,
> + as->ioeventfds, as->ioeventfd_nb);
> +
> + qemu_free(as->ioeventfds);
> + as->ioeventfds = ioeventfds;
> + as->ioeventfd_nb = ioeventfd_nb;
> +}
> +
> static void address_space_update_topology(AddressSpace *as)
> {
> FlatView old_view = as->current_map;
> @@ -434,6 +598,7 @@ static void address_space_update_topology(AddressSpace *as)
> }
> as->current_map = new_view;
> flatview_destroy(&old_view);
> + address_space_update_ioeventfds(as);
> }
>
> static void memory_region_update_topology(void)
> @@ -464,6 +629,8 @@ void memory_region_init(MemoryRegion *mr,
> QTAILQ_INIT(&mr->coalesced);
> mr->name = qemu_strdup(name);
> mr->dirty_log_mask = 0;
> + mr->ioeventfd_nb = 0;
> + mr->ioeventfds = NULL;
> }
>
> static bool memory_region_access_valid(MemoryRegion *mr,
> @@ -675,6 +842,7 @@ void memory_region_destroy(MemoryRegion *mr)
> assert(QTAILQ_EMPTY(&mr->subregions));
> memory_region_clear_coalescing(mr);
> qemu_free((char *)mr->name);
> + qemu_free(mr->ioeventfds);
> }
>
> target_phys_addr_t memory_region_size(MemoryRegion *mr)
> @@ -798,6 +966,68 @@ void memory_region_clear_coalescing(MemoryRegion *mr)
> memory_region_update_coalesced_range(mr);
> }
>
> +void memory_region_add_eventfd(MemoryRegion *mr,
> + target_phys_addr_t addr,
> + unsigned size,
> + bool match_data,
> + uint64_t data,
> + int fd)
> +{
> + MemoryRegionIoeventfd mrfd = {
> + .addr.start = addr,
> + .addr.size = size,
> + .match_data = match_data,
> + .data = data,
> + .fd = fd,
> + };
> + unsigned i;
> +
> + for (i = 0; i< mr->ioeventfd_nb; ++i) {
> + if (memory_region_ioeventfd_before(mrfd, mr->ioeventfds[i])) {
> + break;
> + }
> + }
> + ++mr->ioeventfd_nb;
> + mr->ioeventfds = qemu_realloc(mr->ioeventfds,
> + sizeof(*mr->ioeventfds) * mr->ioeventfd_nb);
> + memmove(&mr->ioeventfds[i+1],&mr->ioeventfds[i],
> + sizeof(*mr->ioeventfds) * (mr->ioeventfd_nb-1 - i));
> + mr->ioeventfds[i] = mrfd;
> + memory_region_update_topology();
> +}
> +
> +void memory_region_del_eventfd(MemoryRegion *mr,
> + target_phys_addr_t addr,
> + unsigned size,
> + bool match_data,
> + uint64_t data,
> + int fd)
> +{
> + MemoryRegionIoeventfd mrfd = {
> + .addr.start = addr,
> + .addr.size = size,
> + .match_data = match_data,
> + .data = data,
> + .fd = fd,
> + };
> + unsigned i;
> +
> + for (i = 0; i< mr->ioeventfd_nb; ++i) {
> + if (memory_region_ioeventfd_equal(mrfd, mr->ioeventfds[i])) {
> + break;
> + }
> + }
> + if (i == mr->ioeventfd_nb) {
> + abort();
> + }
> + memmove(&mr->ioeventfds[i],&mr->ioeventfds[i+1],
> + sizeof(*mr->ioeventfds) * (mr->ioeventfd_nb - (i+1)));
> + --mr->ioeventfd_nb;
> + mr->ioeventfds = qemu_realloc(mr->ioeventfds,
> + sizeof(*mr->ioeventfds)*mr->ioeventfd_nb + 1);
> + memory_region_update_topology();
> +}
> +
> static void memory_region_add_subregion_common(MemoryRegion *mr,
> target_phys_addr_t offset,
> MemoryRegion *subregion)
> diff --git a/memory.h b/memory.h
> index 4624946..e4c0ad1 100644
> --- a/memory.h
> +++ b/memory.h
> @@ -85,6 +85,7 @@ struct MemoryRegionOps {
> };
>
> typedef struct CoalescedMemoryRange CoalescedMemoryRange;
> +typedef struct MemoryRegionIoeventfd MemoryRegionIoeventfd;
>
> struct MemoryRegion {
> /* All fields are private - violators will be prosecuted */
> @@ -107,6 +108,8 @@ struct MemoryRegion {
> QTAILQ_HEAD(coalesced_ranges, CoalescedMemoryRange) coalesced;
> const char *name;
> uint8_t dirty_log_mask;
> + unsigned ioeventfd_nb;
> + MemoryRegionIoeventfd *ioeventfds;
> };
>
> struct MemoryRegionPortio {
> @@ -208,6 +211,23 @@ void memory_region_add_coalescing(MemoryRegion *mr,
> /* Disable MMIO coalescing for the region. */
> void memory_region_clear_coalescing(MemoryRegion *mr);
>
> +
> +/* Request an eventfd to be triggered when a word is written to a location */
> +void memory_region_add_eventfd(MemoryRegion *mr,
> + target_phys_addr_t addr,
> + unsigned size,
> + bool match_data,
> + uint64_t data,
> + int fd);
> +
> +/* Cancel an existing eventfd */
> +void memory_region_del_eventfd(MemoryRegion *mr,
> + target_phys_addr_t addr,
> + unsigned size,
> + bool match_data,
> + uint64_t data,
> + int fd);
> +
> /* Add a sub-region at @offset. The sub-region may not overlap with other
> * subregions (except for those explicitly marked as overlapping)
> */
next prev parent reply other threads:[~2011-07-25 19:08 UTC|newest]
Thread overview: 66+ messages / expand[flat|nested] mbox.gz Atom feed top
2011-07-25 14:02 [PATCH 00/23] Memory API, batch 1 Avi Kivity
2011-07-25 14:02 ` [PATCH 01/23] Hierarchical memory region API Avi Kivity
2011-07-25 18:41 ` [Qemu-devel] " Anthony Liguori
2011-07-26 9:35 ` Avi Kivity
2011-07-25 14:02 ` [PATCH 02/23] memory: implement dirty tracking Avi Kivity
2011-07-25 18:43 ` Anthony Liguori
2011-07-25 14:02 ` [PATCH 03/23] memory: merge adjacent segments of a single memory region Avi Kivity
2011-07-25 18:48 ` [Qemu-devel] " Anthony Liguori
2011-07-26 9:55 ` Avi Kivity
2011-07-25 14:02 ` [PATCH 04/23] Internal interfaces for memory API Avi Kivity
2011-07-25 18:49 ` [Qemu-devel] " Anthony Liguori
2011-07-25 14:02 ` [PATCH 05/23] memory: abstract address space operations Avi Kivity
2011-07-25 18:51 ` [Qemu-devel] " Anthony Liguori
2011-07-25 14:02 ` [PATCH 06/23] memory: rename MemoryRegion::has_ram_addr to ::terminates Avi Kivity
2011-07-25 18:56 ` [Qemu-devel] " Anthony Liguori
2011-07-26 9:59 ` Avi Kivity
2011-07-25 14:02 ` [PATCH 07/23] memory: late initialization of ram_addr Avi Kivity
2011-07-25 14:02 ` [PATCH 08/23] memory: I/O address space support Avi Kivity
2011-07-25 19:00 ` [Qemu-devel] " Anthony Liguori
2011-07-25 14:02 ` [PATCH 09/23] memory: add backward compatibility for old portio registration Avi Kivity
2011-07-25 19:01 ` [Qemu-devel] " Anthony Liguori
2011-07-25 14:02 ` [PATCH 10/23] memory: add backward compatibility for old mmio registration Avi Kivity
2011-07-25 19:02 ` [Qemu-devel] " Anthony Liguori
2011-07-25 14:02 ` [PATCH 11/23] memory: add ioeventfd support Avi Kivity
2011-07-25 15:16 ` [Qemu-devel] " malc
2011-07-25 15:17 ` Avi Kivity
2011-07-25 15:22 ` malc
2011-07-25 15:28 ` [Qemu-devel] " Avi Kivity
2011-07-25 15:38 ` malc
2011-07-25 15:43 ` Avi Kivity
2011-07-25 19:08 ` Anthony Liguori [this message]
2011-07-26 10:08 ` Avi Kivity
2011-07-25 14:02 ` [PATCH 12/23] memory: separate building the final memory map into two steps Avi Kivity
2011-07-25 19:12 ` [Qemu-devel] " Anthony Liguori
2011-07-26 10:43 ` Avi Kivity
2011-07-25 14:02 ` [PATCH 13/23] memory: document the memory API Avi Kivity
2011-07-25 19:15 ` [Qemu-devel] " Anthony Liguori
2011-07-26 10:44 ` Avi Kivity
2011-07-25 14:02 ` [PATCH 14/23] memory: transaction API Avi Kivity
2011-07-25 19:16 ` [Qemu-devel] " Anthony Liguori
2011-07-26 10:48 ` Avi Kivity
2011-07-26 11:39 ` Avi Kivity
2011-07-25 14:02 ` [PATCH 15/23] exec.c: initialize memory map Avi Kivity
2011-07-25 19:17 ` [Qemu-devel] " Anthony Liguori
2011-07-26 10:55 ` Avi Kivity
2011-07-25 14:02 ` [PATCH 16/23] ioport: register ranges by byte aligned addresses always Avi Kivity
2011-07-25 19:20 ` [Qemu-devel] " Anthony Liguori
2011-07-26 10:59 ` Avi Kivity
2011-07-25 14:02 ` [PATCH 17/23] pc: grab system_memory Avi Kivity
2011-07-25 19:22 ` [Qemu-devel] " Anthony Liguori
2011-07-25 14:02 ` [PATCH 18/23] pc: convert pc_memory_init() to memory API Avi Kivity
2011-07-25 19:23 ` [Qemu-devel] " Anthony Liguori
2011-07-25 14:03 ` [PATCH 19/23] pc: move global memory map out of pc_init1() and into its callers Avi Kivity
2011-07-25 20:02 ` [Qemu-devel] " Anthony Liguori
2011-07-26 11:02 ` Avi Kivity
2011-07-25 14:03 ` [PATCH 20/23] pci: pass address space to pci bus when created Avi Kivity
2011-07-25 20:03 ` Anthony Liguori
2011-07-25 14:03 ` [PATCH 21/23] pci: add MemoryRegion based BAR management API Avi Kivity
2011-07-25 20:20 ` Anthony Liguori
2011-07-26 11:06 ` Avi Kivity
2011-07-25 14:03 ` [PATCH 22/23] sysbus: add MemoryRegion based memory " Avi Kivity
2011-07-25 20:21 ` Anthony Liguori
2011-07-25 14:03 ` [PATCH 23/23] usb-ohci: convert to MemoryRegion Avi Kivity
2011-07-25 20:22 ` [Qemu-devel] " Anthony Liguori
2011-07-25 20:23 ` [PATCH 00/23] Memory API, batch 1 Anthony Liguori
2011-07-26 11:32 ` [Qemu-devel] " Avi Kivity
Reply instructions:
You may reply publicly to this message via plain-text email
using any one of the following methods:
* Save the following mbox file, import it into your mail client,
and reply-to-all from there: mbox
Avoid top-posting and favor interleaved quoting:
https://en.wikipedia.org/wiki/Posting_style#Interleaved_style
* Reply using the --to, --cc, and --in-reply-to
switches of git-send-email(1):
git send-email \
--in-reply-to=4E2DBF24.20803@codemonkey.ws \
--to=anthony@codemonkey.ws \
--cc=avi@redhat.com \
--cc=kvm@vger.kernel.org \
--cc=qemu-devel@nongnu.org \
/path/to/YOUR_REPLY
https://kernel.org/pub/software/scm/git/docs/git-send-email.html
* If your mail client supports setting the In-Reply-To header
via mailto: links, try the mailto: link
Be sure your reply has a Subject: header at the top and a blank line
before the message body.
This is a public inbox, see mirroring instructions
for how to clone and mirror all data and code used for this inbox