public inbox for kvm@vger.kernel.org
 help / color / mirror / Atom feed
From: Binbin Wu <binbin.wu@linux.intel.com>
To: Jason Gunthorpe <jgg@nvidia.com>
Cc: Anthony Krowiak <akrowiak@linux.ibm.com>,
	Alex Williamson <alex.williamson@redhat.com>,
	Bagas Sanjaya <bagasdotme@gmail.com>,
	Lu Baolu <baolu.lu@linux.intel.com>,
	Chaitanya Kulkarni <chaitanyak@nvidia.com>,
	Cornelia Huck <cohuck@redhat.com>,
	Jonathan Corbet <corbet@lwn.net>,
	Daniel Jordan <daniel.m.jordan@oracle.com>,
	David Gibson <david@gibson.dropbear.id.au>,
	Eric Auger <eric.auger@redhat.com>,
	Eric Farman <farman@linux.ibm.com>,
	iommu@lists.linux.dev, Jason Wang <jasowang@redhat.com>,
	Jean-Philippe Brucker <jean-philippe@linaro.org>,
	Jason Herne <jjherne@linux.ibm.com>,
	Joao Martins <joao.m.martins@oracle.com>,
	Kevin Tian <kevin.tian@intel.com>,
	kvm@vger.kernel.org, Lixiao Yang <lixiao.yang@intel.com>,
	Matthew Rosato <mjrosato@linux.ibm.com>,
	"Michael S. Tsirkin" <mst@redhat.com>,
	Nicolin Chen <nicolinc@nvidia.com>,
	Halil Pasic <pasic@linux.ibm.com>,
	Niklas Schnelle <schnelle@linux.ibm.com>,
	Shameerali Kolothum Thodi  <shameerali.kolothum.thodi@huawei.com>,
	Yi Liu <yi.l.liu@intel.com>, Yu He <yu.he@intel.com>,
	Keqian Zhu <zhukeqian1@huawei.com>
Subject: Re: [PATCH v6 08/19] iommufd: PFN handling for iopt_pages
Date: Tue, 6 Dec 2022 20:36:20 +0800	[thread overview]
Message-ID: <235bce13-9855-940f-d43c-cec60f0714dc@linux.intel.com> (raw)
In-Reply-To: <8-v6-a196d26f289e+11787-iommufd_jgg@nvidia.com>


On 11/30/2022 4:29 AM, Jason Gunthorpe wrote:
> +
> +/* pfn_reader_user is just the pin_user_pages() path */
> +struct pfn_reader_user {
> +	struct page **upages;
> +	size_t upages_len;
> +	unsigned long upages_start;
> +	unsigned long upages_end;
> +	unsigned int gup_flags;
> +	/*
> +	 * 1 means mmget() and mmap_read_lock(), 0 means only mmget(), -1 is
> +	 * neither
> +	 */
> +	int locked;
> +};
> +
> +static void pfn_reader_user_init(struct pfn_reader_user *user,
> +				 struct iopt_pages *pages)
> +{
> +	user->upages = NULL;
> +	user->upages_start = 0;
> +	user->upages_end = 0;
> +	user->locked = -1;
> +
> +	if (pages->writable) {
> +		user->gup_flags = FOLL_LONGTERM | FOLL_WRITE;
> +	} else {
> +		/* Still need to break COWs on read */
> +		user->gup_flags = FOLL_LONGTERM | FOLL_FORCE | FOLL_WRITE;
> +	}
> +}
> +
> +static void pfn_reader_user_destroy(struct pfn_reader_user *user,
> +				    struct iopt_pages *pages)
> +{
> +	if (user->locked != -1) {
> +		if (user->locked)
> +			mmap_read_unlock(pages->source_mm);
> +		if (pages->source_mm != current->mm)
> +			mmput(pages->source_mm);
> +		user->locked = 0;

Would setting it back to -1 be more consistent with the documented meaning of
"locked" (-1 means neither mmget() nor mmap_read_lock() is held)?

Admittedly the value doesn't matter here, since pfn_reader_user is at the end
of its lifecycle.



> +	}
> +
> +	kfree(user->upages);
> +	user->upages = NULL;
> +}
> +
> +static int pfn_reader_user_pin(struct pfn_reader_user *user,
> +			       struct iopt_pages *pages,
> +			       unsigned long start_index,
> +			       unsigned long last_index)
> +{
> +	bool remote_mm = pages->source_mm != current->mm;
> +	unsigned long npages;
> +	uintptr_t uptr;
> +	long rc;
> +
> +	if (!user->upages) {
> +		/* All undone in pfn_reader_destroy() */
> +		user->upages_len =
> +			(last_index - start_index + 1) * sizeof(*user->upages);
> +		user->upages = temp_kmalloc(&user->upages_len, NULL, 0);
> +		if (!user->upages)
> +			return -ENOMEM;
> +	}
> +
> +	if (user->locked == -1) {
> +		/*
> +		 * The majority of usages will run the map task within the mm
> +		 * providing the pages, so we can optimize into
> +		 * get_user_pages_fast()
> +		 */
> +		if (remote_mm) {
> +			if (!mmget_not_zero(pages->source_mm))
> +				return -EFAULT;
> +		}
> +		user->locked = 0;
> +	}
> +
> +	npages = min_t(unsigned long, last_index - start_index + 1,
> +		       user->upages_len / sizeof(*user->upages));
> +
> +	uptr = (uintptr_t)(pages->uptr + start_index * PAGE_SIZE);
> +	if (!remote_mm)
> +		rc = pin_user_pages_fast(uptr, npages, user->gup_flags,
> +					 user->upages);
> +	else {
> +		if (!user->locked) {
> +			mmap_read_lock(pages->source_mm);
> +			user->locked = 1;
> +		}
> +		/*
> +		 * FIXME: last NULL can be &pfns->locked once the GUP patch
> +		 * is merged.
> +		 */
> +		rc = pin_user_pages_remote(pages->source_mm, uptr, npages,
> +					   user->gup_flags, user->upages, NULL,
> +					   NULL);
> +	}
> +	if (rc <= 0) {
> +		if (WARN_ON(!rc))
> +			return -EFAULT;
> +		return rc;
> +	}
> +	iopt_pages_add_npinned(pages, rc);
> +	user->upages_start = start_index;
> +	user->upages_end = start_index + rc;
> +	return 0;
> +}
> +
> +/* This is the "modern" and faster accounting method used by io_uring */
> +static int incr_user_locked_vm(struct iopt_pages *pages, unsigned long npages)
> +{
> +	unsigned long lock_limit;
> +	unsigned long cur_pages;
> +	unsigned long new_pages;
> +
> +	lock_limit = task_rlimit(pages->source_task, RLIMIT_MEMLOCK) >>
> +		     PAGE_SHIFT;
> +	npages = pages->npinned - pages->last_npinned;

The passed-in value of npages is not used? It is overwritten by the assignment
above before it is ever read.


> +	do {
> +		cur_pages = atomic_long_read(&pages->source_user->locked_vm);
> +		new_pages = cur_pages + npages;
> +		if (new_pages > lock_limit)
> +			return -ENOMEM;
> +	} while (atomic_long_cmpxchg(&pages->source_user->locked_vm, cur_pages,
> +				     new_pages) != cur_pages);
> +	return 0;
> +}
> +

  parent reply	other threads:[~2022-12-06 12:37 UTC|newest]

Thread overview: 39+ messages / expand[flat|nested]  mbox.gz  Atom feed  top
2022-11-29 20:29 [PATCH v6 00/19] IOMMUFD Generic interface Jason Gunthorpe
2022-11-29 20:29 ` [PATCH v6 01/19] iommu: Add IOMMU_CAP_ENFORCE_CACHE_COHERENCY Jason Gunthorpe
2022-11-29 20:29 ` [PATCH v6 02/19] iommu: Add device-centric DMA ownership interfaces Jason Gunthorpe
2022-11-29 20:29 ` [PATCH v6 03/19] interval-tree: Add a utility to iterate over spans in an interval tree Jason Gunthorpe
2022-11-29 20:29 ` [PATCH v6 04/19] scripts/kernel-doc: support EXPORT_SYMBOL_NS_GPL() with -export Jason Gunthorpe
2022-11-29 20:29 ` [PATCH v6 05/19] iommufd: Document overview of iommufd Jason Gunthorpe
2022-11-29 20:29 ` [PATCH v6 06/19] iommufd: File descriptor, context, kconfig and makefiles Jason Gunthorpe
2022-11-30 14:02   ` Eric Auger
2022-12-04 10:58   ` Binbin Wu
2022-11-29 20:29 ` [PATCH v6 07/19] kernel/user: Allow user::locked_vm to be usable for iommufd Jason Gunthorpe
2022-11-29 20:42   ` Michael S. Tsirkin
2022-11-29 20:48     ` Jason Gunthorpe
2022-11-29 21:10       ` Michael S. Tsirkin
2022-11-29 20:29 ` [PATCH v6 08/19] iommufd: PFN handling for iopt_pages Jason Gunthorpe
2022-12-05 15:58   ` Binbin Wu
2022-12-06 20:53     ` Jason Gunthorpe
2022-12-06 12:36   ` Binbin Wu [this message]
2022-12-06 20:57     ` Jason Gunthorpe
2022-11-29 20:29 ` [PATCH v6 09/19] iommufd: Algorithms for PFN storage Jason Gunthorpe
2022-11-29 20:29 ` [PATCH v6 10/19] iommufd: Data structure to provide IOVA to PFN mapping Jason Gunthorpe
2022-11-29 20:29 ` [PATCH v6 11/19] iommufd: IOCTLs for the io_pagetable Jason Gunthorpe
2022-11-30 14:04   ` Eric Auger
2022-11-29 20:29 ` [PATCH v6 12/19] iommufd: Add a HW pagetable object Jason Gunthorpe
2022-11-29 20:29 ` [PATCH v6 13/19] iommufd: Add kAPI toward external drivers for physical devices Jason Gunthorpe
2022-11-29 20:29 ` [PATCH v6 14/19] iommufd: Add kAPI toward external drivers for kernel access Jason Gunthorpe
2022-11-29 20:29 ` [PATCH v6 15/19] iommufd: vfio container FD ioctl compatibility Jason Gunthorpe
2022-11-29 20:29 ` [PATCH v6 16/19] iommufd: Add kernel support for testing iommufd Jason Gunthorpe
2024-04-22  7:27   ` Geert Uytterhoeven
2024-04-22 11:54     ` Jason Gunthorpe
2024-04-22 12:48       ` Geert Uytterhoeven
2024-04-22 12:50         ` Jason Gunthorpe
2022-11-29 20:29 ` [PATCH v6 17/19] iommufd: Add some fault injection points Jason Gunthorpe
2022-11-29 20:29 ` [PATCH v6 18/19] iommufd: Add additional invariant assertions Jason Gunthorpe
2022-11-29 20:29 ` [PATCH v6 19/19] iommufd: Add a selftest Jason Gunthorpe
2022-11-30  7:14   ` Yi Liu
2022-11-30 13:51     ` Jason Gunthorpe
2022-11-30 17:18       ` Eric Auger
2022-12-01  0:13         ` Jason Gunthorpe
2022-12-01  4:59         ` Yi Liu

Reply instructions:

You may reply publicly to this message via plain-text email
using any one of the following methods:

* Save the following mbox file, import it into your mail client,
  and reply-to-all from there: mbox

  Avoid top-posting and favor interleaved quoting:
  https://en.wikipedia.org/wiki/Posting_style#Interleaved_style

* Reply using the --to, --cc, and --in-reply-to
  switches of git-send-email(1):

  git send-email \
    --in-reply-to=235bce13-9855-940f-d43c-cec60f0714dc@linux.intel.com \
    --to=binbin.wu@linux.intel.com \
    --cc=akrowiak@linux.ibm.com \
    --cc=alex.williamson@redhat.com \
    --cc=bagasdotme@gmail.com \
    --cc=baolu.lu@linux.intel.com \
    --cc=chaitanyak@nvidia.com \
    --cc=cohuck@redhat.com \
    --cc=corbet@lwn.net \
    --cc=daniel.m.jordan@oracle.com \
    --cc=david@gibson.dropbear.id.au \
    --cc=eric.auger@redhat.com \
    --cc=farman@linux.ibm.com \
    --cc=iommu@lists.linux.dev \
    --cc=jasowang@redhat.com \
    --cc=jean-philippe@linaro.org \
    --cc=jgg@nvidia.com \
    --cc=jjherne@linux.ibm.com \
    --cc=joao.m.martins@oracle.com \
    --cc=kevin.tian@intel.com \
    --cc=kvm@vger.kernel.org \
    --cc=lixiao.yang@intel.com \
    --cc=mjrosato@linux.ibm.com \
    --cc=mst@redhat.com \
    --cc=nicolinc@nvidia.com \
    --cc=pasic@linux.ibm.com \
    --cc=schnelle@linux.ibm.com \
    --cc=shameerali.kolothum.thodi@huawei.com \
    --cc=yi.l.liu@intel.com \
    --cc=yu.he@intel.com \
    --cc=zhukeqian1@huawei.com \
    /path/to/YOUR_REPLY

  https://kernel.org/pub/software/scm/git/docs/git-send-email.html

* If your mail client supports setting the In-Reply-To header
  via mailto: links, try the mailto: link
Be sure your reply has a Subject: header at the top and a blank line before the message body.
This is a public inbox, see mirroring instructions
for how to clone and mirror all data and code used for this inbox