Xen project Mailing List

Re: [PATCH v2 4/8] vpci: add a wait operation to the vpci vcpu pending actions

To: Mykyta Poturai <Mykyta_Poturai@xxxxxxxx>, "xen-devel@xxxxxxxxxxxxxxxxxxxx" <xen-devel@xxxxxxxxxxxxxxxxxxxx>

From: Stewart Hildebrand <stewart.hildebrand@xxxxxxx>

Date: Tue, 17 Mar 2026 10:02:50 -0400

Arc-authentication-results: i=1; mx.microsoft.com 1; spf=pass (sender ip is 165.204.84.17) smtp.rcpttodomain=epam.com smtp.mailfrom=amd.com; dmarc=pass (p=quarantine sp=quarantine pct=100) action=none header.from=amd.com; dkim=none (message not signed); arc=none (0)

Arc-message-signature: i=1; a=rsa-sha256; c=relaxed/relaxed; d=microsoft.com; s=arcselector10001; h=From:Date:Subject:Message-ID:Content-Type:MIME-Version:X-MS-Exchange-AntiSpam-MessageData-ChunkCount:X-MS-Exchange-AntiSpam-MessageData-0:X-MS-Exchange-AntiSpam-MessageData-1; bh=2WnqgkijuWbeWnj3nAVyJNEqnrR8a2gTEYVrpA262Xg=; b=eOZnlR66m4NaW50Iz1B5ZgcsIwOdL4WM3UaE3DqhzZuFixe8SUUteQvPCll6jDADa4pJM9/uEnSbT3N19Dx67slSgtpqOciUefVkcxfiEW5IPChXD3hbnPLVn2WuKDdXsmCzxCldKNtSJOT2H0GpQDuXurWaR/jeYp2LpeK2yTjso4B8Ogfz5vPFoeEt91Nn1gmap2taHq4fuOP/xEZOON3nqrbVgnaduC/3IiKVZDw3DE9tQEppR2SWnJgCi7umI4X2PUiaBLgn81gk+gZUipPTgu8tWNljDA8czSKR1wXVynNbhZxXRe+ak+hNPzCjSwBe3YHiij6XY/e4g7HCPA==

Arc-seal: i=1; a=rsa-sha256; s=arcselector10001; d=microsoft.com; cv=none; b=B1NXYDbV9zjjwoa0Sx7DwBkSuM8RvDILkDjVG8XSL/QeUK+J4Hz41PIsm+hDl9Ndf9UoBTOjpZm4w9OfIAD88222GTrAeh4xKxiVPQ1BuqlhDFgnsUTZouEzN/wM5WdA1Ac2EPUs8pysF6rLzXef50XA112bN2WUuPurqJ28RWKyhlz+cCxGQ6O/A9wk1Yjvj7Xba0cOzp3WWV99vrTrHn6QHpJaZferUUtxJmhE1j7eeLLDlkOPf7dz4uoXAzw7O/wVvWHYu2ubLv1znaKPnoH68+OC0U8Y6FzcUP/El8PAgo9r/i4ZoDaQBpVq5DTFhe3TaW4ixqOl/GrCAJLORg==

Cc: Roger Pau Monné <roger.pau@xxxxxxxxxx>

Delivery-date: Tue, 17 Mar 2026 14:02:55 +0000

List-id: Xen developer discussion <xen-devel.lists.xenproject.org>

On 3/9/26 07:08, Mykyta Poturai wrote: > This allows waiting a specified number of cycles on the vcpu. Once the > wait has finished a callback is executed. > > Note that this is still not used, but introduced here in order to > simplify the complexity of the patches that actually make use of it. > > Signed-off-by: Roger Pau Monné <roger.pau@xxxxxxxxxx> > Signed-off-by: Mykyta Poturai <mykyta_poturai@xxxxxxxx> > --- > v1->v2: > * new patch > --- > xen/drivers/vpci/header.c | 125 ++++++++++++++++++++++---------------- > xen/include/xen/vpci.h | 19 ++++++ > 2 files changed, 90 insertions(+), 54 deletions(-) > > diff --git a/xen/drivers/vpci/header.c b/xen/drivers/vpci/header.c > index cb64d9b9fc..284964f0d4 100644 > --- a/xen/drivers/vpci/header.c > +++ b/xen/drivers/vpci/header.c > @@ -175,76 +175,92 @@ static void modify_decoding(const struct pci_dev *pdev, > uint16_t cmd, > > bool vpci_process_pending(struct vcpu *v) > { > - const struct pci_dev *pdev = v->vpci.pdev; > - struct vpci_header *header = NULL; > - unsigned int i; > - > - if ( !pdev ) > - return false; > - > - read_lock(&v->domain->pci_lock); > - > - if ( !pdev->vpci || (v->domain != pdev->domain) ) > + switch ( v->vpci.task ) > { > - v->vpci.pdev = NULL; > - read_unlock(&v->domain->pci_lock); > - return false; > - } > - > - header = &pdev->vpci->header; > - for ( i = 0; i < ARRAY_SIZE(header->bars); i++ ) > + case MODIFY_MEMORY: > { > - struct vpci_bar *bar = &header->bars[i]; > - struct rangeset *mem = v->vpci.bar_mem[i]; > - struct map_data data = { > - .d = v->domain, > - .map = v->vpci.cmd & PCI_COMMAND_MEMORY, > - .bar = bar, > - }; > - int rc; > + const struct pci_dev *pdev = v->vpci.memory.pdev; > + struct vpci_header *header = NULL; > + unsigned int i; > > - if ( rangeset_is_empty(mem) ) > - continue; > + if ( !pdev ) > + break; > > - rc = rangeset_consume_ranges(mem, map_range, &data); > + read_lock(&v->domain->pci_lock); > > - if ( rc == -ERESTART ) > + if ( !pdev->vpci || (v->domain != pdev->domain) ) > { > + v->vpci.memory.pdev = NULL; > read_unlock(&v->domain->pci_lock); > - return true; > + break; > } > > - if ( rc ) > + header = &pdev->vpci->header; > + for ( i = 0; i < ARRAY_SIZE(header->bars); i++ ) > { > - spin_lock(&pdev->vpci->lock); > - /* Disable memory decoding unconditionally on failure. */ > - modify_decoding(pdev, v->vpci.cmd & ~PCI_COMMAND_MEMORY, > - false); > - spin_unlock(&pdev->vpci->lock); > + struct vpci_bar *bar = &header->bars[i]; > + struct rangeset *mem = v->vpci.bar_mem[i]; > + struct map_data data = { > + .d = v->domain, > + .map = v->vpci.memory.cmd & PCI_COMMAND_MEMORY, > + .bar = bar, > + }; > + int rc; > + > + if ( rangeset_is_empty(mem) ) > + continue; > > - /* Clean all the rangesets */ > - for ( i = 0; i < ARRAY_SIZE(header->bars); i++ ) > - if ( !rangeset_is_empty(v->vpci.bar_mem[i]) ) > - rangeset_purge(v->vpci.bar_mem[i]); > + rc = rangeset_consume_ranges(mem, map_range, &data); > > - v->vpci.pdev = NULL; > + if ( rc == -ERESTART ) > + { > + read_unlock(&v->domain->pci_lock); > + return true; > + } > > - read_unlock(&v->domain->pci_lock); > + if ( rc ) > + { > + spin_lock(&pdev->vpci->lock); > + /* Disable memory decoding unconditionally on failure. */ > + modify_decoding(pdev, v->vpci.memory.cmd & > ~PCI_COMMAND_MEMORY, > + false); > + spin_unlock(&pdev->vpci->lock); > + > + /* Clean all the rangesets */ > + for ( i = 0; i < ARRAY_SIZE(header->bars); i++ ) > + if ( !rangeset_is_empty(v->vpci.bar_mem[i]) ) > + rangeset_purge(v->vpci.bar_mem[i]); > + > + v->vpci.memory.pdev = NULL; > + > + read_unlock(&v->domain->pci_lock); > > - if ( !is_hardware_domain(v->domain) ) > - domain_crash(v->domain); > + if ( !is_hardware_domain(v->domain) ) > + domain_crash(v->domain); > > - return false; > + break; > + } > } > - } > - v->vpci.pdev = NULL; > + v->vpci.memory.pdev = NULL; > > - spin_lock(&pdev->vpci->lock); > - modify_decoding(pdev, v->vpci.cmd, v->vpci.rom_only); > - spin_unlock(&pdev->vpci->lock); > + spin_lock(&pdev->vpci->lock); > + modify_decoding(pdev, v->vpci.memory.cmd, v->vpci.memory.rom_only); > + spin_unlock(&pdev->vpci->lock); > > - read_unlock(&v->domain->pci_lock); > + read_unlock(&v->domain->pci_lock); > + > + break; > + } Nit: this is a lot of churn for a relatively small number of changes. Could the indentation level be retained (reducing churn) by putting the block in a new function? > + case WAIT: > + if ( NOW() < v->vpci.wait.end ) > + return true; > + v->vpci.wait.callback(v->vpci.wait.data); > + break; > + case NONE: > + return false; > + } > > + v->vpci.task = NONE; > return false; > } > > @@ -295,9 +311,10 @@ static void defer_map(const struct pci_dev *pdev, > uint16_t cmd, bool rom_only) > * is mapped. This can lead to parallel mapping operations being > * started for the same device if the domain is not well-behaved. > */ > - curr->vpci.pdev = pdev; > - curr->vpci.cmd = cmd; > - curr->vpci.rom_only = rom_only; > + curr->vpci.memory.pdev = pdev; > + curr->vpci.memory.cmd = cmd; > + curr->vpci.memory.rom_only = rom_only; > + curr->vpci.task = MODIFY_MEMORY; > /* > * Raise a scheduler softirq in order to prevent the guest from resuming > * execution with pending mapping operations, to trigger the invocation > diff --git a/xen/include/xen/vpci.h b/xen/include/xen/vpci.h > index fa654545e5..47cdb54d42 100644 > --- a/xen/include/xen/vpci.h > +++ b/xen/include/xen/vpci.h > @@ -212,7 +212,26 @@ struct vpci_vcpu { > /* Per-vcpu structure to store state while {un}mapping of PCI BARs. */ > const struct pci_dev *pdev; pdev can now be removed from here > #ifdef __XEN__ > + enum { > + NONE, > + MODIFY_MEMORY, > + WAIT, > + } task; > struct rangeset *bar_mem[PCI_HEADER_NORMAL_NR_BARS + 1]; > + union { > + struct { > + /* Store state while {un}mapping of PCI BARs. */ > + const struct pci_dev *pdev; > + uint16_t cmd; > + bool rom_only : 1; > + } memory; > + struct { > + /* Store wait state. */ > + s_time_t end; > + void (*callback)(void *); > + void *data; > + } wait; > + }; > #endif > uint16_t cmd; > bool rom_only : 1; cmd and rom_only can be removed from here

©2013 Xen Project, A Linux Foundation Collaborative Project. All Rights Reserved.
Linux Foundation is a registered trademark of The Linux Foundation.
Xen Project is a trademark of The Linux Foundation.