
Re: [PATCH v5 2/5] arm/irq: Migrate IRQs during CPU up/down operations


  • To: Mykyta Poturai <Mykyta_Poturai@xxxxxxxx>
  • From: Bertrand Marquis <Bertrand.Marquis@xxxxxxx>
  • Date: Wed, 4 Feb 2026 14:20:22 +0000
  • Cc: "xen-devel@xxxxxxxxxxxxxxxxxxxx" <xen-devel@xxxxxxxxxxxxxxxxxxxx>, Stefano Stabellini <sstabellini@xxxxxxxxxx>, Julien Grall <julien@xxxxxxx>, Michal Orzel <michal.orzel@xxxxxxx>, Volodymyr Babchuk <Volodymyr_Babchuk@xxxxxxxx>
  • Delivery-date: Wed, 04 Feb 2026 14:21:48 +0000
  • List-id: Xen developer discussion <xen-devel.lists.xenproject.org>
  • Thread-topic: [PATCH v5 2/5] arm/irq: Migrate IRQs during CPU up/down operations

Hi Mykyta.

> On 13 Jan 2026, at 09:45, Mykyta Poturai <Mykyta_Poturai@xxxxxxxx> wrote:
> 
> Move IRQs from dying CPU to the online ones when a CPU is getting
> offlined. When onlining, rebalance all IRQs in a round-robin fashion.
> Guest-bound IRQs are already handled by the scheduler in the process of
> moving vCPUs to active pCPUs, so we only need to handle IRQs used by Xen
> itself.
> 
> Signed-off-by: Mykyta Poturai <mykyta_poturai@xxxxxxxx>
> ---
> v4->v5:
> * handle CPU onlining as well
> * more comments
> * fix crash when ESPI is disabled
> * don't assume CPU 0 is a boot CPU
> * use unsigned int for irq number
> * remove assumption that all irqs are bound to CPU 0 by default from the
>  commit message
> 
> v3->v4:
> * patch introduced
> ---
> xen/arch/arm/include/asm/irq.h |  2 ++
> xen/arch/arm/irq.c             | 54 ++++++++++++++++++++++++++++++++++
> xen/arch/arm/smpboot.c         |  6 ++++
> 3 files changed, 62 insertions(+)
> 
> diff --git a/xen/arch/arm/include/asm/irq.h b/xen/arch/arm/include/asm/irq.h
> index 09788dbfeb..a0250bac85 100644
> --- a/xen/arch/arm/include/asm/irq.h
> +++ b/xen/arch/arm/include/asm/irq.h
> @@ -126,6 +126,8 @@ bool irq_type_set_by_domain(const struct domain *d);
> void irq_end_none(struct irq_desc *irq);
> #define irq_end_none irq_end_none
> 
> +void rebalance_irqs(unsigned int from, bool up);
> +
> #endif /* _ASM_HW_IRQ_H */
> /*
>  * Local variables:
> diff --git a/xen/arch/arm/irq.c b/xen/arch/arm/irq.c
> index 7204bc2b68..a32dc729f8 100644
> --- a/xen/arch/arm/irq.c
> +++ b/xen/arch/arm/irq.c
> @@ -158,6 +158,58 @@ static int init_local_irq_data(unsigned int cpu)
>     return 0;
> }
> 
> +static int cpu_next;
> +
> +static void balance_irq(int irq, unsigned int from, bool up)
> +{
> +    struct irq_desc *desc = irq_to_desc(irq);
> +    unsigned long flags;
> +
> +    ASSERT(!cpumask_empty(&cpu_online_map));
> +
> +    spin_lock_irqsave(&desc->lock, flags);
> +    if ( likely(!desc->action) )
> +        goto out;
> +
> +    if ( likely(test_bit(_IRQ_GUEST, &desc->status) ||
> +                test_bit(_IRQ_MOVE_PENDING, &desc->status)) )
> +        goto out;
> +
> +    /*
> +     * Setting affinity to a mask of multiple CPUs causes the GIC drivers to
> +     * select one CPU from that mask. If the dying CPU was included in the IRQ's
> +     * affinity mask, we cannot determine exactly which CPU the interrupt is
> +     * currently routed to, as GIC drivers lack a concrete get_affinity API. So
> +     * to be safe we must reroute it to a new, definitely online, CPU. In the
> +     * case of a CPU going down, we move only the interrupts that could reside on
> +     * it. Otherwise, we rearrange all interrupts in a round-robin fashion.
> +     */
> +    if ( !up && !cpumask_test_cpu(from, desc->affinity) )
> +        goto out;

I am a bit lost on what you are trying to do in the case where a CPU
is coming up: it looks like you are changing the affinity of all
interrupts in that case and cycling everything.
Is that really what is expected?
If affinity was set by a VM on its interrupts, I would not expect
Xen to round-robin everything each time a CPU comes up.
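
To make the question concrete, the kind of restriction I would have
expected on the CPU-up path is something like the below, purely as an
illustration (the cpumask_weight()/cpumask_intersects() condition is
only a placeholder for whatever criterion is actually intended):

    /* Illustration only: on CPU up, leave alone IRQs already pinned to a
     * single CPU that is still online, and only re-spread the ones whose
     * target was picked by Xen itself. */
    if ( up && cpumask_weight(desc->affinity) == 1 &&
         cpumask_intersects(desc->affinity, &cpu_online_map) )
        goto out;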

> +
> +    cpu_next = cpumask_cycle(cpu_next, &cpu_online_map);
> +    irq_set_affinity(desc, cpumask_of(cpu_next));
> +
> +out:
> +    spin_unlock_irqrestore(&desc->lock, flags);
> +}
> +
> +void rebalance_irqs(unsigned int from, bool up)
> +{
> +    int irq;
> +
> +    if ( cpumask_empty(&cpu_online_map) )
> +        return;
> +
> +    for ( irq = NR_LOCAL_IRQS; irq < NR_IRQS; irq++ )
> +        balance_irq(irq, from, up);
> +
> +#ifdef CONFIG_GICV3_ESPI
> +    for ( irq = ESPI_BASE_INTID; irq < ESPI_MAX_INTID; irq++ )
> +        balance_irq(irq, from, up);
> +#endif
> +}
> +
> static int cpu_callback(struct notifier_block *nfb, unsigned long action,
>                         void *hcpu)
> {
> @@ -172,6 +224,8 @@ static int cpu_callback(struct notifier_block *nfb, unsigned long action,
>             printk(XENLOG_ERR "Unable to allocate local IRQ for CPU%u\n",
>                    cpu);
>         break;
> +    case CPU_ONLINE:
> +        rebalance_irqs(cpu, true);
>     }
> 
>     return notifier_from_errno(rc);
> diff --git a/xen/arch/arm/smpboot.c b/xen/arch/arm/smpboot.c
> index 7f3cfa812e..e1b9f94458 100644
> --- a/xen/arch/arm/smpboot.c
> +++ b/xen/arch/arm/smpboot.c
> @@ -425,6 +425,12 @@ void __cpu_disable(void)
> 
>     smp_mb();
> 
> +    /*
> +     * Now that the interrupts are cleared and the CPU marked as offline,
> +     * move interrupts out of it
> +     */
> +    rebalance_irqs(cpu, false);
> +

I would expect this to only be useful when HOTPLUG is enabled. Maybe
we could have a static inline that does nothing when HOTPLUG is not
on, so that this call only does something when HOTPLUG is enabled?
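
As a minimal sketch of that idea (CONFIG_HOTPLUG_CPU below is only a
placeholder for whatever Kconfig symbol ends up guarding CPU hotplug
on Arm), the declaration in asm/irq.h could become:

    #ifdef CONFIG_HOTPLUG_CPU   /* placeholder option name */
    void rebalance_irqs(unsigned int from, bool up);
    #else
    static inline void rebalance_irqs(unsigned int from, bool up) {}
    #endif

so the call in __cpu_disable() compiles away when hotplug support is
not built.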

Cheers
Bertrand

>     /* Return to caller; eventually the IPI mechanism will unwind and the 
>      * scheduler will drop to the idle loop, which will call stop_cpu(). */
> }
> -- 
> 2.51.2




 

