[Date Prev][Date Next][Thread Prev][Thread Next][Date Index][Thread Index]

Re: [PATCH v3 09/23] xen/arm: vsmmuv3: Add support for cmdqueue handling



Hi Milan,

On 31/03/2026 10:52, Milan Djokic wrote:
From: Rahul Singh <rahul.singh@xxxxxxx>

Add support for virtual cmdqueue handling for guests

This commit message is quite light. There are quite a few pitfalls with the command queue because it can be long-running, which requires some explanation of the plan to handle it.

If this is delayed for later, then it would be useful to document in the code what's missing so it is easier to know whether the vSMMUv3 implementation can be security supported (I assume this will be the goal).


Signed-off-by: Rahul Singh <rahul.singh@xxxxxxx>
Signed-off-by: Milan Djokic <milan_djokic@xxxxxxxx>
---
  xen/drivers/passthrough/arm/vsmmu-v3.c | 101 +++++++++++++++++++++++++
  1 file changed, 101 insertions(+)

diff --git a/xen/drivers/passthrough/arm/vsmmu-v3.c 
b/xen/drivers/passthrough/arm/vsmmu-v3.c
index 3ae1e62a50..02fe6a4422 100644
--- a/xen/drivers/passthrough/arm/vsmmu-v3.c
+++ b/xen/drivers/passthrough/arm/vsmmu-v3.c
@@ -1,5 +1,6 @@
  /* SPDX-License-Identifier: (GPL-2.0-or-later OR BSD-2-Clause) */
+#include <xen/guest_access.h>
  #include <xen/param.h>
  #include <xen/sched.h>
  #include <asm/mmio.h>
@@ -25,6 +26,26 @@
  /* Struct to hold the vIOMMU ops and vIOMMU type */
  extern const struct viommu_desc __read_mostly *cur_viommu;
+/* SMMUv3 command definitions */
+#define CMDQ_OP_PREFETCH_CFG    0x1
+#define CMDQ_OP_CFGI_STE        0x3
+#define CMDQ_OP_CFGI_ALL        0x4
+#define CMDQ_OP_CFGI_CD         0x5
+#define CMDQ_OP_CFGI_CD_ALL     0x6
+#define CMDQ_OP_TLBI_NH_ASID    0x11
+#define CMDQ_OP_TLBI_NH_VA      0x12
+#define CMDQ_OP_TLBI_NSNH_ALL   0x30
+#define CMDQ_OP_CMD_SYNC        0x46
+
+/* Queue Handling */
+#define Q_BASE(q)       ((q)->q_base & Q_BASE_ADDR_MASK)
+#define Q_CONS_ENT(q)   (Q_BASE(q) + Q_IDX(q, (q)->cons) * (q)->ent_size)
+#define Q_PROD_ENT(q)   (Q_BASE(q) + Q_IDX(q, (q)->prod) * (q)->ent_size)
+
+/* Helper Macros */
+#define smmu_get_cmdq_enabled(x)    FIELD_GET(CR0_CMDQEN, x)
+#define smmu_cmd_get_command(x)     FIELD_GET(CMDQ_0_OP, x)
+
  /* virtual smmu queue */
  struct arm_vsmmu_queue {
      uint64_t    q_base; /* base register */
@@ -49,8 +70,80 @@ struct virt_smmu {
      uint64_t    gerror_irq_cfg0;
      uint64_t    evtq_irq_cfg0;
      struct      arm_vsmmu_queue evtq, cmdq;
+    spinlock_t  cmd_queue_lock;
  };
+/* Queue manipulation functions */
+static bool queue_empty(struct arm_vsmmu_queue *q)
+{
+    return Q_IDX(q, q->prod) == Q_IDX(q, q->cons) &&
+           Q_WRP(q, q->prod) == Q_WRP(q, q->cons);
+}
+
+static void queue_inc_cons(struct arm_vsmmu_queue *q)
+{
+    uint32_t cons = (Q_WRP(q, q->cons) | Q_IDX(q, q->cons)) + 1;
+    q->cons = Q_OVF(q->cons) | Q_WRP(q, cons) | Q_IDX(q, cons);
+}
+
+static void dump_smmu_command(uint64_t *command)
+{
+    gdprintk(XENLOG_ERR, "cmd 0x%02llx: %016lx %016lx\n",
+             smmu_cmd_get_command(command[0]), command[0], command[1]);

I would consider using gprintk() because this could be useful even in non-production build.

+}
+static int arm_vsmmu_handle_cmds(struct virt_smmu *smmu)
+{
+    struct arm_vsmmu_queue *q = &smmu->cmdq;
+    struct domain *d = smmu->d;
+    uint64_t command[CMDQ_ENT_DWORDS];
+    paddr_t addr;
+
+    if ( !smmu_get_cmdq_enabled(smmu->cr[0]) )
+        return 0;
+
+    while ( !queue_empty(q) )
+    {
+        int ret;
+
+        addr = Q_CONS_ENT(q);
+        ret = access_guest_memory_by_gpa(d, addr, command,
+                                         sizeof(command), false);
+        if ( ret )
+            return ret;
+
+        switch ( smmu_cmd_get_command(command[0]) )
+        {
+        case CMDQ_OP_CFGI_STE:
+            break;
+        case CMDQ_OP_PREFETCH_CFG:
+        case CMDQ_OP_CFGI_CD:
+        case CMDQ_OP_CFGI_CD_ALL:
+        case CMDQ_OP_CFGI_ALL:
+        case CMDQ_OP_CMD_SYNC:

Is this empty because there is nothing to do? Or is this empty because they are not yet implemented?

+            break;
+        case CMDQ_OP_TLBI_NH_ASID:
+        case CMDQ_OP_TLBI_NSNH_ALL:
+        case CMDQ_OP_TLBI_NH_VA:
+            if ( !iommu_iotlb_flush_all(smmu->d, 1) )

This is quite a bigger hammer when the guest may only want to flush the S1 TLB for a single device. I am ok for now, but it would be good to add a TODO for optimizing it.

+                break;
+        default:
+            gdprintk(XENLOG_ERR, "vSMMUv3: unhandled command\n");
+            dump_smmu_command(command);
+            break;
+        }
+
+        if ( ret )
+        {
+            gdprintk(XENLOG_ERR,
+                     "vSMMUv3: command error %d while handling command\n",
+                     ret);
+            dump_smmu_command(command);
+        }
+        queue_inc_cons(q);
+    }
+    return 0;
+}
+
  static int vsmmuv3_mmio_write(struct vcpu *v, mmio_info_t *info,
                                register_t r, void *priv)
  {
@@ -104,9 +197,15 @@ static int vsmmuv3_mmio_write(struct vcpu *v, mmio_info_t 
*info,
          break;
case VREG32(ARM_SMMU_CMDQ_PROD):
+        spin_lock(&smmu->cmd_queue_lock);
          reg32 = smmu->cmdq.prod;
          vreg_reg32_update(&reg32, r, info);
          smmu->cmdq.prod = reg32;
+
+        if ( arm_vsmmu_handle_cmds(smmu) )
+            gdprintk(XENLOG_ERR, "error handling vSMMUv3 commands\n");
+
+        spin_unlock(&smmu->cmd_queue_lock);
          break;
case VREG32(ARM_SMMU_CMDQ_CONS):
@@ -326,6 +425,8 @@ static int vsmmuv3_init_single(struct domain *d, paddr_t 
addr, paddr_t size)
      smmu->evtq.q_base = FIELD_PREP(Q_BASE_LOG2SIZE, SMMU_EVTQS);
      smmu->evtq.ent_size = EVTQ_ENT_DWORDS * DWORDS_BYTES;
+ spin_lock_init(&smmu->cmd_queue_lock);
+
      register_mmio_handler(d, &vsmmuv3_mmio_handler, addr, size, smmu);
/* Register the vIOMMU to be able to clean it up later. */

Cheers,

--
Julien Grall




 


Rackspace

Lists.xenproject.org is hosted with RackSpace, monitoring our
servers 24x7x365 and backed by RackSpace's Fanatical Support®.