[libvirt] [RFC PATCH v1 2/4] qemu: driver changes adding vNUMA vCPU hotplug support

Wim Ten Have wim.ten.have at oracle.com
Mon Oct 21 19:21:06 UTC 2019


From: Wim ten Have <wim.ten.have at oracle.com>

Add support for hot-plugging and hot-unplugging vCPUs in
vNUMA-partitioned KVM guests.
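
vCPUs are brought online and offline round-robin across the vNUMA
nodes, in whole-core steps, so that sibling guest vcpus end up on
sibling host CPUs.  For example, a guest with 2 vNUMA nodes and 2
threads per core accepts vcpu counts of 4, 6, 8, ...; a count of 5
would leave a core half populated and is therefore rejected.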

Signed-off-by: Wim ten Have <wim.ten.have at oracle.com>
Signed-off-by: Menno Lageman <menno.lageman at oracle.com>
---
 src/qemu/qemu_driver.c  |  6 ++-
 src/qemu/qemu_hotplug.c | 95 ++++++++++++++++++++++++++++++++++++++---
 2 files changed, 94 insertions(+), 7 deletions(-)
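
Notes (kept after the '---' so they stay out of the commit message):
the mapping arithmetic in qemuDomainGetNumaMappedVcpuEntry() below can
be tried out in isolation with a small standalone sketch.  The
2-node/2-threads topology and the even/odd interleaved cpumasks are
hypothetical, and next_set_bit() merely stands in for libvirt's
virBitmapNextSetBit():

    #include <stdio.h>
    #include <stdint.h>

    /* stand-in for virBitmapNextSetBit(): position of the next set
     * bit strictly after pos, or -1 if there is none */
    static int next_set_bit(uint64_t mask, int pos)
    {
        for (int i = pos + 1; i < 64; i++)
            if (mask & (1ULL << i))
                return i;
        return -1;
    }

    int main(void)
    {
        const int ncells = 2;       /* vNUMA nodes */
        const int threads = 2;      /* threads per core */
        const uint64_t cpumask[2] = {
            0x5555555555555555ULL,  /* node 0: host CPUs 0,2,4,... */
            0xaaaaaaaaaaaaaaaaULL,  /* node 1: host CPUs 1,3,5,... */
        };

        for (int vcpu = 0; vcpu < 10; vcpu++) {
            /* same arithmetic as the patch below */
            int node = (vcpu / threads) % ncells;
            int bit = ((vcpu / (threads * ncells)) * threads)
                      + (vcpu % threads);
            int pcpu = -1;

            /* walk to the bit-th set bit of the node's cpumask */
            while ((pcpu = next_set_bit(cpumask[node], pcpu)) >= 0
                   && bit--)
                ;
            printf("vcpu %d -> node %d, cpu %d\n", vcpu, node, pcpu);
        }
        return 0;
    }

For 2 nodes and 2 threads/core this prints the vcpu/node pairing shown
in the function's comment block (vcpus 0,1 on node 0, vcpus 2,3 on
node 1, vcpus 4,5 on node 0 again, ...).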

diff --git a/src/qemu/qemu_driver.c b/src/qemu/qemu_driver.c
index 71947efa4e50..e64afcb8efc9 100644
--- a/src/qemu/qemu_driver.c
+++ b/src/qemu/qemu_driver.c
@@ -4965,14 +4965,16 @@ qemuDomainSetVcpusMax(virQEMUDriverPtr driver,
         return -1;
     }
 
-    if (virDomainNumaGetCPUCountTotal(persistentDef->numa) > nvcpus) {
+    if (!virDomainVnumaIsEnabled(persistentDef->numa) &&
+        virDomainNumaGetCPUCountTotal(persistentDef->numa) > nvcpus) {
         virReportError(VIR_ERR_INVALID_ARG, "%s",
                        _("Number of CPUs in <numa> exceeds the desired "
                          "maximum vcpu count"));
         return -1;
     }
 
-    if (virDomainDefGetVcpusTopology(persistentDef, &topologycpus) == 0 &&
+    if (!virDomainVnumaIsEnabled(persistentDef->numa) &&
+        virDomainDefGetVcpusTopology(persistentDef, &topologycpus) == 0 &&
         nvcpus != topologycpus) {
         /* allow setting a valid vcpu count for the topology so an invalid
          * setting may be corrected via this API */
diff --git a/src/qemu/qemu_hotplug.c b/src/qemu/qemu_hotplug.c
index 2d47f7461f93..2d48c5bba762 100644
--- a/src/qemu/qemu_hotplug.c
+++ b/src/qemu/qemu_hotplug.c
@@ -6081,6 +6081,60 @@ qemuDomainHotplugAddVcpu(virQEMUDriverPtr driver,
 }
 
 
+/**
+ * qemuDomainGetNumaMappedVcpuEntry:
+ *
+ * For a vNUMA-partitioned guest, map a vcpu index onto
+ * its node-local vcpu entry so that guest vcpus are
+ * hot-plugged and hot-unplugged round-robin across the
+ * NUMA nodes, one whole core at a time, keeping sibling
+ * guest vcpus on sibling host CPUs.
+ *
+ * 2 NUMA node system, 2 threads/core:
+ *      +---+---+---+---+---+---+---+---+---+---+--//
+ * vcpu | 0 | 1 | 2 | 3 | 4 | 5 | 6 | 7 | 8 | 9 |...
+ *      +---+---+---+---+---+---+---+---+---+---+--//
+ * NUMA \------/ \-----/ \-----/ \-----/ \-----/ \-//
+ * node     0       1       0       1       0      ...
+ *
+ * bit    0   1   0   1   2   3   2   3   4   5  ...
+ *
+ * 4 NUMA node system, 2 threads/core:
+ *      +---+---+---+---+---+---+---+---+---+---+--//
+ * vcpu | 0 | 1 | 2 | 3 | 4 | 5 | 6 | 7 | 8 | 9 |...
+ *      +---+---+---+---+---+---+---+---+---+---+--//
+ * NUMA \------/ \-----/ \-----/ \-----/ \-----/ \-//
+ * node     0       1       2       3       0      ...
+ *
+ * bit    0   1   0   1   0   1   0   1   2   3  ...
+ *
+ */
+static ssize_t
+qemuDomainGetNumaMappedVcpuEntry(virDomainDefPtr def,
+                                 ssize_t vcpu)
+{
+    virBitmapPtr nodecpumask = NULL;
+    size_t ncells = virDomainNumaGetNodeCount(def->numa);
+    size_t threads = (def->cpu && def->cpu->threads) ? def->cpu->threads : 1;
+    ssize_t node, bit, pcpu = -1;
+
+    if (!ncells)
+        return vcpu;
+
+    node = (vcpu / threads) % ncells;
+    nodecpumask = virDomainNumaGetNodeCpumask(def->numa, node);
+
+    bit = ((vcpu / (threads * ncells)) * threads) + (vcpu % threads);
+
+    while (((pcpu = virBitmapNextSetBit(nodecpumask, pcpu)) >= 0) && bit--);
+
+    /* mask exhausted (unexpected input): fall back to the plain vcpu index */
+    pcpu = (pcpu < 0) ? vcpu : pcpu;
+
+    return pcpu;
+}
+
+
 /**
  * qemuDomainSelectHotplugVcpuEntities:
  *
@@ -6104,7 +6158,27 @@ qemuDomainSelectHotplugVcpuEntities(virDomainDefPtr def,
     qemuDomainVcpuPrivatePtr vcpupriv;
     unsigned int maxvcpus = virDomainDefGetVcpusMax(def);
     unsigned int curvcpus = virDomainDefGetVcpus(def);
-    ssize_t i;
+    ssize_t i, target;
+    size_t threads = def->cpu ? def->cpu->threads : 0;
+    size_t nnumaCell = virDomainNumaGetNodeCount(def->numa);
+    size_t minvcpus = nnumaCell * threads;
+    bool hasVnuma = virDomainVnumaIsEnabled(def->numa);
+
+    /* If an SMT topology is in place, check that the number of vcpus
+     * meets the following constraints:
+     * - at least one whole core is in use on each vNUMA node
+     * - cores are used whole, i.e. vcpus are added and removed in
+     *   multiples of the threads-per-core count
+     */
+    if (hasVnuma && threads &&
+        (nvcpus < minvcpus || (nvcpus - minvcpus) % threads)) {
+        virReportError(VIR_ERR_CONFIG_UNSUPPORTED,
+                       _("vNUMA: guest %s configured %d vcpus setting "
+                         "does not fit the vNUMA topology for at "
+                         "least one whole core per vNUMA node."),
+                       def->name, nvcpus);
+        goto error;
+    }
 
     if (!(ret = virBitmapNew(maxvcpus)))
         return NULL;
@@ -6113,7 +6187,9 @@ qemuDomainSelectHotplugVcpuEntities(virDomainDefPtr def,
         *enable = true;
 
         for (i = 0; i < maxvcpus && curvcpus < nvcpus; i++) {
-            vcpu = virDomainDefGetVcpu(def, i);
+
+            target = qemuDomainGetNumaMappedVcpuEntry(def, i);
+            vcpu = virDomainDefGetVcpu(def, target);
             vcpupriv =  QEMU_DOMAIN_VCPU_PRIVATE(vcpu);
 
             if (vcpu->online)
@@ -6130,14 +6206,17 @@ qemuDomainSelectHotplugVcpuEntities(virDomainDefPtr def,
                                  "desired vcpu count"));
                 goto error;
             }
+            VIR_DEBUG("guest %s hotplug target vcpu = %zd\n", def->name, target);
 
-            ignore_value(virBitmapSetBit(ret, i));
+            ignore_value(virBitmapSetBit(ret, target));
         }
     } else {
         *enable = false;
 
         for (i = maxvcpus - 1; i >= 0 && curvcpus > nvcpus; i--) {
-            vcpu = virDomainDefGetVcpu(def, i);
+
+            target = qemuDomainGetNumaMappedVcpuEntry(def, i);
+            vcpu = virDomainDefGetVcpu(def, target);
             vcpupriv =  QEMU_DOMAIN_VCPU_PRIVATE(vcpu);
 
             if (!vcpu->online)
@@ -6157,8 +6236,9 @@ qemuDomainSelectHotplugVcpuEntities(virDomainDefPtr def,
                                  "desired vcpu count"));
                 goto error;
             }
+            VIR_DEBUG("guest %s hotunplug target vcpu = %zd\n", def->name, target);
 
-            ignore_value(virBitmapSetBit(ret, i));
+            ignore_value(virBitmapSetBit(ret, target));
         }
     }
 
@@ -6241,6 +6321,11 @@ qemuDomainSetVcpusConfig(virDomainDefPtr def,
     if (curvcpus == nvcpus)
         return;
 
+    if (virDomainVnumaIsEnabled(def->numa)) {
+        virDomainDefSetVcpusVnuma(def, nvcpus);
+        return;
+    }
+
     if (curvcpus < nvcpus) {
         for (i = 0; i < maxvcpus; i++) {
             vcpu = virDomainDefGetVcpu(def, i);
-- 
2.21.0
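
On a running vNUMA guest the new code paths can be exercised with
plain vcpu hotplug, e.g. (domain name hypothetical):

    virsh setvcpus vnuma-guest 6 --live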
