render / rpms / libvirt

Forked from rpms/libvirt 11 months ago
Clone
99cbc7
From 6013f8d130b617ab0ff14075e225b4bb8836702e Mon Sep 17 00:00:00 2001
99cbc7
Message-Id: <6013f8d130b617ab0ff14075e225b4bb8836702e@dist-git>
99cbc7
From: Bing Niu <bing.niu@intel.com>
99cbc7
Date: Mon, 15 Apr 2019 17:32:49 +0200
99cbc7
Subject: [PATCH] util: Add MBA allocation to virresctrl
99cbc7
MIME-Version: 1.0
99cbc7
Content-Type: text/plain; charset=UTF-8
99cbc7
Content-Transfer-Encoding: 8bit
99cbc7
99cbc7
Add memory bandwidth allocation support to virresctrl class.
99cbc7
Introducing virResctrlAllocMemBW which is used for allocating memory
99cbc7
bandwidth. Following virResctrlAllocPerType, it also employs a
99cbc7
nested sparse array to indicate whether allocation is available for
99cbc7
particular last level cache.
99cbc7
99cbc7
Signed-off-by: Bing Niu <bing.niu@intel.com>
99cbc7
Reviewed-by: John Ferlan <jferlan@redhat.com>
99cbc7
(cherry picked from commit 4c727dacbf1bd2a8c4797daf6192b81b85f872f1)
99cbc7
99cbc7
Resolves: https://bugzilla.redhat.com/show_bug.cgi?id=1468650
99cbc7
99cbc7
Signed-off-by: Pavel Hrdina <phrdina@redhat.com>
99cbc7
Message-Id: <6c5c1d7dfd4415699a0bf7a5461c99e915dfea1b.1555342313.git.phrdina@redhat.com>
99cbc7
Reviewed-by: Ján Tomko <jtomko@redhat.com>
99cbc7
---
99cbc7
 src/util/virresctrl.c | 63 ++++++++++++++++++++++++++++++++++++++++---
99cbc7
 1 file changed, 59 insertions(+), 4 deletions(-)
99cbc7
99cbc7
diff --git a/src/util/virresctrl.c b/src/util/virresctrl.c
99cbc7
index f454868f1e..8a25798f7d 100644
99cbc7
--- a/src/util/virresctrl.c
99cbc7
+++ b/src/util/virresctrl.c
99cbc7
@@ -36,9 +36,9 @@ VIR_LOG_INIT("util.virresctrl")
99cbc7
 
99cbc7
 
99cbc7
 /* Resctrl is short for Resource Control.  It might be implemented for various
99cbc7
- * resources, but at the time of this writing this is only supported for cache
99cbc7
- * allocation technology (aka CAT).  Hence the reson for leaving 'Cache' out of
99cbc7
- * all the structure and function names for now (can be added later if needed.
99cbc7
+ * resources. Currently this supports cache allocation technology (aka CAT) and
99cbc7
+ * memory bandwidth allocation (aka MBA). More resources technologies may be
99cbc7
+ * added in the future.
99cbc7
  */
99cbc7
 
99cbc7
 
99cbc7
@@ -89,6 +89,9 @@ typedef virResctrlAllocPerType *virResctrlAllocPerTypePtr;
99cbc7
 typedef struct _virResctrlAllocPerLevel virResctrlAllocPerLevel;
99cbc7
 typedef virResctrlAllocPerLevel *virResctrlAllocPerLevelPtr;
99cbc7
 
99cbc7
+typedef struct _virResctrlAllocMemBW virResctrlAllocMemBW;
99cbc7
+typedef virResctrlAllocMemBW *virResctrlAllocMemBWPtr;
99cbc7
+
99cbc7
 
99cbc7
 /* Class definitions and initializations */
99cbc7
 static virClassPtr virResctrlInfoClass;
99cbc7
@@ -180,7 +183,10 @@ virResctrlInfoDispose(void *obj)
99cbc7
  * consequently a directory under /sys/fs/resctrl).  Since it can have multiple
99cbc7
  * parts of multiple caches allocated it is represented as bunch of nested
99cbc7
  * sparse arrays (by sparse I mean array of pointers so that each might be NULL
99cbc7
- * in case there is no allocation for that particular one (level, cache, ...)).
99cbc7
+ * in case there is no allocation for that particular cache allocation (level,
99cbc7
+ * cache, ...) or memory allocation for particular node).
99cbc7
+ *
99cbc7
+ * =====Cache allocation technology (CAT)=====
99cbc7
  *
99cbc7
  * Since one allocation can be made for caches on different levels, the first
99cbc7
  * nested sparse array is of types virResctrlAllocPerLevel.  For example if you
99cbc7
@@ -205,6 +211,17 @@ virResctrlInfoDispose(void *obj)
99cbc7
  * all of them.  While doing that we store the bitmask in a sparse array of
99cbc7
  * virBitmaps named `masks` indexed the same way as `sizes`.  The upper bounds
99cbc7
  * of the sparse arrays are stored in nmasks or nsizes, respectively.
99cbc7
+ + *
99cbc7
+ * =====Memory Bandwidth allocation technology (MBA)=====
99cbc7
+ *
99cbc7
+ * The memory bandwidth allocation support in virResctrlAlloc works in the
99cbc7
+ * same fashion as CAT. However, memory bandwidth controller doesn't have a
99cbc7
+ * hierarchy organization as cache, each node have one memory bandwidth
99cbc7
+ * controller to memory bandwidth distribution. The number of memory bandwidth
99cbc7
+ * controller is identical with number of last level cache. So MBA also employs
99cbc7
+ * a sparse array to represent whether a memory bandwidth allocation happens
99cbc7
+ * on corresponding node. The available memory controller number is collected
99cbc7
+ * in 'virResctrlInfo'.
99cbc7
  */
99cbc7
 struct _virResctrlAllocPerType {
99cbc7
     /* There could be bool saying whether this is set or not, but since everything
99cbc7
@@ -225,12 +242,24 @@ struct _virResctrlAllocPerLevel {
99cbc7
      * VIR_CACHE_TYPE_LAST number of items */
99cbc7
 };
99cbc7
 
99cbc7
+/*
99cbc7
+ * virResctrlAllocMemBW represents one memory bandwidth allocation.
99cbc7
+ * Since it can have several last level caches in a NUMA system, it is
99cbc7
+ * also represented as a nested sparse arrays as virRestrlAllocPerLevel.
99cbc7
+ */
99cbc7
+struct _virResctrlAllocMemBW {
99cbc7
+    unsigned int **bandwidths;
99cbc7
+    size_t nbandwidths;
99cbc7
+};
99cbc7
+
99cbc7
 struct _virResctrlAlloc {
99cbc7
     virObject parent;
99cbc7
 
99cbc7
     virResctrlAllocPerLevelPtr *levels;
99cbc7
     size_t nlevels;
99cbc7
 
99cbc7
+    virResctrlAllocMemBWPtr mem_bw;
99cbc7
+
99cbc7
     /* The identifier (any unique string for now) */
99cbc7
     char *id;
99cbc7
     /* libvirt-generated path in /sys/fs/resctrl for this particular
99cbc7
@@ -274,6 +303,13 @@ virResctrlAllocDispose(void *obj)
99cbc7
         VIR_FREE(level);
99cbc7
     }
99cbc7
 
99cbc7
+    if (alloc->mem_bw) {
99cbc7
+        virResctrlAllocMemBWPtr mem_bw = alloc->mem_bw;
99cbc7
+        for (i = 0; i < mem_bw->nbandwidths; i++)
99cbc7
+            VIR_FREE(mem_bw->bandwidths[i]);
99cbc7
+        VIR_FREE(alloc->mem_bw);
99cbc7
+    }
99cbc7
+
99cbc7
     VIR_FREE(alloc->id);
99cbc7
     VIR_FREE(alloc->path);
99cbc7
     VIR_FREE(alloc->levels);
99cbc7
@@ -692,6 +728,9 @@ virResctrlAllocIsEmpty(virResctrlAllocPtr alloc)
99cbc7
     if (!alloc)
99cbc7
         return true;
99cbc7
 
99cbc7
+    if (alloc->mem_bw)
99cbc7
+        return false;
99cbc7
+
99cbc7
     for (i = 0; i < alloc->nlevels; i++) {
99cbc7
         virResctrlAllocPerLevelPtr a_level = alloc->levels[i];
99cbc7
 
99cbc7
@@ -1266,6 +1305,22 @@ virResctrlAllocNewFromInfo(virResctrlInfoPtr info)
99cbc7
         }
99cbc7
     }
99cbc7
 
99cbc7
+    /* set default free memory bandwidth to 100%*/
99cbc7
+    if (info->membw_info) {
99cbc7
+        if (VIR_ALLOC(ret->mem_bw) < 0)
99cbc7
+            goto error;
99cbc7
+
99cbc7
+        if (VIR_EXPAND_N(ret->mem_bw->bandwidths, ret->mem_bw->nbandwidths,
99cbc7
+                         info->membw_info->max_id + 1) < 0)
99cbc7
+            goto error;
99cbc7
+
99cbc7
+        for (i = 0; i < ret->mem_bw->nbandwidths; i++) {
99cbc7
+            if (VIR_ALLOC(ret->mem_bw->bandwidths[i]) < 0)
99cbc7
+                goto error;
99cbc7
+            *(ret->mem_bw->bandwidths[i]) = 100;
99cbc7
+        }
99cbc7
+    }
99cbc7
+
99cbc7
  cleanup:
99cbc7
     virBitmapFree(mask);
99cbc7
     return ret;
99cbc7
-- 
99cbc7
2.21.0
99cbc7