|
|
99cbc7 |
From 6013f8d130b617ab0ff14075e225b4bb8836702e Mon Sep 17 00:00:00 2001
|
|
|
99cbc7 |
Message-Id: <6013f8d130b617ab0ff14075e225b4bb8836702e@dist-git>
|
|
|
99cbc7 |
From: Bing Niu <bing.niu@intel.com>
|
|
|
99cbc7 |
Date: Mon, 15 Apr 2019 17:32:49 +0200
|
|
|
99cbc7 |
Subject: [PATCH] util: Add MBA allocation to virresctrl
|
|
|
99cbc7 |
MIME-Version: 1.0
|
|
|
99cbc7 |
Content-Type: text/plain; charset=UTF-8
|
|
|
99cbc7 |
Content-Transfer-Encoding: 8bit
|
|
|
99cbc7 |
|
|
|
99cbc7 |
Add memory bandwidth allocation support to virresctrl class.
|
|
|
99cbc7 |
Introducing virResctrlAllocMemBW which is used for allocating memory
|
|
|
99cbc7 |
bandwidth. Following virResctrlAllocPerType, it also employs a
|
|
|
99cbc7 |
nested sparse array to indicate whether allocation is available for
|
|
|
99cbc7 |
particular last level cache.
|
|
|
99cbc7 |
|
|
|
99cbc7 |
Signed-off-by: Bing Niu <bing.niu@intel.com>
|
|
|
99cbc7 |
Reviewed-by: John Ferlan <jferlan@redhat.com>
|
|
|
99cbc7 |
(cherry picked from commit 4c727dacbf1bd2a8c4797daf6192b81b85f872f1)
|
|
|
99cbc7 |
|
|
|
99cbc7 |
Resolves: https://bugzilla.redhat.com/show_bug.cgi?id=1468650
|
|
|
99cbc7 |
|
|
|
99cbc7 |
Signed-off-by: Pavel Hrdina <phrdina@redhat.com>
|
|
|
99cbc7 |
Message-Id: <6c5c1d7dfd4415699a0bf7a5461c99e915dfea1b.1555342313.git.phrdina@redhat.com>
|
|
|
99cbc7 |
Reviewed-by: Ján Tomko <jtomko@redhat.com>
|
|
|
99cbc7 |
---
|
|
|
99cbc7 |
src/util/virresctrl.c | 63 ++++++++++++++++++++++++++++++++++++++++---
|
|
|
99cbc7 |
1 file changed, 59 insertions(+), 4 deletions(-)
|
|
|
99cbc7 |
|
|
|
99cbc7 |
diff --git a/src/util/virresctrl.c b/src/util/virresctrl.c
|
|
|
99cbc7 |
index f454868f1e..8a25798f7d 100644
|
|
|
99cbc7 |
--- a/src/util/virresctrl.c
|
|
|
99cbc7 |
+++ b/src/util/virresctrl.c
|
|
|
99cbc7 |
@@ -36,9 +36,9 @@ VIR_LOG_INIT("util.virresctrl")
|
|
|
99cbc7 |
|
|
|
99cbc7 |
|
|
|
99cbc7 |
/* Resctrl is short for Resource Control. It might be implemented for various
|
|
|
99cbc7 |
- * resources, but at the time of this writing this is only supported for cache
|
|
|
99cbc7 |
- * allocation technology (aka CAT). Hence the reson for leaving 'Cache' out of
|
|
|
99cbc7 |
- * all the structure and function names for now (can be added later if needed.
|
|
|
99cbc7 |
+ * resources. Currently this supports cache allocation technology (aka CAT) and
|
|
|
99cbc7 |
+ * memory bandwidth allocation (aka MBA). More resources technologies may be
|
|
|
99cbc7 |
+ * added in the future.
|
|
|
99cbc7 |
*/
|
|
|
99cbc7 |
|
|
|
99cbc7 |
|
|
|
99cbc7 |
@@ -89,6 +89,9 @@ typedef virResctrlAllocPerType *virResctrlAllocPerTypePtr;
|
|
|
99cbc7 |
typedef struct _virResctrlAllocPerLevel virResctrlAllocPerLevel;
|
|
|
99cbc7 |
typedef virResctrlAllocPerLevel *virResctrlAllocPerLevelPtr;
|
|
|
99cbc7 |
|
|
|
99cbc7 |
+typedef struct _virResctrlAllocMemBW virResctrlAllocMemBW;
|
|
|
99cbc7 |
+typedef virResctrlAllocMemBW *virResctrlAllocMemBWPtr;
|
|
|
99cbc7 |
+
|
|
|
99cbc7 |
|
|
|
99cbc7 |
/* Class definitions and initializations */
|
|
|
99cbc7 |
static virClassPtr virResctrlInfoClass;
|
|
|
99cbc7 |
@@ -180,7 +183,10 @@ virResctrlInfoDispose(void *obj)
|
|
|
99cbc7 |
* consequently a directory under /sys/fs/resctrl). Since it can have multiple
|
|
|
99cbc7 |
* parts of multiple caches allocated it is represented as bunch of nested
|
|
|
99cbc7 |
* sparse arrays (by sparse I mean array of pointers so that each might be NULL
|
|
|
99cbc7 |
- * in case there is no allocation for that particular one (level, cache, ...)).
|
|
|
99cbc7 |
+ * in case there is no allocation for that particular cache allocation (level,
|
|
|
99cbc7 |
+ * cache, ...) or memory allocation for particular node).
|
|
|
99cbc7 |
+ *
|
|
|
99cbc7 |
+ * =====Cache allocation technology (CAT)=====
|
|
|
99cbc7 |
*
|
|
|
99cbc7 |
* Since one allocation can be made for caches on different levels, the first
|
|
|
99cbc7 |
* nested sparse array is of types virResctrlAllocPerLevel. For example if you
|
|
|
99cbc7 |
@@ -205,6 +211,17 @@ virResctrlInfoDispose(void *obj)
|
|
|
99cbc7 |
* all of them. While doing that we store the bitmask in a sparse array of
|
|
|
99cbc7 |
* virBitmaps named `masks` indexed the same way as `sizes`. The upper bounds
|
|
|
99cbc7 |
* of the sparse arrays are stored in nmasks or nsizes, respectively.
|
|
|
99cbc7 |
+ + *
|
|
|
99cbc7 |
+ * =====Memory Bandwidth allocation technology (MBA)=====
|
|
|
99cbc7 |
+ *
|
|
|
99cbc7 |
+ * The memory bandwidth allocation support in virResctrlAlloc works in the
|
|
|
99cbc7 |
+ * same fashion as CAT. However, memory bandwidth controller doesn't have a
|
|
|
99cbc7 |
+ * hierarchy organization as cache, each node have one memory bandwidth
|
|
|
99cbc7 |
+ * controller to memory bandwidth distribution. The number of memory bandwidth
|
|
|
99cbc7 |
+ * controller is identical with number of last level cache. So MBA also employs
|
|
|
99cbc7 |
+ * a sparse array to represent whether a memory bandwidth allocation happens
|
|
|
99cbc7 |
+ * on corresponding node. The available memory controller number is collected
|
|
|
99cbc7 |
+ * in 'virResctrlInfo'.
|
|
|
99cbc7 |
*/
|
|
|
99cbc7 |
struct _virResctrlAllocPerType {
|
|
|
99cbc7 |
/* There could be bool saying whether this is set or not, but since everything
|
|
|
99cbc7 |
@@ -225,12 +242,24 @@ struct _virResctrlAllocPerLevel {
|
|
|
99cbc7 |
* VIR_CACHE_TYPE_LAST number of items */
|
|
|
99cbc7 |
};
|
|
|
99cbc7 |
|
|
|
99cbc7 |
+/*
|
|
|
99cbc7 |
+ * virResctrlAllocMemBW represents one memory bandwidth allocation.
|
|
|
99cbc7 |
+ * Since it can have several last level caches in a NUMA system, it is
|
|
|
99cbc7 |
+ * also represented as a nested sparse arrays as virRestrlAllocPerLevel.
|
|
|
99cbc7 |
+ */
|
|
|
99cbc7 |
+struct _virResctrlAllocMemBW {
|
|
|
99cbc7 |
+ unsigned int **bandwidths;
|
|
|
99cbc7 |
+ size_t nbandwidths;
|
|
|
99cbc7 |
+};
|
|
|
99cbc7 |
+
|
|
|
99cbc7 |
struct _virResctrlAlloc {
|
|
|
99cbc7 |
virObject parent;
|
|
|
99cbc7 |
|
|
|
99cbc7 |
virResctrlAllocPerLevelPtr *levels;
|
|
|
99cbc7 |
size_t nlevels;
|
|
|
99cbc7 |
|
|
|
99cbc7 |
+ virResctrlAllocMemBWPtr mem_bw;
|
|
|
99cbc7 |
+
|
|
|
99cbc7 |
/* The identifier (any unique string for now) */
|
|
|
99cbc7 |
char *id;
|
|
|
99cbc7 |
/* libvirt-generated path in /sys/fs/resctrl for this particular
|
|
|
99cbc7 |
@@ -274,6 +303,13 @@ virResctrlAllocDispose(void *obj)
|
|
|
99cbc7 |
VIR_FREE(level);
|
|
|
99cbc7 |
}
|
|
|
99cbc7 |
|
|
|
99cbc7 |
+ if (alloc->mem_bw) {
|
|
|
99cbc7 |
+ virResctrlAllocMemBWPtr mem_bw = alloc->mem_bw;
|
|
|
99cbc7 |
+ for (i = 0; i < mem_bw->nbandwidths; i++)
|
|
|
99cbc7 |
+ VIR_FREE(mem_bw->bandwidths[i]);
|
|
|
99cbc7 |
+ VIR_FREE(alloc->mem_bw);
|
|
|
99cbc7 |
+ }
|
|
|
99cbc7 |
+
|
|
|
99cbc7 |
VIR_FREE(alloc->id);
|
|
|
99cbc7 |
VIR_FREE(alloc->path);
|
|
|
99cbc7 |
VIR_FREE(alloc->levels);
|
|
|
99cbc7 |
@@ -692,6 +728,9 @@ virResctrlAllocIsEmpty(virResctrlAllocPtr alloc)
|
|
|
99cbc7 |
if (!alloc)
|
|
|
99cbc7 |
return true;
|
|
|
99cbc7 |
|
|
|
99cbc7 |
+ if (alloc->mem_bw)
|
|
|
99cbc7 |
+ return false;
|
|
|
99cbc7 |
+
|
|
|
99cbc7 |
for (i = 0; i < alloc->nlevels; i++) {
|
|
|
99cbc7 |
virResctrlAllocPerLevelPtr a_level = alloc->levels[i];
|
|
|
99cbc7 |
|
|
|
99cbc7 |
@@ -1266,6 +1305,22 @@ virResctrlAllocNewFromInfo(virResctrlInfoPtr info)
|
|
|
99cbc7 |
}
|
|
|
99cbc7 |
}
|
|
|
99cbc7 |
|
|
|
99cbc7 |
+ /* set default free memory bandwidth to 100%*/
|
|
|
99cbc7 |
+ if (info->membw_info) {
|
|
|
99cbc7 |
+ if (VIR_ALLOC(ret->mem_bw) < 0)
|
|
|
99cbc7 |
+ goto error;
|
|
|
99cbc7 |
+
|
|
|
99cbc7 |
+ if (VIR_EXPAND_N(ret->mem_bw->bandwidths, ret->mem_bw->nbandwidths,
|
|
|
99cbc7 |
+ info->membw_info->max_id + 1) < 0)
|
|
|
99cbc7 |
+ goto error;
|
|
|
99cbc7 |
+
|
|
|
99cbc7 |
+ for (i = 0; i < ret->mem_bw->nbandwidths; i++) {
|
|
|
99cbc7 |
+ if (VIR_ALLOC(ret->mem_bw->bandwidths[i]) < 0)
|
|
|
99cbc7 |
+ goto error;
|
|
|
99cbc7 |
+ *(ret->mem_bw->bandwidths[i]) = 100;
|
|
|
99cbc7 |
+ }
|
|
|
99cbc7 |
+ }
|
|
|
99cbc7 |
+
|
|
|
99cbc7 |
cleanup:
|
|
|
99cbc7 |
virBitmapFree(mask);
|
|
|
99cbc7 |
return ret;
|
|
|
99cbc7 |
--
|
|
|
99cbc7 |
2.21.0
|
|
|
99cbc7 |
|