[Date Prev][Date Next][Thread Prev][Thread Next][Date Index][Thread Index]
Re: [RFC PATCH v2 4/5] Add migration support for KVM guest with MTE
From: |
Dr. David Alan Gilbert |
Subject: |
Re: [RFC PATCH v2 4/5] Add migration support for KVM guest with MTE |
Date: |
Wed, 17 Mar 2021 20:11:17 +0000 |
User-agent: |
Mutt/2.0.5 (2021-01-21) |
* Haibo Xu (haibo.xu@linaro.org) wrote:
> To make it easier to keep the page tags sync with
> the page data, tags for one page are appended to
> the data during ram save iteration.
>
> This patch only add the pre-copy migration support.
> Post-copy and compress as well as zero page saving
> are not supported yet.
>
> Signed-off-by: Haibo Xu <haibo.xu@linaro.org>
My guess is that this doesn't work with a lot of other options; e.g.
postcopy and probably compression and a bunch of other things.
Postcopy I can see you'll need some interesting kernel changes for -
you'd need to be able to atomically place a page with it's tag data.
You probably need to add stuff to migrate_caps_check to disable
features that you don't support.
> ---
> include/hw/arm/virt.h | 2 +
> include/migration/misc.h | 1 +
> migration/ram.c | 86 +++++++++++++++++++++++++++++++++++++++-
> 3 files changed, 88 insertions(+), 1 deletion(-)
>
> diff --git a/include/hw/arm/virt.h b/include/hw/arm/virt.h
> index 921416f918..8b28cde8bf 100644
> --- a/include/hw/arm/virt.h
> +++ b/include/hw/arm/virt.h
> @@ -166,6 +166,8 @@ struct VirtMachineState {
> PCIBus *bus;
> char *oem_id;
> char *oem_table_id;
> + /* migrate memory tags */
> + NotifierWithReturn precopy_notifier;
> };
>
> #define VIRT_ECAM_ID(high) (high ? VIRT_HIGH_PCIE_ECAM : VIRT_PCIE_ECAM)
> diff --git a/include/migration/misc.h b/include/migration/misc.h
> index bccc1b6b44..005133f471 100644
> --- a/include/migration/misc.h
> +++ b/include/migration/misc.h
> @@ -38,6 +38,7 @@ void precopy_add_notifier(NotifierWithReturn *n);
> void precopy_remove_notifier(NotifierWithReturn *n);
> int precopy_notify(PrecopyNotifyReason reason, Error **errp);
> void precopy_enable_free_page_optimization(void);
> +void precopy_enable_metadata_migration(void);
>
> void ram_mig_init(void);
> void qemu_guest_free_page_hint(void *addr, size_t len);
> diff --git a/migration/ram.c b/migration/ram.c
> index 72143da0ac..e67b798c3b 100644
> --- a/migration/ram.c
> +++ b/migration/ram.c
> @@ -53,10 +53,12 @@
> #include "block.h"
> #include "sysemu/sysemu.h"
> #include "sysemu/cpu-throttle.h"
> +#include "sysemu/kvm.h"
> #include "savevm.h"
> #include "qemu/iov.h"
> #include "multifd.h"
> #include "sysemu/runstate.h"
> +#include "kvm_arm.h"
>
> #if defined(__linux__)
> #include "qemu/userfaultfd.h"
> @@ -80,6 +82,9 @@
> #define RAM_SAVE_FLAG_XBZRLE 0x40
> /* 0x80 is reserved in migration.h start with 0x100 next */
> #define RAM_SAVE_FLAG_COMPRESS_PAGE 0x100
> +#define RAM_SAVE_FLAG_MTE 0x200
I think that's using the last free bit in the flags field, which is a
bit painful.
> +#define MTE_GRANULE_SIZE (16)
>
> static inline bool is_zero_range(uint8_t *p, uint64_t size)
> {
> @@ -317,6 +322,8 @@ struct RAMState {
> bool ram_bulk_stage;
> /* The free page optimization is enabled */
> bool fpo_enabled;
> + /* The RAM meta data(e.t memory tag) is enabled */
> + bool metadata_enabled;
> /* How many times we have dirty too many pages */
> int dirty_rate_high_cnt;
> /* these variables are used for bitmap sync */
> @@ -394,6 +401,15 @@ void precopy_enable_free_page_optimization(void)
> ram_state->fpo_enabled = true;
> }
>
> +void precopy_enable_metadata_migration(void)
> +{
> + if (!ram_state) {
> + return;
> + }
> +
> + ram_state->metadata_enabled = true;
> +}
> +
> uint64_t ram_bytes_remaining(void)
> {
> return ram_state ? (ram_state->migration_dirty_pages * TARGET_PAGE_SIZE)
> :
> @@ -1134,6 +1150,61 @@ static bool control_save_page(RAMState *rs, RAMBlock
> *block, ram_addr_t offset,
> return true;
> }
>
> +static int save_normal_page_mte_tags(QEMUFile *f, uint8_t *addr)
> +{
> + uint8_t *tag_buf = NULL;
> + uint64_t ipa;
> + int size = TARGET_PAGE_SIZE / MTE_GRANULE_SIZE;
This function needs to be mostly somewhere aarch specific; or somehow
made more generic.
We shouldn't have RAM_SAVE_FLAG_MTE as well - we should be something
like RAM_SAVE_FLAG_ARCH_METADATA and that way other architectures with
something else glued onto pages can do something similar.
Try and keep migration/ architecture independent.
> + if (kvm_physical_memory_addr_from_host(kvm_state, addr, &ipa)) {
> + /* Buffer for the page tags(one byte per tag) */
> + tag_buf = g_try_malloc0(size);
It feels like you want to allocate tag_buf in setup and free it at the
end rather than doing this in every page.
> + if (!tag_buf) {
> + error_report("%s: Error allocating MTE tag_buf", __func__);
> + return 0;
> + }
> +
> + if (kvm_arm_mte_get_tags(ipa, TARGET_PAGE_SIZE, tag_buf) < 0) {
> + error_report("%s: Can't get MTE tags from guest", __func__);
For any error like this you probably want to say the addresses to make
it easier to debug when it fails.
> + g_free(tag_buf);
> + return 0;
> + }
> +
> + qemu_put_buffer(f, tag_buf, size);
> +
> + g_free(tag_buf);
> +
> + return size;
> + }
> +
> + return 0;
> +}
> +
> +static void load_normal_page_mte_tags(QEMUFile *f, uint8_t *addr)
> +{
> + uint8_t *tag_buf = NULL;
> + uint64_t ipa;
> + int size = TARGET_PAGE_SIZE / MTE_GRANULE_SIZE;
> +
> + if (kvm_physical_memory_addr_from_host(kvm_state, addr, &ipa)) {
> + /* Buffer for the page tags(one byte per tag) */
> + tag_buf = g_try_malloc0(size);
> + if (!tag_buf) {
> + error_report("%s: Error allocating MTE tag_buf", __func__);
> + return;
> + }
> +
> + qemu_get_buffer(f, tag_buf, size);
> + if (kvm_arm_mte_set_tags(ipa, TARGET_PAGE_SIZE, tag_buf) < 0) {
what protections are there here to stop you setting the mte on something
useful, like part of the host kernel or qemu?
> + error_report("%s: Can't set MTE tags to guest", __func__);
> + }
> +
> + g_free(tag_buf);
> + }
> +
> + return;
> +}
> +
> /*
> * directly send the page to the stream
> *
> @@ -1148,6 +1219,10 @@ static bool control_save_page(RAMState *rs, RAMBlock
> *block, ram_addr_t offset,
> static int save_normal_page(RAMState *rs, RAMBlock *block, ram_addr_t offset,
> uint8_t *buf, bool async)
> {
> + if (rs->metadata_enabled) {
> + offset |= RAM_SAVE_FLAG_MTE;
> + }
> +
> ram_counters.transferred += save_page_header(rs, rs->f, block,
> offset |
> RAM_SAVE_FLAG_PAGE);
> if (async) {
> @@ -1159,6 +1234,11 @@ static int save_normal_page(RAMState *rs, RAMBlock
> *block, ram_addr_t offset,
> }
> ram_counters.transferred += TARGET_PAGE_SIZE;
> ram_counters.normal++;
> +
> + if (rs->metadata_enabled) {
> + ram_counters.transferred += save_normal_page_mte_tags(rs->f, buf);
> + }
> +
> return 1;
> }
>
> @@ -2189,6 +2269,7 @@ static void ram_state_reset(RAMState *rs)
> rs->last_version = ram_list.version;
> rs->ram_bulk_stage = true;
> rs->fpo_enabled = false;
> + rs->metadata_enabled = false;
> }
>
> #define MAX_WAIT 50 /* ms, half buffered_file limit */
> @@ -3779,7 +3860,7 @@ static int ram_load_precopy(QEMUFile *f)
> trace_ram_load_loop(block->idstr, (uint64_t)addr, flags, host);
> }
>
> - switch (flags & ~RAM_SAVE_FLAG_CONTINUE) {
> + switch (flags & ~(RAM_SAVE_FLAG_CONTINUE | RAM_SAVE_FLAG_MTE)) {
> case RAM_SAVE_FLAG_MEM_SIZE:
> /* Synchronize RAM block list */
> total_ram_bytes = addr;
> @@ -3849,6 +3930,9 @@ static int ram_load_precopy(QEMUFile *f)
>
> case RAM_SAVE_FLAG_PAGE:
> qemu_get_buffer(f, host, TARGET_PAGE_SIZE);
> + if (flags & RAM_SAVE_FLAG_MTE) {
> + load_normal_page_mte_tags(f, host);
> + }
> break;
>
> case RAM_SAVE_FLAG_COMPRESS_PAGE:
> --
> 2.17.1
>
--
Dr. David Alan Gilbert / dgilbert@redhat.com / Manchester, UK
- [RFC PATCH v2 0/5] target/arm: Add MTE support to KVM guest, Haibo Xu, 2021/03/17
- [RFC PATCH v2 1/5] Update Linux headers with new MTE support, Haibo Xu, 2021/03/17
- [RFC PATCH v2 2/5] Add basic MTE support to KVM guest, Haibo Xu, 2021/03/17
- [RFC PATCH v2 3/5] Add APIs to get/set MTE tags, Haibo Xu, 2021/03/17
- [RFC PATCH v2 4/5] Add migration support for KVM guest with MTE, Haibo Xu, 2021/03/17
- Re: [RFC PATCH v2 4/5] Add migration support for KVM guest with MTE,
Dr. David Alan Gilbert <=
- Re: [RFC PATCH v2 4/5] Add migration support for KVM guest with MTE, Juan Quintela, 2021/03/25
- [RFC PATCH v2 5/5] Enable the MTE support for KVM guest, Haibo Xu, 2021/03/17