qemu-devel
[Top][All Lists]
Advanced

[Date Prev][Date Next][Thread Prev][Thread Next][Date Index][Thread Index]

Re: [Qemu-devel] [PATCH v5 22/45] postcopy: OS support test


From: David Gibson
Subject: Re: [Qemu-devel] [PATCH v5 22/45] postcopy: OS support test
Date: Fri, 13 Mar 2015 12:23:46 +1100
User-agent: Mutt/1.5.23 (2014-03-12)

On Wed, Feb 25, 2015 at 04:51:45PM +0000, Dr. David Alan Gilbert (git) wrote:
> From: "Dr. David Alan Gilbert" <address@hidden>
> 
> Provide a check to see if the OS we're running on has all the bits
> needed for postcopy.
> 
> Creates postcopy-ram.c which will get most of the other helpers we need.
> 
> Signed-off-by: Dr. David Alan Gilbert <address@hidden>
> ---
>  include/migration/postcopy-ram.h |  19 +++++
>  migration/Makefile.objs          |   2 +-
>  migration/postcopy-ram.c         | 161 
> +++++++++++++++++++++++++++++++++++++++
>  savevm.c                         |   5 ++
>  4 files changed, 186 insertions(+), 1 deletion(-)
>  create mode 100644 include/migration/postcopy-ram.h
>  create mode 100644 migration/postcopy-ram.c
> 
> diff --git a/include/migration/postcopy-ram.h 
> b/include/migration/postcopy-ram.h
> new file mode 100644
> index 0000000..d81934f
> --- /dev/null
> +++ b/include/migration/postcopy-ram.h
> @@ -0,0 +1,19 @@
> +/*
> + * Postcopy migration for RAM
> + *
> + * Copyright 2013 Red Hat, Inc. and/or its affiliates
> + *
> + * Authors:
> + *  Dave Gilbert  <address@hidden>
> + *
> + * This work is licensed under the terms of the GNU GPL, version 2 or later.
> + * See the COPYING file in the top-level directory.
> + *
> + */
> +#ifndef QEMU_POSTCOPY_RAM_H
> +#define QEMU_POSTCOPY_RAM_H
> +
> +/* Return true if the host supports everything we need to do postcopy-ram */
> +bool postcopy_ram_supported_by_host(void);
> +
> +#endif
> diff --git a/migration/Makefile.objs b/migration/Makefile.objs
> index d929e96..0cac6d7 100644
> --- a/migration/Makefile.objs
> +++ b/migration/Makefile.objs
> @@ -1,7 +1,7 @@
>  common-obj-y += migration.o tcp.o
>  common-obj-y += vmstate.o
>  common-obj-y += qemu-file.o qemu-file-buf.o qemu-file-unix.o 
> qemu-file-stdio.o
> -common-obj-y += xbzrle.o
> +common-obj-y += xbzrle.o postcopy-ram.o
>  
>  common-obj-$(CONFIG_RDMA) += rdma.o
>  common-obj-$(CONFIG_POSIX) += exec.o unix.o fd.o
> diff --git a/migration/postcopy-ram.c b/migration/postcopy-ram.c
> new file mode 100644
> index 0000000..a0e20b2
> --- /dev/null
> +++ b/migration/postcopy-ram.c
> @@ -0,0 +1,161 @@
> +/*
> + * Postcopy migration for RAM
> + *
> + * Copyright 2013-2014 Red Hat, Inc. and/or its affiliates
> + *
> + * Authors:
> + *  Dave Gilbert  <address@hidden>
> + *
> + * This work is licensed under the terms of the GNU GPL, version 2 or later.
> + * See the COPYING file in the top-level directory.
> + *
> + */
> +
> +/*
> + * Postcopy is a migration technique where the execution flips from the
> + * source to the destination before all the data has been copied.
> + */
> +
> +#include <glib.h>
> +#include <stdio.h>
> +#include <unistd.h>
> +
> +#include "qemu-common.h"
> +#include "migration/migration.h"
> +#include "migration/postcopy-ram.h"
> +#include "sysemu/sysemu.h"
> +#include "qemu/error-report.h"
> +#include "trace.h"
> +
> +/* Postcopy needs to detect accesses to pages that haven't yet been copied
> + * across, and efficiently map new pages in, the techniques for doing this
> + * are target OS specific.
> + */
> +#if defined(__linux__)
> +
> +#include <sys/mman.h>
> +#include <sys/ioctl.h>
> +#include <sys/types.h>
> +#include <asm/types.h> /* for __u64 */
> +#include <linux/userfaultfd.h>
> +
> +#ifdef HOST_X86_64
> +#ifndef __NR_userfaultfd
> +#define __NR_userfaultfd 323

Sholdn't this come from the kernel headers imported in the previous
patch?  Rather than having an arch-specific hack.

> +#endif
> +#endif
> +
> +#endif
> +
> +#if defined(__linux__) && defined(__NR_userfaultfd)
> +
> +static bool ufd_version_check(int ufd)
> +{
> +    struct uffdio_api api_struct;
> +    uint64_t feature_mask;
> +
> +    api_struct.api = UFFD_API;
> +    if (ioctl(ufd, UFFDIO_API, &api_struct)) {
> +        perror("postcopy_ram_supported_by_host: UFFDIO_API failed");

This should be error_report() not, perror(), to match qemu
conventions, shouldn't it?

> +        return false;
> +    }
> +
> +    feature_mask = (__u64)1 << _UFFDIO_REGISTER |
> +                   (__u64)1 << _UFFDIO_UNREGISTER;
> +    if ((api_struct.ioctls & feature_mask) != feature_mask) {
> +        error_report("Missing userfault features: %" PRIu64,
> +                     (uint64_t)(~api_struct.ioctls & feature_mask));
> +        return false;
> +    }
> +
> +    return true;
> +}
> +
> +bool postcopy_ram_supported_by_host(void)
> +{
> +    long pagesize = getpagesize();
> +    int ufd = -1;
> +    bool ret = false; /* Error unless we change it */
> +    void *testarea = NULL;
> +    struct uffdio_register reg_struct;
> +    struct uffdio_range range_struct;
> +    uint64_t feature_mask;
> +
> +    if ((1ul << qemu_target_page_bits()) > pagesize) {
> +        /* The PMI code doesn't yet deal with TPS>HPS */
> +        error_report("Target page size bigger than host page size");
> +        goto out;
> +    }
> +
> +    ufd = syscall(__NR_userfaultfd, O_CLOEXEC);
> +    if (ufd == -1) {
> +        perror("postcopy_ram_supported_by_host: userfaultfd not available");

And here as well?  And several places below.

> +        goto out;
> +    }
> +
> +    /* Version and features check */
> +    if (!ufd_version_check(ufd)) {
> +        goto out;
> +    }
> +
> +    /*
> +     *  We need to check that the ops we need are supported on anon memory
> +     *  To do that we need to register a chunk and see the flags that
> +     *  are returned.
> +     */
> +    testarea = mmap(NULL, pagesize, PROT_READ | PROT_WRITE, MAP_PRIVATE |
> +                                    MAP_ANONYMOUS, -1, 0);
> +    if (!testarea) {

This should be (testarea == MAP_FAILED).  Otherwise mmap() failures
will always trip the assert below.

> +        perror("postcopy_ram_supported_by_host: Failed to map test area");
> +        goto out;
> +    }
> +    g_assert(((size_t)testarea & (pagesize-1)) == 0);
> +
> +    reg_struct.range.start = (uint64_t)(uintptr_t)testarea;
> +    reg_struct.range.len = (uint64_t)pagesize;
> +    reg_struct.mode = UFFDIO_REGISTER_MODE_MISSING;
> +
> +    if (ioctl(ufd, UFFDIO_REGISTER, &reg_struct)) {
> +        perror("postcopy_ram_supported_by_host userfault register");
> +        goto out;
> +    }
> +
> +    range_struct.start = (uint64_t)(uintptr_t)testarea;
> +    range_struct.len = (uint64_t)pagesize;

I don't think you need the (uint64_t) casts (though you do need the
uintptr_t cast).  I think the assignment will do an implicit
conversion without probvlems.

> +    if (ioctl(ufd, UFFDIO_UNREGISTER, &range_struct)) {
> +        perror("postcopy_ram_supported_by_host userfault unregister");
> +        goto out;
> +    }
> +
> +    feature_mask = (__u64)1 << _UFFDIO_WAKE |
> +                   (__u64)1 << _UFFDIO_COPY |
> +                   (__u64)1 << _UFFDIO_ZEROPAGE;
> +    if ((reg_struct.ioctls & feature_mask) != feature_mask) {
> +        error_report("Missing userfault map features: %" PRIu64,

I'm guessing you want PRIx64, in order to make the feature mask at
least semi-readable.

> +                     (uint64_t)(~reg_struct.ioctls & feature_mask));
> +        goto out;
> +    }
> +
> +    /* Success! */
> +    ret = true;
> +out:
> +    if (testarea) {
> +        munmap(testarea, pagesize);
> +    }
> +    if (ufd != -1) {
> +        close(ufd);
> +    }
> +    return ret;
> +}
> +
> +#else
> +/* No target OS support, stubs just fail */
> +
> +bool postcopy_ram_supported_by_host(void)
> +{
> +    error_report("%s: No OS support", __func__);
> +    return false;
> +}
> +
> +#endif
> +
> diff --git a/savevm.c b/savevm.c
> index e301a0a..2ea4c76 100644
> --- a/savevm.c
> +++ b/savevm.c
> @@ -33,6 +33,7 @@
>  #include "qemu/timer.h"
>  #include "audio/audio.h"
>  #include "migration/migration.h"
> +#include "migration/postcopy-ram.h"
>  #include "qemu/sockets.h"
>  #include "qemu/queue.h"
>  #include "sysemu/cpus.h"
> @@ -1109,6 +1110,10 @@ static int 
> loadvm_postcopy_handle_advise(MigrationIncomingState *mis,
>          return -1;
>      }
>  
> +    if (!postcopy_ram_supported_by_host()) {
> +        return -1;
> +    }
> +
>      if (remote_hps != getpagesize())  {
>          /*
>           * Some combinations of mismatch are probably possible but it gets

-- 
David Gibson                    | I'll have my music baroque, and my code
david AT gibson.dropbear.id.au  | minimalist, thank you.  NOT _the_ _other_
                                | _way_ _around_!
http://www.ozlabs.org/~dgibson

Attachment: pgpt1AraZV0uK.pgp
Description: PGP signature


reply via email to

[Prev in Thread] Current Thread [Next in Thread]