Message ID | 1579904044-20790-3-git-send-email-walling@linux.ibm.com (mailing list archive) |
---|---|
State | New, archived |
Headers | show |
Series | Use DIAG318 to set Control Program Name & Version Codes | expand |
[...] > @@ -0,0 +1,85 @@ > +/* > + * DIAGNOSE 0x318 functions for reset and migration > + * > + * Copyright IBM, Corp. 2019 Should be 2020 now. [...] > +static void s390_diag318_reset(DeviceState *dev) > +{ > + if (kvm_enabled()) > + kvm_s390_set_diag318_info(0); > +} > + > +static void s390_diag318_class_init(ObjectClass *klass, void *data) > +{ > + DeviceClass *dc = DEVICE_CLASS(klass); > + > + dc->reset = s390_diag318_reset; > + dc->vmsd = &vmstate_diag318; > + dc->hotpluggable = false; > + /* Reason: Created automatically during machine instantiation */ > + dc->user_creatable = false; > +} > + > +static const TypeInfo s390_diag318_info = { > + .class_init = s390_diag318_class_init, > + .parent = TYPE_DEVICE, > + .name = TYPE_S390_DIAG318, > + .instance_size = sizeof(DIAG318State), > +}; > + > +static void s390_diag318_register_types(void) > +{ > + type_register_static(&s390_diag318_info); > +} Do we really need a new device? Can't we simply glue that extended state to the machine state? -> target/s390x/machine.c > + > +type_init(s390_diag318_register_types) > diff --git a/hw/s390x/diag318.h b/hw/s390x/diag318.h > new file mode 100644 > index 0000000..06d9f67 > --- /dev/null > +++ b/hw/s390x/diag318.h > @@ -0,0 +1,40 @@ > +/* > + * DIAGNOSE 0x318 functions for reset and migration > + * > + * Copyright IBM, Corp. 2019 > + * > + * Authors: > + * Collin Walling <walling@linux.ibm.com> > + * > + * This work is licensed under the terms of the GNU GPL, version 2 or (at your > + * option) any later version. See the COPYING file in the top-level directory. > + */ > + > +#ifndef HW_DIAG318_H > +#define HW_DIAG318_H > + > +#include "qemu/osdep.h" > +#include "migration/vmstate.h" > +#include "qom/object.h" > +#include "hw/qdev-core.h" > + > +#define TYPE_S390_DIAG318 "diag318" > +#define DIAG318(obj) \ > + OBJECT_CHECK(DIAG318State, (obj), TYPE_S390_DIAG318) > + > +typedef struct DIAG318State { > + /*< private >*/ > + DeviceState parent_obj; > + > + /*< public >*/ > + uint64_t info; > +} DIAG318State; > + > +typedef struct DIAG318Class { > + /*< private >*/ > + DeviceClass parent_class; > + > + /*< public >*/ > +} DIAG318Class; > + > +#endif /* HW_DIAG318_H */ > \ No newline at end of file > diff --git a/hw/s390x/s390-virtio-ccw.c b/hw/s390x/s390-virtio-ccw.c > index e0e2813..d5b7a33 100644 > --- a/hw/s390x/s390-virtio-ccw.c > +++ b/hw/s390x/s390-virtio-ccw.c > @@ -41,6 +41,7 @@ > #include "hw/qdev-properties.h" > #include "hw/s390x/tod.h" > #include "sysemu/sysemu.h" > +#include "hw/s390x/diag318.h" > > S390CPU *s390_cpu_addr2state(uint16_t cpu_addr) > { > @@ -97,6 +98,7 @@ static const char *const reset_dev_types[] = { > "s390-sclp-event-facility", > "s390-flic", > "diag288", > + TYPE_S390_DIAG318, > }; > > static void subsystem_reset(void) > @@ -237,6 +239,17 @@ static void s390_create_sclpconsole(const char *type, Chardev *chardev) > qdev_init_nofail(dev); > } > > +static void s390_init_diag318(void) > +{ > + Object *new = object_new(TYPE_S390_DIAG318); > + DeviceState *dev = DEVICE(new); > + > + object_property_add_child(qdev_get_machine(), TYPE_S390_DIAG318, > + new, NULL); > + object_unref(new); > + qdev_init_nofail(dev); > +} > + > static void ccw_init(MachineState *machine) > { > int ret; > @@ -294,6 +307,9 @@ static void ccw_init(MachineState *machine) > > /* init the TOD clock */ > s390_init_tod(); > + > + /* init object used for migrating diag318 info */ > + s390_init_diag318(); > } > > static void s390_cpu_plug(HotplugHandler *hotplug_dev, > @@ -566,6 +582,7 @@ static void machine_set_loadparm(Object *obj, const char *val, Error **errp) > ms->loadparm[i] = ' '; /* pad right with spaces */ > } > } > + unrelated change. > static inline void s390_machine_initfn(Object *obj) > { > object_property_add_bool(obj, "aes-key-wrap", > diff --git a/hw/s390x/sclp.c b/hw/s390x/sclp.c > index f57ce7b..636348c 100644 > --- a/hw/s390x/sclp.c > +++ b/hw/s390x/sclp.c > @@ -15,6 +15,7 @@ > #include "qemu/osdep.h" > #include "qemu/units.h" > #include "qapi/error.h" > +#include "qemu/error-report.h" > #include "cpu.h" > #include "sysemu/sysemu.h" > #include "hw/boards.h" > @@ -22,6 +23,7 @@ > #include "hw/s390x/event-facility.h" > #include "hw/s390x/s390-pci-bus.h" > #include "hw/s390x/ipl.h" > +#include "kvm_s390x.h" > > static inline SCLPDevice *get_sclp_device(void) > { > @@ -37,10 +39,19 @@ static void prepare_cpu_entries(SCLPDevice *sclp, CPUEntry *entry, int *count) > { > MachineState *ms = MACHINE(qdev_get_machine()); > uint8_t features[SCCB_CPU_FEATURE_LEN] = { 0 }; > + int max_entries; > int i; > > + /* Calculate the max number of CPU entries that can be stored in the SCCB */ > + max_entries = (SCCB_SIZE - offsetof(ReadInfo, entries)) / sizeof(CPUEntry); > + > s390_get_feat_block(S390_FEAT_TYPE_SCLP_CPU, features); > for (i = 0, *count = 0; i < ms->possible_cpus->len; i++) { > + if (*count == max_entries) { > + warn_report("Configuration only supports a max of %d CPU entries.", > + max_entries); I remember that "the sclp response will be limited to 247 CPUs if the feature is one". So we should have a double layout and make max_entries depending on s390_has_feat(). Regarding the message, I'd probably do a "Due to the current CPU model, some CPUs might be hidden from the VM (SCLP)." A VM could still manually probe for others. Thanks!
On 24/01/2020 23.14, Collin Walling wrote: > DIAGNOSE 0x318 (diag318) is a privileged s390x instruction that must > be intercepted by SIE and handled via KVM. Let's introduce some > functions to communicate between QEMU and KVM via ioctls. These > will be used to get/set the diag318 information. > > The availability of this instruction is determined by byte 134, bit 0 > of the Read Info block. This coincidentally expands into the space used > for CPU entries by taking away one byte, which means VMs running with > the diag318 capability will not be able to retrieve information regarding > the 248th CPU. This will not effect performance, and VMs can still be s/effect/affect/ ? > ran with 248 CPUs. s/ran/run/ ? > In order to simplify the migration and system reset requirements of > the diag318 data, let's introduce it as a device class and include > a VMStateDescription. > > Diag318 is set to 0 during modified clear and load normal resets. > > Signed-off-by: Collin Walling <walling@linux.ibm.com> > --- > hw/s390x/Makefile.objs | 1 + > hw/s390x/diag318.c | 85 +++++++++++++++++++++++++++++++++++++ > hw/s390x/diag318.h | 40 +++++++++++++++++ > hw/s390x/s390-virtio-ccw.c | 17 ++++++++ > hw/s390x/sclp.c | 13 ++++++ > include/hw/s390x/sclp.h | 2 + > target/s390x/cpu_features.h | 1 + > target/s390x/cpu_features_def.inc.h | 3 ++ > target/s390x/gen-features.c | 1 + > target/s390x/kvm-stub.c | 10 +++++ > target/s390x/kvm.c | 29 +++++++++++++ > target/s390x/kvm_s390x.h | 2 + > 12 files changed, 204 insertions(+) > create mode 100644 hw/s390x/diag318.c > create mode 100644 hw/s390x/diag318.h > > diff --git a/hw/s390x/Makefile.objs b/hw/s390x/Makefile.objs > index e02ed80..93621dc 100644 > --- a/hw/s390x/Makefile.objs > +++ b/hw/s390x/Makefile.objs > @@ -34,3 +34,4 @@ obj-$(CONFIG_KVM) += s390-stattrib-kvm.o > obj-y += s390-ccw.o > obj-y += ap-device.o > obj-y += ap-bridge.o > +obj-y += diag318.o > diff --git a/hw/s390x/diag318.c b/hw/s390x/diag318.c > new file mode 100644 > index 0000000..2d30bb2 > --- /dev/null > +++ b/hw/s390x/diag318.c > @@ -0,0 +1,85 @@ > +/* > + * DIAGNOSE 0x318 functions for reset and migration > + * > + * Copyright IBM, Corp. 2019 Bump to 2020 ? > + * Authors: > + * Collin Walling <walling@linux.ibm.com> > + * > + * This work is licensed under the terms of the GNU GPL, version 2 or (at your > + * option) any later version. See the COPYING file in the top-level directory. > + */ > + > +#include "hw/s390x/diag318.h" > +#include "qapi/error.h" > +#include "kvm_s390x.h" > +#include "sysemu/kvm.h" > + > +static int diag318_post_load(void *opaque, int version_id) > +{ > + DIAG318State *d = opaque; > + > + if (kvm_enabled()) > + kvm_s390_set_diag318_info(d->info); QEMU coding style requires curly braces also for single lines. > + return 0; > +} > + > +static int diag318_pre_save(void *opaque) > +{ > + DIAG318State *d = opaque; > + > + if (kvm_enabled()) > + kvm_s390_get_diag318_info(&d->info); dito > + return 0; > +} > + > +static bool diag318_needed(void *opaque) > +{ > + return kvm_enabled() ? s390_has_feat(S390_FEAT_DIAG318) : 0; > +} > + > +const VMStateDescription vmstate_diag318 = { > + .name = "vmstate_diag318", > + .post_load = diag318_post_load, > + .pre_save = diag318_pre_save, > + .version_id = 1, > + .minimum_version_id = 1, > + .needed = diag318_needed, > + .fields = (VMStateField[]) { > + VMSTATE_UINT64(info, DIAG318State), > + VMSTATE_END_OF_LIST() > + } > +}; > + > +static void s390_diag318_reset(DeviceState *dev) > +{ > + if (kvm_enabled()) > + kvm_s390_set_diag318_info(0); dito > +} > + > +static void s390_diag318_class_init(ObjectClass *klass, void *data) > +{ > + DeviceClass *dc = DEVICE_CLASS(klass); > + > + dc->reset = s390_diag318_reset; > + dc->vmsd = &vmstate_diag318; > + dc->hotpluggable = false; > + /* Reason: Created automatically during machine instantiation */ > + dc->user_creatable = false; > +} > + > +static const TypeInfo s390_diag318_info = { > + .class_init = s390_diag318_class_init, > + .parent = TYPE_DEVICE, > + .name = TYPE_S390_DIAG318, > + .instance_size = sizeof(DIAG318State), > +}; > + > +static void s390_diag318_register_types(void) > +{ > + type_register_static(&s390_diag318_info); > +} > + > +type_init(s390_diag318_register_types) > diff --git a/hw/s390x/diag318.h b/hw/s390x/diag318.h > new file mode 100644 > index 0000000..06d9f67 > --- /dev/null > +++ b/hw/s390x/diag318.h > @@ -0,0 +1,40 @@ > +/* > + * DIAGNOSE 0x318 functions for reset and migration > + * > + * Copyright IBM, Corp. 2019 2020 ? > + * Authors: > + * Collin Walling <walling@linux.ibm.com> > + * > + * This work is licensed under the terms of the GNU GPL, version 2 or (at your > + * option) any later version. See the COPYING file in the top-level directory. > + */ > + > +#ifndef HW_DIAG318_H > +#define HW_DIAG318_H > + > +#include "qemu/osdep.h" > +#include "migration/vmstate.h" > +#include "qom/object.h" > +#include "hw/qdev-core.h" > + > +#define TYPE_S390_DIAG318 "diag318" > +#define DIAG318(obj) \ > + OBJECT_CHECK(DIAG318State, (obj), TYPE_S390_DIAG318) > + > +typedef struct DIAG318State { > + /*< private >*/ > + DeviceState parent_obj; > + > + /*< public >*/ > + uint64_t info; > +} DIAG318State; > + > +typedef struct DIAG318Class { > + /*< private >*/ > + DeviceClass parent_class; > + > + /*< public >*/ > +} DIAG318Class; You don't use DIAG318Class anywhere. Please drop it. > +#endif /* HW_DIAG318_H */ > \ No newline at end of file > diff --git a/hw/s390x/s390-virtio-ccw.c b/hw/s390x/s390-virtio-ccw.c > index e0e2813..d5b7a33 100644 > --- a/hw/s390x/s390-virtio-ccw.c > +++ b/hw/s390x/s390-virtio-ccw.c > @@ -41,6 +41,7 @@ > #include "hw/qdev-properties.h" > #include "hw/s390x/tod.h" > #include "sysemu/sysemu.h" > +#include "hw/s390x/diag318.h" > > S390CPU *s390_cpu_addr2state(uint16_t cpu_addr) > { > @@ -97,6 +98,7 @@ static const char *const reset_dev_types[] = { > "s390-sclp-event-facility", > "s390-flic", > "diag288", > + TYPE_S390_DIAG318, > }; > > static void subsystem_reset(void) > @@ -237,6 +239,17 @@ static void s390_create_sclpconsole(const char *type, Chardev *chardev) > qdev_init_nofail(dev); > } > > +static void s390_init_diag318(void) > +{ > + Object *new = object_new(TYPE_S390_DIAG318); For the very unlikely case that we ever switch QEMU to C++ ... could you maybe use a different variable name than "new" ? Simply "obj" maybe? > + DeviceState *dev = DEVICE(new); > + > + object_property_add_child(qdev_get_machine(), TYPE_S390_DIAG318, > + new, NULL); > + object_unref(new); > + qdev_init_nofail(dev); > +} > + Thomas
On Fri, 24 Jan 2020 17:14:04 -0500 Collin Walling <walling@linux.ibm.com> wrote: > DIAGNOSE 0x318 (diag318) is a privileged s390x instruction that must > be intercepted by SIE and handled via KVM. Let's introduce some > functions to communicate between QEMU and KVM via ioctls. These > will be used to get/set the diag318 information. Do you want to give a hint what diag 318 actually does? > > The availability of this instruction is determined by byte 134, bit 0 > of the Read Info block. This coincidentally expands into the space used "SCLP Read Info" > for CPU entries by taking away one byte, which means VMs running with > the diag318 capability will not be able to retrieve information regarding > the 248th CPU. This will not effect performance, and VMs can still be > ran with 248 CPUs. Are there other ways in which that might affect guests? I assume Linux can deal with it? Is it ok architecture-wise? In any case, should go into the patch description :) > > In order to simplify the migration and system reset requirements of > the diag318 data, let's introduce it as a device class and include > a VMStateDescription. > > Diag318 is set to 0 during modified clear and load normal resets. What exactly is set to 0? Stored values? > > Signed-off-by: Collin Walling <walling@linux.ibm.com> > --- > hw/s390x/Makefile.objs | 1 + > hw/s390x/diag318.c | 85 +++++++++++++++++++++++++++++++++++++ > hw/s390x/diag318.h | 40 +++++++++++++++++ > hw/s390x/s390-virtio-ccw.c | 17 ++++++++ > hw/s390x/sclp.c | 13 ++++++ > include/hw/s390x/sclp.h | 2 + > target/s390x/cpu_features.h | 1 + > target/s390x/cpu_features_def.inc.h | 3 ++ > target/s390x/gen-features.c | 1 + > target/s390x/kvm-stub.c | 10 +++++ > target/s390x/kvm.c | 29 +++++++++++++ > target/s390x/kvm_s390x.h | 2 + > 12 files changed, 204 insertions(+) > create mode 100644 hw/s390x/diag318.c > create mode 100644 hw/s390x/diag318.h > (...) > diff --git a/hw/s390x/diag318.c b/hw/s390x/diag318.c > new file mode 100644 > index 0000000..2d30bb2 > --- /dev/null > +++ b/hw/s390x/diag318.c > @@ -0,0 +1,85 @@ > +/* > + * DIAGNOSE 0x318 functions for reset and migration > + * > + * Copyright IBM, Corp. 2019 Happy new year? > + * > + * Authors: > + * Collin Walling <walling@linux.ibm.com> > + * > + * This work is licensed under the terms of the GNU GPL, version 2 or (at your > + * option) any later version. See the COPYING file in the top-level directory. > + */ > + > +#include "hw/s390x/diag318.h" > +#include "qapi/error.h" > +#include "kvm_s390x.h" > +#include "sysemu/kvm.h" > + > +static int diag318_post_load(void *opaque, int version_id) > +{ > + DIAG318State *d = opaque; > + > + if (kvm_enabled()) As already noted by patchew, this needs some curly braces. > + kvm_s390_set_diag318_info(d->info); > + > + return 0; > +} > + > +static int diag318_pre_save(void *opaque) > +{ > + DIAG318State *d = opaque; > + > + if (kvm_enabled()) braces > + kvm_s390_get_diag318_info(&d->info); > + > + return 0; > +} > + > +static bool diag318_needed(void *opaque) > +{ > + return kvm_enabled() ? s390_has_feat(S390_FEAT_DIAG318) : 0; Why do you need to guard this with kvm_enabled()? If tcg does not enable the feature, we should be fine; and if it emulates this in the future, we probably need to migrate something anyway. > +} > + > +const VMStateDescription vmstate_diag318 = { > + .name = "vmstate_diag318", > + .post_load = diag318_post_load, > + .pre_save = diag318_pre_save, > + .version_id = 1, > + .minimum_version_id = 1, > + .needed = diag318_needed, > + .fields = (VMStateField[]) { > + VMSTATE_UINT64(info, DIAG318State), > + VMSTATE_END_OF_LIST() > + } > +}; > + > +static void s390_diag318_reset(DeviceState *dev) > +{ > + if (kvm_enabled()) braces > + kvm_s390_set_diag318_info(0); > +} > + > +static void s390_diag318_class_init(ObjectClass *klass, void *data) > +{ > + DeviceClass *dc = DEVICE_CLASS(klass); > + > + dc->reset = s390_diag318_reset; > + dc->vmsd = &vmstate_diag318; > + dc->hotpluggable = false; > + /* Reason: Created automatically during machine instantiation */ > + dc->user_creatable = false; > +} > + > +static const TypeInfo s390_diag318_info = { > + .class_init = s390_diag318_class_init, > + .parent = TYPE_DEVICE, > + .name = TYPE_S390_DIAG318, > + .instance_size = sizeof(DIAG318State), > +}; > + > +static void s390_diag318_register_types(void) > +{ > + type_register_static(&s390_diag318_info); > +} > + > +type_init(s390_diag318_register_types) > diff --git a/hw/s390x/diag318.h b/hw/s390x/diag318.h > new file mode 100644 > index 0000000..06d9f67 > --- /dev/null > +++ b/hw/s390x/diag318.h > @@ -0,0 +1,40 @@ > +/* > + * DIAGNOSE 0x318 functions for reset and migration > + * > + * Copyright IBM, Corp. 2019 Again, the year needs an update. > + * > + * Authors: > + * Collin Walling <walling@linux.ibm.com> > + * > + * This work is licensed under the terms of the GNU GPL, version 2 or (at your > + * option) any later version. See the COPYING file in the top-level directory. > + */ > + > +#ifndef HW_DIAG318_H > +#define HW_DIAG318_H > + > +#include "qemu/osdep.h" > +#include "migration/vmstate.h" > +#include "qom/object.h" > +#include "hw/qdev-core.h" > + > +#define TYPE_S390_DIAG318 "diag318" > +#define DIAG318(obj) \ > + OBJECT_CHECK(DIAG318State, (obj), TYPE_S390_DIAG318) > + > +typedef struct DIAG318State { > + /*< private >*/ > + DeviceState parent_obj; > + > + /*< public >*/ > + uint64_t info; > +} DIAG318State; > + > +typedef struct DIAG318Class { > + /*< private >*/ > + DeviceClass parent_class; > + > + /*< public >*/ > +} DIAG318Class; > + > +#endif /* HW_DIAG318_H */ > \ No newline at end of file And please add a newline :) > diff --git a/hw/s390x/s390-virtio-ccw.c b/hw/s390x/s390-virtio-ccw.c > index e0e2813..d5b7a33 100644 > --- a/hw/s390x/s390-virtio-ccw.c > +++ b/hw/s390x/s390-virtio-ccw.c > @@ -41,6 +41,7 @@ > #include "hw/qdev-properties.h" > #include "hw/s390x/tod.h" > #include "sysemu/sysemu.h" > +#include "hw/s390x/diag318.h" > > S390CPU *s390_cpu_addr2state(uint16_t cpu_addr) > { > @@ -97,6 +98,7 @@ static const char *const reset_dev_types[] = { > "s390-sclp-event-facility", > "s390-flic", > "diag288", > + TYPE_S390_DIAG318, > }; > > static void subsystem_reset(void) > @@ -237,6 +239,17 @@ static void s390_create_sclpconsole(const char *type, Chardev *chardev) > qdev_init_nofail(dev); > } > > +static void s390_init_diag318(void) > +{ > + Object *new = object_new(TYPE_S390_DIAG318); > + DeviceState *dev = DEVICE(new); > + > + object_property_add_child(qdev_get_machine(), TYPE_S390_DIAG318, > + new, NULL); > + object_unref(new); > + qdev_init_nofail(dev); > +} > + > static void ccw_init(MachineState *machine) > { > int ret; > @@ -294,6 +307,9 @@ static void ccw_init(MachineState *machine) > > /* init the TOD clock */ > s390_init_tod(); > + > + /* init object used for migrating diag318 info */ > + s390_init_diag318(); Doesn't that device do a bit more than 'migrating' info? Also, it seems a bit useless unless you're running with kvm and the feature bit switched on... > } > > static void s390_cpu_plug(HotplugHandler *hotplug_dev, > @@ -566,6 +582,7 @@ static void machine_set_loadparm(Object *obj, const char *val, Error **errp) > ms->loadparm[i] = ' '; /* pad right with spaces */ > } > } > + Still whitespace :) > static inline void s390_machine_initfn(Object *obj) > { > object_property_add_bool(obj, "aes-key-wrap", > diff --git a/hw/s390x/sclp.c b/hw/s390x/sclp.c > index f57ce7b..636348c 100644 > --- a/hw/s390x/sclp.c > +++ b/hw/s390x/sclp.c > @@ -15,6 +15,7 @@ > #include "qemu/osdep.h" > #include "qemu/units.h" > #include "qapi/error.h" > +#include "qemu/error-report.h" > #include "cpu.h" > #include "sysemu/sysemu.h" > #include "hw/boards.h" > @@ -22,6 +23,7 @@ > #include "hw/s390x/event-facility.h" > #include "hw/s390x/s390-pci-bus.h" > #include "hw/s390x/ipl.h" > +#include "kvm_s390x.h" > > static inline SCLPDevice *get_sclp_device(void) > { > @@ -37,10 +39,19 @@ static void prepare_cpu_entries(SCLPDevice *sclp, CPUEntry *entry, int *count) > { > MachineState *ms = MACHINE(qdev_get_machine()); > uint8_t features[SCCB_CPU_FEATURE_LEN] = { 0 }; > + int max_entries; > int i; > > + /* Calculate the max number of CPU entries that can be stored in the SCCB */ > + max_entries = (SCCB_SIZE - offsetof(ReadInfo, entries)) / sizeof(CPUEntry); > + > s390_get_feat_block(S390_FEAT_TYPE_SCLP_CPU, features); > for (i = 0, *count = 0; i < ms->possible_cpus->len; i++) { > + if (*count == max_entries) { > + warn_report("Configuration only supports a max of %d CPU entries.", > + max_entries); IIUC, this only moans during Read Info... but you could previously add more cpus than what could be serviced by Read Info. So, it looks to me you get some messages when a guest is doing Read Info; that seems more confusing than helpful to me. Can't we rather warn at cpu instantiation time? > + break; > + } > if (!ms->possible_cpus->cpus[i].cpu) { > continue; > } > @@ -80,6 +91,8 @@ static void read_SCP_info(SCLPDevice *sclp, SCCB *sccb) > s390_get_feat_block(S390_FEAT_TYPE_SCLP_CONF_CHAR_EXT, > read_info->conf_char_ext); > > + s390_get_feat_block(S390_FEAT_TYPE_SCLP_BYTE_134, read_info->byte_134); > + > read_info->facilities = cpu_to_be64(SCLP_HAS_CPU_INFO | > SCLP_HAS_IOA_RECONFIG); > (...)
On 1/27/20 6:20 AM, David Hildenbrand wrote: > [...] >> @@ -0,0 +1,85 @@ >> +/* >> + * DIAGNOSE 0x318 functions for reset and migration >> + * >> + * Copyright IBM, Corp. 2019 > > Should be 2020 now. > > [...] Where did the time go... >> +static void s390_diag318_reset(DeviceState *dev) >> +{ >> + if (kvm_enabled()) >> + kvm_s390_set_diag318_info(0); >> +} >> + >> +static void s390_diag318_class_init(ObjectClass *klass, void *data) >> +{ >> + DeviceClass *dc = DEVICE_CLASS(klass); >> + >> + dc->reset = s390_diag318_reset; >> + dc->vmsd = &vmstate_diag318; >> + dc->hotpluggable = false; >> + /* Reason: Created automatically during machine instantiation */ >> + dc->user_creatable = false; >> +} >> + >> +static const TypeInfo s390_diag318_info = { >> + .class_init = s390_diag318_class_init, >> + .parent = TYPE_DEVICE, >> + .name = TYPE_S390_DIAG318, >> + .instance_size = sizeof(DIAG318State), >> +}; >> + >> +static void s390_diag318_register_types(void) >> +{ >> + type_register_static(&s390_diag318_info); >> +} > > Do we really need a new device? Can't we simply glue that extended state > to the machine state? > > -> target/s390x/machine.c > Those VM States relate to the CPU state... does it make sense to store the diag318 info in a CPU state? (It doesn't seem necessary to store / migrate this info for each CPU). Should we store this in the S390CcwMachineState? Or perhaps create a generic S390MachineState for information that needs to be stored once and migrated once? >> + >> +type_init(s390_diag318_register_types) >> diff --git a/hw/s390x/diag318.h b/hw/s390x/diag318.h >> new file mode 100644 >> index 0000000..06d9f67 >> --- /dev/null >> +++ b/hw/s390x/diag318.h >> @@ -0,0 +1,40 @@ >> +/* >> + * DIAGNOSE 0x318 functions for reset and migration >> + * >> + * Copyright IBM, Corp. 2019 >> + * >> + * Authors: >> + * Collin Walling <walling@linux.ibm.com> >> + * >> + * This work is licensed under the terms of the GNU GPL, version 2 or (at your >> + * option) any later version. See the COPYING file in the top-level directory. >> + */ >> + >> +#ifndef HW_DIAG318_H >> +#define HW_DIAG318_H >> + >> +#include "qemu/osdep.h" >> +#include "migration/vmstate.h" >> +#include "qom/object.h" >> +#include "hw/qdev-core.h" >> + >> +#define TYPE_S390_DIAG318 "diag318" >> +#define DIAG318(obj) \ >> + OBJECT_CHECK(DIAG318State, (obj), TYPE_S390_DIAG318) >> + >> +typedef struct DIAG318State { >> + /*< private >*/ >> + DeviceState parent_obj; >> + >> + /*< public >*/ >> + uint64_t info; >> +} DIAG318State; >> + >> +typedef struct DIAG318Class { >> + /*< private >*/ >> + DeviceClass parent_class; >> + >> + /*< public >*/ >> +} DIAG318Class; >> + >> +#endif /* HW_DIAG318_H */ >> \ No newline at end of file >> diff --git a/hw/s390x/s390-virtio-ccw.c b/hw/s390x/s390-virtio-ccw.c >> index e0e2813..d5b7a33 100644 >> --- a/hw/s390x/s390-virtio-ccw.c >> +++ b/hw/s390x/s390-virtio-ccw.c >> @@ -41,6 +41,7 @@ >> #include "hw/qdev-properties.h" >> #include "hw/s390x/tod.h" >> #include "sysemu/sysemu.h" >> +#include "hw/s390x/diag318.h" >> >> S390CPU *s390_cpu_addr2state(uint16_t cpu_addr) >> { >> @@ -97,6 +98,7 @@ static const char *const reset_dev_types[] = { >> "s390-sclp-event-facility", >> "s390-flic", >> "diag288", >> + TYPE_S390_DIAG318, >> }; >> >> static void subsystem_reset(void) >> @@ -237,6 +239,17 @@ static void s390_create_sclpconsole(const char *type, Chardev *chardev) >> qdev_init_nofail(dev); >> } >> >> +static void s390_init_diag318(void) >> +{ >> + Object *new = object_new(TYPE_S390_DIAG318); >> + DeviceState *dev = DEVICE(new); >> + >> + object_property_add_child(qdev_get_machine(), TYPE_S390_DIAG318, >> + new, NULL); >> + object_unref(new); >> + qdev_init_nofail(dev); >> +} >> + >> static void ccw_init(MachineState *machine) >> { >> int ret; >> @@ -294,6 +307,9 @@ static void ccw_init(MachineState *machine) >> >> /* init the TOD clock */ >> s390_init_tod(); >> + >> + /* init object used for migrating diag318 info */ >> + s390_init_diag318(); >> } >> >> static void s390_cpu_plug(HotplugHandler *hotplug_dev, >> @@ -566,6 +582,7 @@ static void machine_set_loadparm(Object *obj, const char *val, Error **errp) >> ms->loadparm[i] = ' '; /* pad right with spaces */ >> } >> } >> + > > unrelated change. > >> static inline void s390_machine_initfn(Object *obj) >> { >> object_property_add_bool(obj, "aes-key-wrap", >> diff --git a/hw/s390x/sclp.c b/hw/s390x/sclp.c >> index f57ce7b..636348c 100644 >> --- a/hw/s390x/sclp.c >> +++ b/hw/s390x/sclp.c >> @@ -15,6 +15,7 @@ >> #include "qemu/osdep.h" >> #include "qemu/units.h" >> #include "qapi/error.h" >> +#include "qemu/error-report.h" >> #include "cpu.h" >> #include "sysemu/sysemu.h" >> #include "hw/boards.h" >> @@ -22,6 +23,7 @@ >> #include "hw/s390x/event-facility.h" >> #include "hw/s390x/s390-pci-bus.h" >> #include "hw/s390x/ipl.h" >> +#include "kvm_s390x.h" >> >> static inline SCLPDevice *get_sclp_device(void) >> { >> @@ -37,10 +39,19 @@ static void prepare_cpu_entries(SCLPDevice *sclp, CPUEntry *entry, int *count) >> { >> MachineState *ms = MACHINE(qdev_get_machine()); >> uint8_t features[SCCB_CPU_FEATURE_LEN] = { 0 }; >> + int max_entries; >> int i; >> >> + /* Calculate the max number of CPU entries that can be stored in the SCCB */ >> + max_entries = (SCCB_SIZE - offsetof(ReadInfo, entries)) / sizeof(CPUEntry); >> + >> s390_get_feat_block(S390_FEAT_TYPE_SCLP_CPU, features); >> for (i = 0, *count = 0; i < ms->possible_cpus->len; i++) { >> + if (*count == max_entries) { >> + warn_report("Configuration only supports a max of %d CPU entries.", >> + max_entries); > > I remember that "the sclp response will be limited to 247 CPUs if the > feature is one". So we should have a double layout and make max_entries > depending on s390_has_feat(). I'm looking back on previous discussions we had. Looks like this idea has been mentioned before. (oops!) Perhaps I'm not understanding something. How about we introduce a union in the ReadInfo struct. Something like: union { uint8_t byte_134; struct CPUEntry entries[0]; } x; If the diag318 facility is enabled, then we'll use that first byte for bit indication and only allow 247 CPUs. Otherwise, we'll discard the byte and allow the original 248 CPUs. The offset_cpu field in the ReadInfo struct would still be used to locate the first entry, of course. Note: the Read SCP Info fields are on a 16-byte boundary. > > Regarding the message, I'd probably do a "Due to the current CPU model, > some CPUs might be hidden from the VM (SCLP)." > > A VM could still manually probe for others. > > Thanks! > Right. I'll make the change to the message. Thank you for the review!
On 1/27/20 6:36 AM, Thomas Huth wrote: > On 24/01/2020 23.14, Collin Walling wrote: >> DIAGNOSE 0x318 (diag318) is a privileged s390x instruction that must >> be intercepted by SIE and handled via KVM. Let's introduce some >> functions to communicate between QEMU and KVM via ioctls. These >> will be used to get/set the diag318 information. >> >> The availability of this instruction is determined by byte 134, bit 0 >> of the Read Info block. This coincidentally expands into the space used >> for CPU entries by taking away one byte, which means VMs running with >> the diag318 capability will not be able to retrieve information regarding >> the 248th CPU. This will not effect performance, and VMs can still be > > s/effect/affect/ ? > >> ran with 248 CPUs. > > s/ran/run/ ? > >> In order to simplify the migration and system reset requirements of >> the diag318 data, let's introduce it as a device class and include >> a VMStateDescription. >> >> Diag318 is set to 0 during modified clear and load normal resets. >> >> Signed-off-by: Collin Walling <walling@linux.ibm.com> >> --- >> hw/s390x/Makefile.objs | 1 + >> hw/s390x/diag318.c | 85 +++++++++++++++++++++++++++++++++++++ >> hw/s390x/diag318.h | 40 +++++++++++++++++ >> hw/s390x/s390-virtio-ccw.c | 17 ++++++++ >> hw/s390x/sclp.c | 13 ++++++ >> include/hw/s390x/sclp.h | 2 + >> target/s390x/cpu_features.h | 1 + >> target/s390x/cpu_features_def.inc.h | 3 ++ >> target/s390x/gen-features.c | 1 + >> target/s390x/kvm-stub.c | 10 +++++ >> target/s390x/kvm.c | 29 +++++++++++++ >> target/s390x/kvm_s390x.h | 2 + >> 12 files changed, 204 insertions(+) >> create mode 100644 hw/s390x/diag318.c >> create mode 100644 hw/s390x/diag318.h >> >> diff --git a/hw/s390x/Makefile.objs b/hw/s390x/Makefile.objs >> index e02ed80..93621dc 100644 >> --- a/hw/s390x/Makefile.objs >> +++ b/hw/s390x/Makefile.objs >> @@ -34,3 +34,4 @@ obj-$(CONFIG_KVM) += s390-stattrib-kvm.o >> obj-y += s390-ccw.o >> obj-y += ap-device.o >> obj-y += ap-bridge.o >> +obj-y += diag318.o >> diff --git a/hw/s390x/diag318.c b/hw/s390x/diag318.c >> new file mode 100644 >> index 0000000..2d30bb2 >> --- /dev/null >> +++ b/hw/s390x/diag318.c >> @@ -0,0 +1,85 @@ >> +/* >> + * DIAGNOSE 0x318 functions for reset and migration >> + * >> + * Copyright IBM, Corp. 2019 > > Bump to 2020 ? > >> + * Authors: >> + * Collin Walling <walling@linux.ibm.com> >> + * >> + * This work is licensed under the terms of the GNU GPL, version 2 or (at your >> + * option) any later version. See the COPYING file in the top-level directory. >> + */ >> + >> +#include "hw/s390x/diag318.h" >> +#include "qapi/error.h" >> +#include "kvm_s390x.h" >> +#include "sysemu/kvm.h" >> + >> +static int diag318_post_load(void *opaque, int version_id) >> +{ >> + DIAG318State *d = opaque; >> + >> + if (kvm_enabled()) >> + kvm_s390_set_diag318_info(d->info); > > QEMU coding style requires curly braces also for single lines. > >> + return 0; >> +} >> + >> +static int diag318_pre_save(void *opaque) >> +{ >> + DIAG318State *d = opaque; >> + >> + if (kvm_enabled()) >> + kvm_s390_get_diag318_info(&d->info); > > dito > >> + return 0; >> +} >> + >> +static bool diag318_needed(void *opaque) >> +{ >> + return kvm_enabled() ? s390_has_feat(S390_FEAT_DIAG318) : 0; >> +} >> + >> +const VMStateDescription vmstate_diag318 = { >> + .name = "vmstate_diag318", >> + .post_load = diag318_post_load, >> + .pre_save = diag318_pre_save, >> + .version_id = 1, >> + .minimum_version_id = 1, >> + .needed = diag318_needed, >> + .fields = (VMStateField[]) { >> + VMSTATE_UINT64(info, DIAG318State), >> + VMSTATE_END_OF_LIST() >> + } >> +}; >> + >> +static void s390_diag318_reset(DeviceState *dev) >> +{ >> + if (kvm_enabled()) >> + kvm_s390_set_diag318_info(0); > > dito > >> +} >> + >> +static void s390_diag318_class_init(ObjectClass *klass, void *data) >> +{ >> + DeviceClass *dc = DEVICE_CLASS(klass); >> + >> + dc->reset = s390_diag318_reset; >> + dc->vmsd = &vmstate_diag318; >> + dc->hotpluggable = false; >> + /* Reason: Created automatically during machine instantiation */ >> + dc->user_creatable = false; >> +} >> + >> +static const TypeInfo s390_diag318_info = { >> + .class_init = s390_diag318_class_init, >> + .parent = TYPE_DEVICE, >> + .name = TYPE_S390_DIAG318, >> + .instance_size = sizeof(DIAG318State), >> +}; >> + >> +static void s390_diag318_register_types(void) >> +{ >> + type_register_static(&s390_diag318_info); >> +} >> + >> +type_init(s390_diag318_register_types) >> diff --git a/hw/s390x/diag318.h b/hw/s390x/diag318.h >> new file mode 100644 >> index 0000000..06d9f67 >> --- /dev/null >> +++ b/hw/s390x/diag318.h >> @@ -0,0 +1,40 @@ >> +/* >> + * DIAGNOSE 0x318 functions for reset and migration >> + * >> + * Copyright IBM, Corp. 2019 > > 2020 ? > >> + * Authors: >> + * Collin Walling <walling@linux.ibm.com> >> + * >> + * This work is licensed under the terms of the GNU GPL, version 2 or (at your >> + * option) any later version. See the COPYING file in the top-level directory. >> + */ >> + >> +#ifndef HW_DIAG318_H >> +#define HW_DIAG318_H >> + >> +#include "qemu/osdep.h" >> +#include "migration/vmstate.h" >> +#include "qom/object.h" >> +#include "hw/qdev-core.h" >> + >> +#define TYPE_S390_DIAG318 "diag318" >> +#define DIAG318(obj) \ >> + OBJECT_CHECK(DIAG318State, (obj), TYPE_S390_DIAG318) >> + >> +typedef struct DIAG318State { >> + /*< private >*/ >> + DeviceState parent_obj; >> + >> + /*< public >*/ >> + uint64_t info; >> +} DIAG318State; >> + >> +typedef struct DIAG318Class { >> + /*< private >*/ >> + DeviceClass parent_class; >> + >> + /*< public >*/ >> +} DIAG318Class; > > You don't use DIAG318Class anywhere. Please drop it. > >> +#endif /* HW_DIAG318_H */ >> \ No newline at end of file >> diff --git a/hw/s390x/s390-virtio-ccw.c b/hw/s390x/s390-virtio-ccw.c >> index e0e2813..d5b7a33 100644 >> --- a/hw/s390x/s390-virtio-ccw.c >> +++ b/hw/s390x/s390-virtio-ccw.c >> @@ -41,6 +41,7 @@ >> #include "hw/qdev-properties.h" >> #include "hw/s390x/tod.h" >> #include "sysemu/sysemu.h" >> +#include "hw/s390x/diag318.h" >> >> S390CPU *s390_cpu_addr2state(uint16_t cpu_addr) >> { >> @@ -97,6 +98,7 @@ static const char *const reset_dev_types[] = { >> "s390-sclp-event-facility", >> "s390-flic", >> "diag288", >> + TYPE_S390_DIAG318, >> }; >> >> static void subsystem_reset(void) >> @@ -237,6 +239,17 @@ static void s390_create_sclpconsole(const char *type, Chardev *chardev) >> qdev_init_nofail(dev); >> } >> >> +static void s390_init_diag318(void) >> +{ >> + Object *new = object_new(TYPE_S390_DIAG318); > > For the very unlikely case that we ever switch QEMU to C++ ... could you > maybe use a different variable name than "new" ? Simply "obj" maybe? > >> + DeviceState *dev = DEVICE(new); >> + >> + object_property_add_child(qdev_get_machine(), TYPE_S390_DIAG318, >> + new, NULL); >> + object_unref(new); >> + qdev_init_nofail(dev); >> +} >> + > > Thomas > Noted your comments. Thanks for the review! I'll remember to run checkpatch next time ;)
On 1/27/20 6:47 AM, Cornelia Huck wrote: > On Fri, 24 Jan 2020 17:14:04 -0500 > Collin Walling <walling@linux.ibm.com> wrote: > >> DIAGNOSE 0x318 (diag318) is a privileged s390x instruction that must >> be intercepted by SIE and handled via KVM. Let's introduce some >> functions to communicate between QEMU and KVM via ioctls. These >> will be used to get/set the diag318 information. > > Do you want to give a hint what diag 318 actually does? > For the sake of completeness, I'll have to get back to you on this. >> >> The availability of this instruction is determined by byte 134, bit 0 >> of the Read Info block. This coincidentally expands into the space used > > "SCLP Read Info" > >> for CPU entries by taking away one byte, which means VMs running with >> the diag318 capability will not be able to retrieve information regarding >> the 248th CPU. This will not effect performance, and VMs can still be >> ran with 248 CPUs. > > Are there other ways in which that might affect guests? I assume Linux > can deal with it? Is it ok architecture-wise? > > In any case, should go into the patch description :) > Same as above. I'll try to provide more information regarding what happens here in my next reply. >> >> In order to simplify the migration and system reset requirements of >> the diag318 data, let's introduce it as a device class and include >> a VMStateDescription. >> >> Diag318 is set to 0 during modified clear and load normal resets. > > What exactly is set to 0? Stored values? > Correct. "The stored values set by DIAG318 are reset to 0 during..." >> >> Signed-off-by: Collin Walling <walling@linux.ibm.com> >> --- >> hw/s390x/Makefile.objs | 1 + >> hw/s390x/diag318.c | 85 +++++++++++++++++++++++++++++++++++++ >> hw/s390x/diag318.h | 40 +++++++++++++++++ >> hw/s390x/s390-virtio-ccw.c | 17 ++++++++ >> hw/s390x/sclp.c | 13 ++++++ >> include/hw/s390x/sclp.h | 2 + >> target/s390x/cpu_features.h | 1 + >> target/s390x/cpu_features_def.inc.h | 3 ++ >> target/s390x/gen-features.c | 1 + >> target/s390x/kvm-stub.c | 10 +++++ >> target/s390x/kvm.c | 29 +++++++++++++ >> target/s390x/kvm_s390x.h | 2 + >> 12 files changed, 204 insertions(+) >> create mode 100644 hw/s390x/diag318.c >> create mode 100644 hw/s390x/diag318.h >> > (...) >> diff --git a/hw/s390x/diag318.c b/hw/s390x/diag318.c >> new file mode 100644 >> index 0000000..2d30bb2 >> --- /dev/null >> +++ b/hw/s390x/diag318.c >> @@ -0,0 +1,85 @@ >> +/* >> + * DIAGNOSE 0x318 functions for reset and migration >> + * >> + * Copyright IBM, Corp. 2019 > > Happy new year? > Woo! >> + * >> + * Authors: >> + * Collin Walling <walling@linux.ibm.com> >> + * >> + * This work is licensed under the terms of the GNU GPL, version 2 or (at your >> + * option) any later version. See the COPYING file in the top-level directory. >> + */ >> + >> +#include "hw/s390x/diag318.h" >> +#include "qapi/error.h" >> +#include "kvm_s390x.h" >> +#include "sysemu/kvm.h" >> + >> +static int diag318_post_load(void *opaque, int version_id) >> +{ >> + DIAG318State *d = opaque; >> + >> + if (kvm_enabled()) > > As already noted by patchew, this needs some curly braces. > >> + kvm_s390_set_diag318_info(d->info); >> + >> + return 0; >> +} >> + >> +static int diag318_pre_save(void *opaque) >> +{ >> + DIAG318State *d = opaque; >> + >> + if (kvm_enabled()) > > braces > >> + kvm_s390_get_diag318_info(&d->info); >> + >> + return 0; >> +} >> + >> +static bool diag318_needed(void *opaque) >> +{ >> + return kvm_enabled() ? s390_has_feat(S390_FEAT_DIAG318) : 0; > > Why do you need to guard this with kvm_enabled()? If tcg does not > enable the feature, we should be fine; and if it emulates this in the > future, we probably need to migrate something anyway. > Your explanation makes sense. My thoughts were to not even bother registering the state description if KVM isn't enabled (but I guess that thinking would mean that the other kvm_enabled fencing would be redundant? Doh.) I'll fix this. >> +} >> + >> +const VMStateDescription vmstate_diag318 = { >> + .name = "vmstate_diag318", >> + .post_load = diag318_post_load, >> + .pre_save = diag318_pre_save, >> + .version_id = 1, >> + .minimum_version_id = 1, >> + .needed = diag318_needed, >> + .fields = (VMStateField[]) { >> + VMSTATE_UINT64(info, DIAG318State), >> + VMSTATE_END_OF_LIST() >> + } >> +}; >> + >> +static void s390_diag318_reset(DeviceState *dev) >> +{ >> + if (kvm_enabled()) > > braces > >> + kvm_s390_set_diag318_info(0); >> +} >> + >> +static void s390_diag318_class_init(ObjectClass *klass, void *data) >> +{ >> + DeviceClass *dc = DEVICE_CLASS(klass); >> + >> + dc->reset = s390_diag318_reset; >> + dc->vmsd = &vmstate_diag318; >> + dc->hotpluggable = false; >> + /* Reason: Created automatically during machine instantiation */ >> + dc->user_creatable = false; >> +} >> + >> +static const TypeInfo s390_diag318_info = { >> + .class_init = s390_diag318_class_init, >> + .parent = TYPE_DEVICE, >> + .name = TYPE_S390_DIAG318, >> + .instance_size = sizeof(DIAG318State), >> +}; >> + >> +static void s390_diag318_register_types(void) >> +{ >> + type_register_static(&s390_diag318_info); >> +} >> + >> +type_init(s390_diag318_register_types) >> diff --git a/hw/s390x/diag318.h b/hw/s390x/diag318.h >> new file mode 100644 >> index 0000000..06d9f67 >> --- /dev/null >> +++ b/hw/s390x/diag318.h >> @@ -0,0 +1,40 @@ >> +/* >> + * DIAGNOSE 0x318 functions for reset and migration >> + * >> + * Copyright IBM, Corp. 2019 > > Again, the year needs an update. > >> + * >> + * Authors: >> + * Collin Walling <walling@linux.ibm.com> >> + * >> + * This work is licensed under the terms of the GNU GPL, version 2 or (at your >> + * option) any later version. See the COPYING file in the top-level directory. >> + */ >> + >> +#ifndef HW_DIAG318_H >> +#define HW_DIAG318_H >> + >> +#include "qemu/osdep.h" >> +#include "migration/vmstate.h" >> +#include "qom/object.h" >> +#include "hw/qdev-core.h" >> + >> +#define TYPE_S390_DIAG318 "diag318" >> +#define DIAG318(obj) \ >> + OBJECT_CHECK(DIAG318State, (obj), TYPE_S390_DIAG318) >> + >> +typedef struct DIAG318State { >> + /*< private >*/ >> + DeviceState parent_obj; >> + >> + /*< public >*/ >> + uint64_t info; >> +} DIAG318State; >> + >> +typedef struct DIAG318Class { >> + /*< private >*/ >> + DeviceClass parent_class; >> + >> + /*< public >*/ >> +} DIAG318Class; >> + >> +#endif /* HW_DIAG318_H */ >> \ No newline at end of file > > And please add a newline :) > >> diff --git a/hw/s390x/s390-virtio-ccw.c b/hw/s390x/s390-virtio-ccw.c >> index e0e2813..d5b7a33 100644 >> --- a/hw/s390x/s390-virtio-ccw.c >> +++ b/hw/s390x/s390-virtio-ccw.c >> @@ -41,6 +41,7 @@ >> #include "hw/qdev-properties.h" >> #include "hw/s390x/tod.h" >> #include "sysemu/sysemu.h" >> +#include "hw/s390x/diag318.h" >> >> S390CPU *s390_cpu_addr2state(uint16_t cpu_addr) >> { >> @@ -97,6 +98,7 @@ static const char *const reset_dev_types[] = { >> "s390-sclp-event-facility", >> "s390-flic", >> "diag288", >> + TYPE_S390_DIAG318, >> }; >> >> static void subsystem_reset(void) >> @@ -237,6 +239,17 @@ static void s390_create_sclpconsole(const char *type, Chardev *chardev) >> qdev_init_nofail(dev); >> } >> >> +static void s390_init_diag318(void) >> +{ >> + Object *new = object_new(TYPE_S390_DIAG318); >> + DeviceState *dev = DEVICE(new); >> + >> + object_property_add_child(qdev_get_machine(), TYPE_S390_DIAG318, >> + new, NULL); >> + object_unref(new); >> + qdev_init_nofail(dev); >> +} >> + >> static void ccw_init(MachineState *machine) >> { >> int ret; >> @@ -294,6 +307,9 @@ static void ccw_init(MachineState *machine) >> >> /* init the TOD clock */ >> s390_init_tod(); >> + >> + /* init object used for migrating diag318 info */ >> + s390_init_diag318(); > > Doesn't that device do a bit more than 'migrating' info? > > Also, it seems a bit useless unless you're running with kvm and the > feature bit switched on... > Right... I think this whole "diag318 device" thing needs some rethinking. I made a comment on David's response regarding where to but the VMStateDescription code for diag318. Perhaps including the related information within the S390MachineState would be better? (I'm not sure). >> } >> >> static void s390_cpu_plug(HotplugHandler *hotplug_dev, >> @@ -566,6 +582,7 @@ static void machine_set_loadparm(Object *obj, const char *val, Error **errp) >> ms->loadparm[i] = ' '; /* pad right with spaces */ >> } >> } >> + > > Still whitespace :) > >> static inline void s390_machine_initfn(Object *obj) >> { >> object_property_add_bool(obj, "aes-key-wrap", >> diff --git a/hw/s390x/sclp.c b/hw/s390x/sclp.c >> index f57ce7b..636348c 100644 >> --- a/hw/s390x/sclp.c >> +++ b/hw/s390x/sclp.c >> @@ -15,6 +15,7 @@ >> #include "qemu/osdep.h" >> #include "qemu/units.h" >> #include "qapi/error.h" >> +#include "qemu/error-report.h" >> #include "cpu.h" >> #include "sysemu/sysemu.h" >> #include "hw/boards.h" >> @@ -22,6 +23,7 @@ >> #include "hw/s390x/event-facility.h" >> #include "hw/s390x/s390-pci-bus.h" >> #include "hw/s390x/ipl.h" >> +#include "kvm_s390x.h" >> >> static inline SCLPDevice *get_sclp_device(void) >> { >> @@ -37,10 +39,19 @@ static void prepare_cpu_entries(SCLPDevice *sclp, CPUEntry *entry, int *count) >> { >> MachineState *ms = MACHINE(qdev_get_machine()); >> uint8_t features[SCCB_CPU_FEATURE_LEN] = { 0 }; >> + int max_entries; >> int i; >> >> + /* Calculate the max number of CPU entries that can be stored in the SCCB */ >> + max_entries = (SCCB_SIZE - offsetof(ReadInfo, entries)) / sizeof(CPUEntry); >> + >> s390_get_feat_block(S390_FEAT_TYPE_SCLP_CPU, features); >> for (i = 0, *count = 0; i < ms->possible_cpus->len; i++) { >> + if (*count == max_entries) { >> + warn_report("Configuration only supports a max of %d CPU entries.", >> + max_entries); > > IIUC, this only moans during Read Info... but you could previously add > more cpus than what could be serviced by Read Info. So, it looks to me > you get some messages when a guest is doing Read Info; that seems more > confusing than helpful to me. Can't we rather warn at cpu instantiation > time? > Ahh, I didn't think of that. For some reason, I was thinking that Read Info would only be queried once. Yes, this makes sense. I'll relocate the warning message... >> + break; >> + } >> if (!ms->possible_cpus->cpus[i].cpu) { >> continue; >> } >> @@ -80,6 +91,8 @@ static void read_SCP_info(SCLPDevice *sclp, SCCB *sccb) >> s390_get_feat_block(S390_FEAT_TYPE_SCLP_CONF_CHAR_EXT, >> read_info->conf_char_ext); >> >> + s390_get_feat_block(S390_FEAT_TYPE_SCLP_BYTE_134, read_info->byte_134); >> + >> read_info->facilities = cpu_to_be64(SCLP_HAS_CPU_INFO | >> SCLP_HAS_IOA_RECONFIG); >> > > (...) > > I've noted the nits as well. Thanks for your review!
>>> +static void s390_diag318_reset(DeviceState *dev) >>> +{ >>> + if (kvm_enabled()) >>> + kvm_s390_set_diag318_info(0); >>> +} >>> + >>> +static void s390_diag318_class_init(ObjectClass *klass, void *data) >>> +{ >>> + DeviceClass *dc = DEVICE_CLASS(klass); >>> + >>> + dc->reset = s390_diag318_reset; >>> + dc->vmsd = &vmstate_diag318; >>> + dc->hotpluggable = false; >>> + /* Reason: Created automatically during machine instantiation */ >>> + dc->user_creatable = false; >>> +} >>> + >>> +static const TypeInfo s390_diag318_info = { >>> + .class_init = s390_diag318_class_init, >>> + .parent = TYPE_DEVICE, >>> + .name = TYPE_S390_DIAG318, >>> + .instance_size = sizeof(DIAG318State), >>> +}; >>> + >>> +static void s390_diag318_register_types(void) >>> +{ >>> + type_register_static(&s390_diag318_info); >>> +} >> >> Do we really need a new device? Can't we simply glue that extended state >> to the machine state? >> >> -> target/s390x/machine.c >> > > Those VM States relate to the CPU state... does it make sense to store the > diag318 info in a CPU state? (It doesn't seem necessary to store / migrate > this info for each CPU). I'm sorry, I was looking at the wrong file ... > > Should we store this in the S390CcwMachineState? Or perhaps create a generic > S390MachineState for information that needs to be stored once and migrated > once? ... I actually thought we have something like this already. Personally, I think that would make sense. At least spapr seems to have something like this already (hw/ppc/spapr.c:spapr_machine_init(). @Conny? [...] > > How about we introduce a union in the ReadInfo struct. Something like: > > union { > uint8_t byte_134; > struct CPUEntry entries[0]; > } x; Or drop the "entries" pointer completely and introduce static int cpu_entries_offset(void) { /* * When we have to indicate features in byte 134, we have to move * the start of the cpu entries. */ if (s390_has_feat(S390_FEAT_DIAG318)) { return 144; } return 128; } struct CPUEntry *cpu_entries(ReadInfo *ri) { return (struct CPUEntry *)((void *)ri + cpu_entries_offset()); } unsigned int cpu_entries)count(ReadInfo *ri) { return (SCCB_SIZE - cpu_entries_offset()) / sizeof(CPUEntry); } etc. (might take some tweaking to make it compile) and a comment for the struct. Not sure what's better. Having two struct CPUEntry entries[0] is also confusing. Thanks!
On Mon, 27 Jan 2020 18:09:11 +0100 David Hildenbrand <david@redhat.com> wrote: > >>> +static void s390_diag318_reset(DeviceState *dev) > >>> +{ > >>> + if (kvm_enabled()) > >>> + kvm_s390_set_diag318_info(0); > >>> +} > >>> + > >>> +static void s390_diag318_class_init(ObjectClass *klass, void *data) > >>> +{ > >>> + DeviceClass *dc = DEVICE_CLASS(klass); > >>> + > >>> + dc->reset = s390_diag318_reset; > >>> + dc->vmsd = &vmstate_diag318; > >>> + dc->hotpluggable = false; > >>> + /* Reason: Created automatically during machine instantiation */ > >>> + dc->user_creatable = false; > >>> +} > >>> + > >>> +static const TypeInfo s390_diag318_info = { > >>> + .class_init = s390_diag318_class_init, > >>> + .parent = TYPE_DEVICE, > >>> + .name = TYPE_S390_DIAG318, > >>> + .instance_size = sizeof(DIAG318State), > >>> +}; > >>> + > >>> +static void s390_diag318_register_types(void) > >>> +{ > >>> + type_register_static(&s390_diag318_info); > >>> +} > >> > >> Do we really need a new device? Can't we simply glue that extended state > >> to the machine state? > >> > >> -> target/s390x/machine.c > >> > > > > Those VM States relate to the CPU state... does it make sense to store the > > diag318 info in a CPU state? (It doesn't seem necessary to store / migrate > > this info for each CPU). > > I'm sorry, I was looking at the wrong file ... > > > > > Should we store this in the S390CcwMachineState? Or perhaps create a generic > > S390MachineState for information that needs to be stored once and migrated > > once? > > ... I actually thought we have something like this already. Personally, > I think that would make sense. At least spapr seems to have something > like this already (hw/ppc/spapr.c:spapr_machine_init(). > > @Conny? What are you referring to? I only see the one with the FIXME in front of it... > > [...] > > > > How about we introduce a union in the ReadInfo struct. Something like: > > > > union { > > uint8_t byte_134; > > struct CPUEntry entries[0]; > > } x; > > Or drop the "entries" pointer completely and introduce > > static int cpu_entries_offset(void) > { > /* > * When we have to indicate features in byte 134, we have to move > * the start of the cpu entries. > */ > if (s390_has_feat(S390_FEAT_DIAG318)) { > return 144; > } > return 128; > } > > struct CPUEntry *cpu_entries(ReadInfo *ri) > { > return (struct CPUEntry *)((void *)ri + cpu_entries_offset()); > } > > unsigned int cpu_entries)count(ReadInfo *ri) > { > return (SCCB_SIZE - cpu_entries_offset()) / sizeof(CPUEntry); > } > > etc. (might take some tweaking to make it compile) and a comment for the > struct. Not sure what's better. Having two struct CPUEntry entries[0] is > also confusing. I think that version may end up looking better.
On Mon, 27 Jan 2020 11:39:02 -0500 Collin Walling <walling@linux.ibm.com> wrote: > On 1/27/20 6:47 AM, Cornelia Huck wrote: > > On Fri, 24 Jan 2020 17:14:04 -0500 > > Collin Walling <walling@linux.ibm.com> wrote: > > > >> DIAGNOSE 0x318 (diag318) is a privileged s390x instruction that must > >> be intercepted by SIE and handled via KVM. Let's introduce some > >> functions to communicate between QEMU and KVM via ioctls. These > >> will be used to get/set the diag318 information. > > > > Do you want to give a hint what diag 318 actually does? > > > > For the sake of completeness, I'll have to get back to you on this. > > >> > >> The availability of this instruction is determined by byte 134, bit 0 > >> of the Read Info block. This coincidentally expands into the space used > > > > "SCLP Read Info" > > > >> for CPU entries by taking away one byte, which means VMs running with > >> the diag318 capability will not be able to retrieve information regarding > >> the 248th CPU. This will not effect performance, and VMs can still be > >> ran with 248 CPUs. > > > > Are there other ways in which that might affect guests? I assume Linux > > can deal with it? Is it ok architecture-wise? > > > > In any case, should go into the patch description :) > > > > Same as above. I'll try to provide more information regarding what happens > here in my next reply. I think you can lift some stuff from the cover letter. > > >> > >> In order to simplify the migration and system reset requirements of > >> the diag318 data, let's introduce it as a device class and include > >> a VMStateDescription. > >> > >> Diag318 is set to 0 during modified clear and load normal resets. > > > > What exactly is set to 0? Stored values? > > > > Correct. "The stored values set by DIAG318 are reset to 0 during..." Sounds good. > > >> > >> Signed-off-by: Collin Walling <walling@linux.ibm.com> > >> --- > >> hw/s390x/Makefile.objs | 1 + > >> hw/s390x/diag318.c | 85 +++++++++++++++++++++++++++++++++++++ > >> hw/s390x/diag318.h | 40 +++++++++++++++++ > >> hw/s390x/s390-virtio-ccw.c | 17 ++++++++ > >> hw/s390x/sclp.c | 13 ++++++ > >> include/hw/s390x/sclp.h | 2 + > >> target/s390x/cpu_features.h | 1 + > >> target/s390x/cpu_features_def.inc.h | 3 ++ > >> target/s390x/gen-features.c | 1 + > >> target/s390x/kvm-stub.c | 10 +++++ > >> target/s390x/kvm.c | 29 +++++++++++++ > >> target/s390x/kvm_s390x.h | 2 + > >> 12 files changed, 204 insertions(+) > >> create mode 100644 hw/s390x/diag318.c > >> create mode 100644 hw/s390x/diag318.h > >> > > (...) > >> +static bool diag318_needed(void *opaque) > >> +{ > >> + return kvm_enabled() ? s390_has_feat(S390_FEAT_DIAG318) : 0; > > > > Why do you need to guard this with kvm_enabled()? If tcg does not > > enable the feature, we should be fine; and if it emulates this in the > > future, we probably need to migrate something anyway. > > > > Your explanation makes sense. My thoughts were to not even bother > registering the state description if KVM isn't enabled (but I guess > that thinking would mean that the other kvm_enabled fencing would > be redundant? Doh.) My thinking was along the lines how easy it would be to do some tcg implementation (not sure if that even makes sense.) > > I'll fix this. > > >> @@ -294,6 +307,9 @@ static void ccw_init(MachineState *machine) > >> > >> /* init the TOD clock */ > >> s390_init_tod(); > >> + > >> + /* init object used for migrating diag318 info */ > >> + s390_init_diag318(); > > > > Doesn't that device do a bit more than 'migrating' info? > > > > Also, it seems a bit useless unless you're running with kvm and the > > feature bit switched on... > > > > Right... I think this whole "diag318 device" thing needs some rethinking. > > I made a comment on David's response regarding where to but the VMStateDescription > code for diag318. Perhaps including the related information within the S390MachineState > would be better? (I'm not sure). Replied to David's mail. > >> @@ -37,10 +39,19 @@ static void prepare_cpu_entries(SCLPDevice *sclp, CPUEntry *entry, int *count) > >> { > >> MachineState *ms = MACHINE(qdev_get_machine()); > >> uint8_t features[SCCB_CPU_FEATURE_LEN] = { 0 }; > >> + int max_entries; > >> int i; > >> > >> + /* Calculate the max number of CPU entries that can be stored in the SCCB */ > >> + max_entries = (SCCB_SIZE - offsetof(ReadInfo, entries)) / sizeof(CPUEntry); > >> + > >> s390_get_feat_block(S390_FEAT_TYPE_SCLP_CPU, features); > >> for (i = 0, *count = 0; i < ms->possible_cpus->len; i++) { > >> + if (*count == max_entries) { > >> + warn_report("Configuration only supports a max of %d CPU entries.", > >> + max_entries); > > > > IIUC, this only moans during Read Info... but you could previously add > > more cpus than what could be serviced by Read Info. So, it looks to me > > you get some messages when a guest is doing Read Info; that seems more > > confusing than helpful to me. Can't we rather warn at cpu instantiation > > time? > > > > Ahh, I didn't think of that. For some reason, I was thinking that Read Info > would only be queried once. Linux probably only does it once, but there's nothing stopping a guest from doing it more often :) > > Yes, this makes sense. I'll relocate the warning message... > > >> + break; > >> + } > >> if (!ms->possible_cpus->cpus[i].cpu) { > >> continue; > >> }
On 27.01.20 18:29, Cornelia Huck wrote: > On Mon, 27 Jan 2020 18:09:11 +0100 > David Hildenbrand <david@redhat.com> wrote: > >>>>> +static void s390_diag318_reset(DeviceState *dev) >>>>> +{ >>>>> + if (kvm_enabled()) >>>>> + kvm_s390_set_diag318_info(0); >>>>> +} >>>>> + >>>>> +static void s390_diag318_class_init(ObjectClass *klass, void *data) >>>>> +{ >>>>> + DeviceClass *dc = DEVICE_CLASS(klass); >>>>> + >>>>> + dc->reset = s390_diag318_reset; >>>>> + dc->vmsd = &vmstate_diag318; >>>>> + dc->hotpluggable = false; >>>>> + /* Reason: Created automatically during machine instantiation */ >>>>> + dc->user_creatable = false; >>>>> +} >>>>> + >>>>> +static const TypeInfo s390_diag318_info = { >>>>> + .class_init = s390_diag318_class_init, >>>>> + .parent = TYPE_DEVICE, >>>>> + .name = TYPE_S390_DIAG318, >>>>> + .instance_size = sizeof(DIAG318State), >>>>> +}; >>>>> + >>>>> +static void s390_diag318_register_types(void) >>>>> +{ >>>>> + type_register_static(&s390_diag318_info); >>>>> +} >>>> >>>> Do we really need a new device? Can't we simply glue that extended state >>>> to the machine state? >>>> >>>> -> target/s390x/machine.c >>>> >>> >>> Those VM States relate to the CPU state... does it make sense to store the >>> diag318 info in a CPU state? (It doesn't seem necessary to store / migrate >>> this info for each CPU). >> >> I'm sorry, I was looking at the wrong file ... >> >>> >>> Should we store this in the S390CcwMachineState? Or perhaps create a generic >>> S390MachineState for information that needs to be stored once and migrated >>> once? >> >> ... I actually thought we have something like this already. Personally, >> I think that would make sense. At least spapr seems to have something >> like this already (hw/ppc/spapr.c:spapr_machine_init(). >> >> @Conny? > > What are you referring to? I only see the one with the FIXME in front > of it... That's the one I mean. The fixme states something about qdev ... but AFAIK that's only applicable if TYPE_DEVICE is involved. So maybe right now there is no other way than registering the vmstate directly.
On 1/27/20 12:55 PM, David Hildenbrand wrote: > On 27.01.20 18:29, Cornelia Huck wrote: >> On Mon, 27 Jan 2020 18:09:11 +0100 >> David Hildenbrand <david@redhat.com> wrote: >> >>>>>> +static void s390_diag318_reset(DeviceState *dev) >>>>>> +{ >>>>>> + if (kvm_enabled()) >>>>>> + kvm_s390_set_diag318_info(0); >>>>>> +} >>>>>> + >>>>>> +static void s390_diag318_class_init(ObjectClass *klass, void *data) >>>>>> +{ >>>>>> + DeviceClass *dc = DEVICE_CLASS(klass); >>>>>> + >>>>>> + dc->reset = s390_diag318_reset; >>>>>> + dc->vmsd = &vmstate_diag318; >>>>>> + dc->hotpluggable = false; >>>>>> + /* Reason: Created automatically during machine instantiation */ >>>>>> + dc->user_creatable = false; >>>>>> +} >>>>>> + >>>>>> +static const TypeInfo s390_diag318_info = { >>>>>> + .class_init = s390_diag318_class_init, >>>>>> + .parent = TYPE_DEVICE, >>>>>> + .name = TYPE_S390_DIAG318, >>>>>> + .instance_size = sizeof(DIAG318State), >>>>>> +}; >>>>>> + >>>>>> +static void s390_diag318_register_types(void) >>>>>> +{ >>>>>> + type_register_static(&s390_diag318_info); >>>>>> +} >>>>> >>>>> Do we really need a new device? Can't we simply glue that extended state >>>>> to the machine state? >>>>> >>>>> -> target/s390x/machine.c >>>>> >>>> >>>> Those VM States relate to the CPU state... does it make sense to store the >>>> diag318 info in a CPU state? (It doesn't seem necessary to store / migrate >>>> this info for each CPU). >>> >>> I'm sorry, I was looking at the wrong file ... >>> >>>> >>>> Should we store this in the S390CcwMachineState? Or perhaps create a generic >>>> S390MachineState for information that needs to be stored once and migrated >>>> once? >>> >>> ... I actually thought we have something like this already. Personally, >>> I think that would make sense. At least spapr seems to have something >>> like this already (hw/ppc/spapr.c:spapr_machine_init(). >>> >>> @Conny? >> >> What are you referring to? I only see the one with the FIXME in front >> of it... > > That's the one I mean. The fixme states something about qdev ... but > AFAIK that's only applicable if TYPE_DEVICE is involved. So maybe right > now there is no other way than registering the vmstate directly. > Hmm okay. I'll take a look at how spapr does it. I think I've registered a vmstate via register_savevm_live() in an earlier version, but had difficulties figuring out where to store the data. I'll revisit this approach. Thanks for the feedback!
On 1/27/20 1:21 PM, Collin Walling wrote: > On 1/27/20 12:55 PM, David Hildenbrand wrote: >> On 27.01.20 18:29, Cornelia Huck wrote: >>> On Mon, 27 Jan 2020 18:09:11 +0100 >>> David Hildenbrand <david@redhat.com> wrote: >>> >>>>>>> +static void s390_diag318_reset(DeviceState *dev) >>>>>>> +{ >>>>>>> + if (kvm_enabled()) >>>>>>> + kvm_s390_set_diag318_info(0); >>>>>>> +} >>>>>>> + >>>>>>> +static void s390_diag318_class_init(ObjectClass *klass, void *data) >>>>>>> +{ >>>>>>> + DeviceClass *dc = DEVICE_CLASS(klass); >>>>>>> + >>>>>>> + dc->reset = s390_diag318_reset; >>>>>>> + dc->vmsd = &vmstate_diag318; >>>>>>> + dc->hotpluggable = false; >>>>>>> + /* Reason: Created automatically during machine instantiation */ >>>>>>> + dc->user_creatable = false; >>>>>>> +} >>>>>>> + >>>>>>> +static const TypeInfo s390_diag318_info = { >>>>>>> + .class_init = s390_diag318_class_init, >>>>>>> + .parent = TYPE_DEVICE, >>>>>>> + .name = TYPE_S390_DIAG318, >>>>>>> + .instance_size = sizeof(DIAG318State), >>>>>>> +}; >>>>>>> + >>>>>>> +static void s390_diag318_register_types(void) >>>>>>> +{ >>>>>>> + type_register_static(&s390_diag318_info); >>>>>>> +} >>>>>> >>>>>> Do we really need a new device? Can't we simply glue that extended state >>>>>> to the machine state? >>>>>> >>>>>> -> target/s390x/machine.c >>>>>> >>>>> >>>>> Those VM States relate to the CPU state... does it make sense to store the >>>>> diag318 info in a CPU state? (It doesn't seem necessary to store / migrate >>>>> this info for each CPU). >>>> >>>> I'm sorry, I was looking at the wrong file ... >>>> >>>>> >>>>> Should we store this in the S390CcwMachineState? Or perhaps create a generic >>>>> S390MachineState for information that needs to be stored once and migrated >>>>> once? >>>> >>>> ... I actually thought we have something like this already. Personally, >>>> I think that would make sense. At least spapr seems to have something >>>> like this already (hw/ppc/spapr.c:spapr_machine_init(). >>>> >>>> @Conny? >>> >>> What are you referring to? I only see the one with the FIXME in front >>> of it... >> >> That's the one I mean. The fixme states something about qdev ... but >> AFAIK that's only applicable if TYPE_DEVICE is involved. So maybe right >> now there is no other way than registering the vmstate directly. >> > > Hmm okay. I'll take a look at how spapr does it. I think I've registered a > vmstate via register_savevm_live() in an earlier version, but had difficulties > figuring out where to store the data. I'll revisit this approach. > > Thanks for the feedback! > Err perhaps not entirely in this manner... docs/devel/migration.rst declares the register_savevm_live() function as the "legacy way" of doing things. I'll have to see how other VMStateDescriptions are modeled. I think vmstate_register() is what I want. Sorry for the confusion.
On 1/27/20 12:35 PM, Cornelia Huck wrote: > On Mon, 27 Jan 2020 11:39:02 -0500 > Collin Walling <walling@linux.ibm.com> wrote: > >> On 1/27/20 6:47 AM, Cornelia Huck wrote: >>> On Fri, 24 Jan 2020 17:14:04 -0500 >>> Collin Walling <walling@linux.ibm.com> wrote: >>> [...] >>>> >>>> The availability of this instruction is determined by byte 134, bit 0 >>>> of the Read Info block. This coincidentally expands into the space used >>> >>> "SCLP Read Info" >>> >>>> for CPU entries by taking away one byte, which means VMs running with >>>> the diag318 capability will not be able to retrieve information regarding >>>> the 248th CPU. This will not effect performance, and VMs can still be >>>> ran with 248 CPUs. >>> >>> Are there other ways in which that might affect guests? I assume Linux >>> can deal with it? Is it ok architecture-wise? >>> >>> In any case, should go into the patch description :) >>> >> >> Same as above. I'll try to provide more information regarding what happens >> here in my next reply. > > I think you can lift some stuff from the cover letter. > Here's what I found out: Each CPU entry holds info regarding the CPU's address / ID as well as an indication of the availability of certain CPU features. With these patches, we lose a CPU entry for one CPU (essentially what would be the CPU at the tail-end of the list). This CPU exists, but is essentially in limbo... the machine cannot access any information regarding it. So, a VM can run with the original N max CPUs, but in reality we can only utilize n-1. >> >>>> [...]
On Mon, 27 Jan 2020 13:52:48 -0500 Collin Walling <walling@linux.ibm.com> wrote: > On 1/27/20 1:21 PM, Collin Walling wrote: > > On 1/27/20 12:55 PM, David Hildenbrand wrote: > >> On 27.01.20 18:29, Cornelia Huck wrote: > >>> On Mon, 27 Jan 2020 18:09:11 +0100 > >>> David Hildenbrand <david@redhat.com> wrote: > >>>> ... I actually thought we have something like this already. Personally, > >>>> I think that would make sense. At least spapr seems to have something > >>>> like this already (hw/ppc/spapr.c:spapr_machine_init(). > >>>> > >>>> @Conny? > >>> > >>> What are you referring to? I only see the one with the FIXME in front > >>> of it... > >> > >> That's the one I mean. The fixme states something about qdev ... but > >> AFAIK that's only applicable if TYPE_DEVICE is involved. So maybe right > >> now there is no other way than registering the vmstate directly. > >> > > > > Hmm okay. I'll take a look at how spapr does it. I think I've registered a > > vmstate via register_savevm_live() in an earlier version, but had difficulties > > figuring out where to store the data. I'll revisit this approach. > > > > Thanks for the feedback! > > > > Err perhaps not entirely in this manner... > > docs/devel/migration.rst declares the register_savevm_live() function as the > "legacy way" of doing things. I'll have to see how other VMStateDescriptions > are modeled. I think vmstate_register() is what I want. > > Sorry for the confusion. Ok, I've now read what the FIXME actually says :) Since the machine does not inherit from device (but from object), vmstate_register() looks like the right thing to do.
On Mon, 27 Jan 2020 18:05:36 -0500 Collin Walling <walling@linux.ibm.com> wrote: > On 1/27/20 12:35 PM, Cornelia Huck wrote: > > On Mon, 27 Jan 2020 11:39:02 -0500 > > Collin Walling <walling@linux.ibm.com> wrote: > > > >> On 1/27/20 6:47 AM, Cornelia Huck wrote: > >>> On Fri, 24 Jan 2020 17:14:04 -0500 > >>> Collin Walling <walling@linux.ibm.com> wrote: > >>> > > [...] > > >>>> > >>>> The availability of this instruction is determined by byte 134, bit 0 > >>>> of the Read Info block. This coincidentally expands into the space used > >>> > >>> "SCLP Read Info" > >>> > >>>> for CPU entries by taking away one byte, which means VMs running with > >>>> the diag318 capability will not be able to retrieve information regarding > >>>> the 248th CPU. This will not effect performance, and VMs can still be > >>>> ran with 248 CPUs. > >>> > >>> Are there other ways in which that might affect guests? I assume Linux > >>> can deal with it? Is it ok architecture-wise? > >>> > >>> In any case, should go into the patch description :) > >>> > >> > >> Same as above. I'll try to provide more information regarding what happens > >> here in my next reply. > > > > I think you can lift some stuff from the cover letter. > > > > Here's what I found out: > > Each CPU entry holds info regarding the CPU's address / ID as well as an > indication of the availability of certain CPU features. With these patches, > we lose a CPU entry for one CPU (essentially what would be the CPU at the > tail-end of the list). This CPU exists, but is essentially in limbo... the > machine cannot access any information regarding it. s/machine/guest/ ? > > So, a VM can run with the original N max CPUs, but in reality we can only > utilize n-1. s/we/the guest/ ? With those changes, it makes sense to put your explanations into the patch description (for later reference). > > >> > >>>> > > [...] > >
On 1/27/20 12:35 PM, Cornelia Huck wrote: > On Mon, 27 Jan 2020 11:39:02 -0500 > Collin Walling <walling@linux.ibm.com> wrote: > >> On 1/27/20 6:47 AM, Cornelia Huck wrote: >>> On Fri, 24 Jan 2020 17:14:04 -0500 >>> Collin Walling <walling@linux.ibm.com> wrote: >>> >>>> DIAGNOSE 0x318 (diag318) is a privileged s390x instruction that must >>>> be intercepted by SIE and handled via KVM. Let's introduce some >>>> functions to communicate between QEMU and KVM via ioctls. These >>>> will be used to get/set the diag318 information. >>> >>> Do you want to give a hint what diag 318 actually does? >>> >> >> For the sake of completeness, I'll have to get back to you on this. >> The DIAGNOSE 318 instruction allows the guest to store diagnostic data that is collected by the firmware in the case of hardware/firmware service events. The instruction is invoked in the Linux kernel and intercepted in KVM. QEMU needs to collect this data for migration so that this data is consistent on the destination host. Perhaps I should add this to the patch description as well? :) [...]
On 1/28/20 6:24 AM, Cornelia Huck wrote: > On Mon, 27 Jan 2020 18:05:36 -0500 > Collin Walling <walling@linux.ibm.com> wrote: > >> On 1/27/20 12:35 PM, Cornelia Huck wrote: >>> On Mon, 27 Jan 2020 11:39:02 -0500 >>> Collin Walling <walling@linux.ibm.com> wrote: >>> >>>> On 1/27/20 6:47 AM, Cornelia Huck wrote: >>>>> On Fri, 24 Jan 2020 17:14:04 -0500 >>>>> Collin Walling <walling@linux.ibm.com> wrote: >>>>> >> >> [...] >> >>>>>> >>>>>> The availability of this instruction is determined by byte 134, bit 0 >>>>>> of the Read Info block. This coincidentally expands into the space used >>>>> >>>>> "SCLP Read Info" >>>>> >>>>>> for CPU entries by taking away one byte, which means VMs running with >>>>>> the diag318 capability will not be able to retrieve information regarding >>>>>> the 248th CPU. This will not effect performance, and VMs can still be >>>>>> ran with 248 CPUs. >>>>> >>>>> Are there other ways in which that might affect guests? I assume Linux >>>>> can deal with it? Is it ok architecture-wise? >>>>> >>>>> In any case, should go into the patch description :) >>>>> >>>> >>>> Same as above. I'll try to provide more information regarding what happens >>>> here in my next reply. >>> >>> I think you can lift some stuff from the cover letter. >>> >> >> Here's what I found out: >> >> Each CPU entry holds info regarding the CPU's address / ID as well as an >> indication of the availability of certain CPU features. With these patches, >> we lose a CPU entry for one CPU (essentially what would be the CPU at the >> tail-end of the list). This CPU exists, but is essentially in limbo... the >> machine cannot access any information regarding it. > > s/machine/guest/ ? > Correct. >> >> So, a VM can run with the original N max CPUs, but in reality we can only >> utilize n-1. > > s/we/the guest/ ? > Correct again. > With those changes, it makes sense to put your explanations into the > patch description (for later reference). > >> >>>> >>>>>> >> >> [...] >> >> > >
On Tue, 28 Jan 2020 09:37:46 -0500 Collin Walling <walling@linux.ibm.com> wrote: > On 1/27/20 12:35 PM, Cornelia Huck wrote: > > On Mon, 27 Jan 2020 11:39:02 -0500 > > Collin Walling <walling@linux.ibm.com> wrote: > > > >> On 1/27/20 6:47 AM, Cornelia Huck wrote: > >>> On Fri, 24 Jan 2020 17:14:04 -0500 > >>> Collin Walling <walling@linux.ibm.com> wrote: > >>> > >>>> DIAGNOSE 0x318 (diag318) is a privileged s390x instruction that must > >>>> be intercepted by SIE and handled via KVM. Let's introduce some > >>>> functions to communicate between QEMU and KVM via ioctls. These > >>>> will be used to get/set the diag318 information. > >>> > >>> Do you want to give a hint what diag 318 actually does? > >>> > >> > >> For the sake of completeness, I'll have to get back to you on this. > >> > > The DIAGNOSE 318 instruction allows the guest to store diagnostic data > that is collected by the firmware in the case of hardware/firmware > service events. The instruction is invoked in the Linux kernel and > intercepted in KVM. QEMU needs to collect this data for migration > so that this data is consistent on the destination host. > > Perhaps I should add this to the patch description as well? :) Yes, please :) It will make things easier for any unfortunate soul wanting to find out what this is about in the future.
diff --git a/hw/s390x/Makefile.objs b/hw/s390x/Makefile.objs index e02ed80..93621dc 100644 --- a/hw/s390x/Makefile.objs +++ b/hw/s390x/Makefile.objs @@ -34,3 +34,4 @@ obj-$(CONFIG_KVM) += s390-stattrib-kvm.o obj-y += s390-ccw.o obj-y += ap-device.o obj-y += ap-bridge.o +obj-y += diag318.o diff --git a/hw/s390x/diag318.c b/hw/s390x/diag318.c new file mode 100644 index 0000000..2d30bb2 --- /dev/null +++ b/hw/s390x/diag318.c @@ -0,0 +1,85 @@ +/* + * DIAGNOSE 0x318 functions for reset and migration + * + * Copyright IBM, Corp. 2019 + * + * Authors: + * Collin Walling <walling@linux.ibm.com> + * + * This work is licensed under the terms of the GNU GPL, version 2 or (at your + * option) any later version. See the COPYING file in the top-level directory. + */ + +#include "hw/s390x/diag318.h" +#include "qapi/error.h" +#include "kvm_s390x.h" +#include "sysemu/kvm.h" + +static int diag318_post_load(void *opaque, int version_id) +{ + DIAG318State *d = opaque; + + if (kvm_enabled()) + kvm_s390_set_diag318_info(d->info); + + return 0; +} + +static int diag318_pre_save(void *opaque) +{ + DIAG318State *d = opaque; + + if (kvm_enabled()) + kvm_s390_get_diag318_info(&d->info); + + return 0; +} + +static bool diag318_needed(void *opaque) +{ + return kvm_enabled() ? s390_has_feat(S390_FEAT_DIAG318) : 0; +} + +const VMStateDescription vmstate_diag318 = { + .name = "vmstate_diag318", + .post_load = diag318_post_load, + .pre_save = diag318_pre_save, + .version_id = 1, + .minimum_version_id = 1, + .needed = diag318_needed, + .fields = (VMStateField[]) { + VMSTATE_UINT64(info, DIAG318State), + VMSTATE_END_OF_LIST() + } +}; + +static void s390_diag318_reset(DeviceState *dev) +{ + if (kvm_enabled()) + kvm_s390_set_diag318_info(0); +} + +static void s390_diag318_class_init(ObjectClass *klass, void *data) +{ + DeviceClass *dc = DEVICE_CLASS(klass); + + dc->reset = s390_diag318_reset; + dc->vmsd = &vmstate_diag318; + dc->hotpluggable = false; + /* Reason: Created automatically during machine instantiation */ + dc->user_creatable = false; +} + +static const TypeInfo s390_diag318_info = { + .class_init = s390_diag318_class_init, + .parent = TYPE_DEVICE, + .name = TYPE_S390_DIAG318, + .instance_size = sizeof(DIAG318State), +}; + +static void s390_diag318_register_types(void) +{ + type_register_static(&s390_diag318_info); +} + +type_init(s390_diag318_register_types) diff --git a/hw/s390x/diag318.h b/hw/s390x/diag318.h new file mode 100644 index 0000000..06d9f67 --- /dev/null +++ b/hw/s390x/diag318.h @@ -0,0 +1,40 @@ +/* + * DIAGNOSE 0x318 functions for reset and migration + * + * Copyright IBM, Corp. 2019 + * + * Authors: + * Collin Walling <walling@linux.ibm.com> + * + * This work is licensed under the terms of the GNU GPL, version 2 or (at your + * option) any later version. See the COPYING file in the top-level directory. + */ + +#ifndef HW_DIAG318_H +#define HW_DIAG318_H + +#include "qemu/osdep.h" +#include "migration/vmstate.h" +#include "qom/object.h" +#include "hw/qdev-core.h" + +#define TYPE_S390_DIAG318 "diag318" +#define DIAG318(obj) \ + OBJECT_CHECK(DIAG318State, (obj), TYPE_S390_DIAG318) + +typedef struct DIAG318State { + /*< private >*/ + DeviceState parent_obj; + + /*< public >*/ + uint64_t info; +} DIAG318State; + +typedef struct DIAG318Class { + /*< private >*/ + DeviceClass parent_class; + + /*< public >*/ +} DIAG318Class; + +#endif /* HW_DIAG318_H */ \ No newline at end of file diff --git a/hw/s390x/s390-virtio-ccw.c b/hw/s390x/s390-virtio-ccw.c index e0e2813..d5b7a33 100644 --- a/hw/s390x/s390-virtio-ccw.c +++ b/hw/s390x/s390-virtio-ccw.c @@ -41,6 +41,7 @@ #include "hw/qdev-properties.h" #include "hw/s390x/tod.h" #include "sysemu/sysemu.h" +#include "hw/s390x/diag318.h" S390CPU *s390_cpu_addr2state(uint16_t cpu_addr) { @@ -97,6 +98,7 @@ static const char *const reset_dev_types[] = { "s390-sclp-event-facility", "s390-flic", "diag288", + TYPE_S390_DIAG318, }; static void subsystem_reset(void) @@ -237,6 +239,17 @@ static void s390_create_sclpconsole(const char *type, Chardev *chardev) qdev_init_nofail(dev); } +static void s390_init_diag318(void) +{ + Object *new = object_new(TYPE_S390_DIAG318); + DeviceState *dev = DEVICE(new); + + object_property_add_child(qdev_get_machine(), TYPE_S390_DIAG318, + new, NULL); + object_unref(new); + qdev_init_nofail(dev); +} + static void ccw_init(MachineState *machine) { int ret; @@ -294,6 +307,9 @@ static void ccw_init(MachineState *machine) /* init the TOD clock */ s390_init_tod(); + + /* init object used for migrating diag318 info */ + s390_init_diag318(); } static void s390_cpu_plug(HotplugHandler *hotplug_dev, @@ -566,6 +582,7 @@ static void machine_set_loadparm(Object *obj, const char *val, Error **errp) ms->loadparm[i] = ' '; /* pad right with spaces */ } } + static inline void s390_machine_initfn(Object *obj) { object_property_add_bool(obj, "aes-key-wrap", diff --git a/hw/s390x/sclp.c b/hw/s390x/sclp.c index f57ce7b..636348c 100644 --- a/hw/s390x/sclp.c +++ b/hw/s390x/sclp.c @@ -15,6 +15,7 @@ #include "qemu/osdep.h" #include "qemu/units.h" #include "qapi/error.h" +#include "qemu/error-report.h" #include "cpu.h" #include "sysemu/sysemu.h" #include "hw/boards.h" @@ -22,6 +23,7 @@ #include "hw/s390x/event-facility.h" #include "hw/s390x/s390-pci-bus.h" #include "hw/s390x/ipl.h" +#include "kvm_s390x.h" static inline SCLPDevice *get_sclp_device(void) { @@ -37,10 +39,19 @@ static void prepare_cpu_entries(SCLPDevice *sclp, CPUEntry *entry, int *count) { MachineState *ms = MACHINE(qdev_get_machine()); uint8_t features[SCCB_CPU_FEATURE_LEN] = { 0 }; + int max_entries; int i; + /* Calculate the max number of CPU entries that can be stored in the SCCB */ + max_entries = (SCCB_SIZE - offsetof(ReadInfo, entries)) / sizeof(CPUEntry); + s390_get_feat_block(S390_FEAT_TYPE_SCLP_CPU, features); for (i = 0, *count = 0; i < ms->possible_cpus->len; i++) { + if (*count == max_entries) { + warn_report("Configuration only supports a max of %d CPU entries.", + max_entries); + break; + } if (!ms->possible_cpus->cpus[i].cpu) { continue; } @@ -80,6 +91,8 @@ static void read_SCP_info(SCLPDevice *sclp, SCCB *sccb) s390_get_feat_block(S390_FEAT_TYPE_SCLP_CONF_CHAR_EXT, read_info->conf_char_ext); + s390_get_feat_block(S390_FEAT_TYPE_SCLP_BYTE_134, read_info->byte_134); + read_info->facilities = cpu_to_be64(SCLP_HAS_CPU_INFO | SCLP_HAS_IOA_RECONFIG); diff --git a/include/hw/s390x/sclp.h b/include/hw/s390x/sclp.h index c54413b..08813b4 100644 --- a/include/hw/s390x/sclp.h +++ b/include/hw/s390x/sclp.h @@ -132,6 +132,8 @@ typedef struct ReadInfo { uint16_t highest_cpu; uint8_t _reserved5[124 - 122]; /* 122-123 */ uint32_t hmfai; + uint8_t _reserved7[134 - 128]; /* 128-133 */ + uint8_t byte_134[1]; struct CPUEntry entries[0]; } QEMU_PACKED ReadInfo; diff --git a/target/s390x/cpu_features.h b/target/s390x/cpu_features.h index da695a8..954544e 100644 --- a/target/s390x/cpu_features.h +++ b/target/s390x/cpu_features.h @@ -23,6 +23,7 @@ typedef enum { S390_FEAT_TYPE_STFL, S390_FEAT_TYPE_SCLP_CONF_CHAR, S390_FEAT_TYPE_SCLP_CONF_CHAR_EXT, + S390_FEAT_TYPE_SCLP_BYTE_134, S390_FEAT_TYPE_SCLP_CPU, S390_FEAT_TYPE_MISC, S390_FEAT_TYPE_PLO, diff --git a/target/s390x/cpu_features_def.inc.h b/target/s390x/cpu_features_def.inc.h index 31dff0d..13d8da5 100644 --- a/target/s390x/cpu_features_def.inc.h +++ b/target/s390x/cpu_features_def.inc.h @@ -120,6 +120,9 @@ DEF_FEAT(SIE_CMMA, "cmma", SCLP_CONF_CHAR_EXT, 1, "SIE: Collaborative-memory-man DEF_FEAT(SIE_PFMFI, "pfmfi", SCLP_CONF_CHAR_EXT, 9, "SIE: PFMF interpretation facility") DEF_FEAT(SIE_IBS, "ibs", SCLP_CONF_CHAR_EXT, 10, "SIE: Interlock-and-broadcast-suppression facility") +/* Features exposed via SCLP SCCB Byte 134 (bit numbers relative to byte-134) */ +DEF_FEAT(DIAG318, "diag318", SCLP_BYTE_134, 0, "Control program name and version codes") + /* Features exposed via SCLP CPU info. */ DEF_FEAT(SIE_F2, "sief2", SCLP_CPU, 4, "SIE: interception format 2 (Virtual SIE)") DEF_FEAT(SIE_SKEY, "skey", SCLP_CPU, 5, "SIE: Storage-key facility") diff --git a/target/s390x/gen-features.c b/target/s390x/gen-features.c index 6278845..eaf91e6 100644 --- a/target/s390x/gen-features.c +++ b/target/s390x/gen-features.c @@ -522,6 +522,7 @@ static uint16_t full_GEN12_GA1[] = { S390_FEAT_AP_QUEUE_INTERRUPT_CONTROL, S390_FEAT_AP_FACILITIES_TEST, S390_FEAT_AP, + S390_FEAT_DIAG318, }; static uint16_t full_GEN12_GA2[] = { diff --git a/target/s390x/kvm-stub.c b/target/s390x/kvm-stub.c index 5152e2b..7c39d6a 100644 --- a/target/s390x/kvm-stub.c +++ b/target/s390x/kvm-stub.c @@ -107,3 +107,13 @@ void kvm_s390_stop_interrupt(S390CPU *cpu) void kvm_s390_restart_interrupt(S390CPU *cpu) { } + +int kvm_s390_get_diag318_info(uint64_t *info) +{ + return 0; +} + +int kvm_s390_set_diag318_info(uint64_t info) +{ + return 0; +} diff --git a/target/s390x/kvm.c b/target/s390x/kvm.c index 15260ae..abc9dc2 100644 --- a/target/s390x/kvm.c +++ b/target/s390x/kvm.c @@ -775,6 +775,28 @@ int kvm_s390_set_clock_ext(uint8_t tod_high, uint64_t tod_low) return kvm_vm_ioctl(kvm_state, KVM_SET_DEVICE_ATTR, &attr); } +int kvm_s390_get_diag318_info(uint64_t *info) +{ + struct kvm_device_attr attr = { + .group = KVM_S390_VM_MISC, + .attr = KVM_S390_VM_MISC_DIAG318, + .addr = (uint64_t)info, + }; + + return kvm_vm_ioctl(kvm_state, KVM_GET_DEVICE_ATTR, &attr); +} + +int kvm_s390_set_diag318_info(uint64_t info) +{ + struct kvm_device_attr attr = { + .group = KVM_S390_VM_MISC, + .attr = KVM_S390_VM_MISC_DIAG318, + .addr = (uint64_t)&info, + }; + + return kvm_vm_ioctl(kvm_state, KVM_SET_DEVICE_ATTR, &attr); +} + /** * kvm_s390_mem_op: * @addr: the logical start address in guest memory @@ -2347,6 +2369,13 @@ void kvm_s390_get_host_cpu_model(S390CPUModel *model, Error **errp) KVM_S390_VM_CRYPTO_ENABLE_APIE)) { set_bit(S390_FEAT_AP, model->features); } + + /* if KVM supports interception of diag318, then let's provide the bit */ + if (kvm_vm_check_attr(kvm_state, KVM_S390_VM_MISC, + KVM_S390_VM_MISC_DIAG318)) { + set_bit(S390_FEAT_DIAG318, model->features); + } + /* strip of features that are not part of the maximum model */ bitmap_and(model->features, model->features, model->def->full_feat, S390_FEAT_MAX); diff --git a/target/s390x/kvm_s390x.h b/target/s390x/kvm_s390x.h index caf9859..50df93e 100644 --- a/target/s390x/kvm_s390x.h +++ b/target/s390x/kvm_s390x.h @@ -29,6 +29,8 @@ int kvm_s390_get_clock(uint8_t *tod_high, uint64_t *tod_clock); int kvm_s390_get_clock_ext(uint8_t *tod_high, uint64_t *tod_clock); int kvm_s390_set_clock(uint8_t tod_high, uint64_t tod_clock); int kvm_s390_set_clock_ext(uint8_t tod_high, uint64_t tod_clock); +int kvm_s390_get_diag318_info(uint64_t *info); +int kvm_s390_set_diag318_info(uint64_t info); void kvm_s390_enable_css_support(S390CPU *cpu); int kvm_s390_assign_subch_ioeventfd(EventNotifier *notifier, uint32_t sch, int vq, bool assign);
DIAGNOSE 0x318 (diag318) is a privileged s390x instruction that must be intercepted by SIE and handled via KVM. Let's introduce some functions to communicate between QEMU and KVM via ioctls. These will be used to get/set the diag318 information. The availability of this instruction is determined by byte 134, bit 0 of the Read Info block. This coincidentally expands into the space used for CPU entries by taking away one byte, which means VMs running with the diag318 capability will not be able to retrieve information regarding the 248th CPU. This will not effect performance, and VMs can still be ran with 248 CPUs. In order to simplify the migration and system reset requirements of the diag318 data, let's introduce it as a device class and include a VMStateDescription. Diag318 is set to 0 during modified clear and load normal resets. Signed-off-by: Collin Walling <walling@linux.ibm.com> --- hw/s390x/Makefile.objs | 1 + hw/s390x/diag318.c | 85 +++++++++++++++++++++++++++++++++++++ hw/s390x/diag318.h | 40 +++++++++++++++++ hw/s390x/s390-virtio-ccw.c | 17 ++++++++ hw/s390x/sclp.c | 13 ++++++ include/hw/s390x/sclp.h | 2 + target/s390x/cpu_features.h | 1 + target/s390x/cpu_features_def.inc.h | 3 ++ target/s390x/gen-features.c | 1 + target/s390x/kvm-stub.c | 10 +++++ target/s390x/kvm.c | 29 +++++++++++++ target/s390x/kvm_s390x.h | 2 + 12 files changed, 204 insertions(+) create mode 100644 hw/s390x/diag318.c create mode 100644 hw/s390x/diag318.h