
* Update to QEMU v9.0.0 --------- Signed-off-by: Peter Maydell <peter.maydell@linaro.org> Signed-off-by: Fabiano Rosas <farosas@suse.de> Signed-off-by: Peter Xu <peterx@redhat.com> Signed-off-by: Thomas Huth <thuth@redhat.com> Signed-off-by: Cédric Le Goater <clg@redhat.com> Signed-off-by: Zheyu Ma <zheyuma97@gmail.com> Signed-off-by: Ido Plat <ido.plat@ibm.com> Signed-off-by: Ilya Leoshkevich <iii@linux.ibm.com> Signed-off-by: Markus Armbruster <armbru@redhat.com> Signed-off-by: Marc-André Lureau <marcandre.lureau@redhat.com> Signed-off-by: Paolo Bonzini <pbonzini@redhat.com> Signed-off-by: Vladimir Sementsov-Ogievskiy <vsementsov@yandex-team.ru> Signed-off-by: David Hildenbrand <david@redhat.com> Signed-off-by: Kevin Wolf <kwolf@redhat.com> Signed-off-by: Thomas Lamprecht <t.lamprecht@proxmox.com> Signed-off-by: Fiona Ebner <f.ebner@proxmox.com> Signed-off-by: Gregory Price <gregory.price@memverge.com> Signed-off-by: Jonathan Cameron <Jonathan.Cameron@huawei.com> Signed-off-by: Philippe Mathieu-Daudé <philmd@linaro.org> Signed-off-by: Lorenz Brun <lorenz@brun.one> Signed-off-by: Yao Xingtao <yaoxt.fnst@fujitsu.com> Signed-off-by: Arnaud Minier <arnaud.minier@telecom-paris.fr> Signed-off-by: Inès Varhol <ines.varhol@telecom-paris.fr> Signed-off-by: BALATON Zoltan <balaton@eik.bme.hu> Signed-off-by: Igor Mammedov <imammedo@redhat.com> Signed-off-by: Akihiko Odaki <akihiko.odaki@daynix.com> Signed-off-by: Richard Henderson <richard.henderson@linaro.org> Signed-off-by: Sven Schnelle <svens@stackframe.org> Signed-off-by: Daniel Henrique Barboza <dbarboza@ventanamicro.com> Signed-off-by: Christian Schoenebeck <qemu_oss@crudebyte.com> Signed-off-by: Jason Wang <jasowang@redhat.com> Signed-off-by: Helge Deller <deller@gmx.de> Signed-off-by: Nicholas Piggin <npiggin@gmail.com> Signed-off-by: Benjamin Gray <bgray@linux.ibm.com> Signed-off-by: Avihai Horon <avihaih@nvidia.com> Signed-off-by: Michael Tokarev <mjt@tls.msk.ru> Signed-off-by: Joonas Kankaala 
<joonas.a.kankaala@gmail.com> Signed-off-by: Marcin Juszkiewicz <marcin.juszkiewicz@linaro.org> Signed-off-by: Stefan Weil <sw@weilnetz.de> Signed-off-by: Zhao Liu <zhao1.liu@intel.com> Signed-off-by: Glenn Miles <milesg@linux.ibm.com> Signed-off-by: Oleg Sviridov <oleg.sviridov@red-soft.ru> Signed-off-by: Artem Chernyshev <artem.chernyshev@red-soft.ru> Signed-off-by: Yajun Wu <yajunw@nvidia.com> Signed-off-by: Stefan Hajnoczi <stefanha@redhat.com> Signed-off-by: Mark Cave-Ayland <mark.cave-ayland@ilande.co.uk> Signed-off-by: Pierre-Clément Tosi <ptosi@google.com> Signed-off-by: Lei Wang <lei4.wang@intel.com> Signed-off-by: Wei Wang <wei.w.wang@intel.com> Signed-off-by: Martin Hundebøll <martin@geanix.com> Signed-off-by: Michael S. Tsirkin <mst@redhat.com> Signed-off-by: Manos Pitsidianakis <manos.pitsidianakis@linaro.org> Signed-off-by: Wafer <wafer@jaguarmicro.com> Signed-off-by: Yuxue Liu <yuxue.liu@jaguarmicro.com> Signed-off-by: Gerd Hoffmann <kraxel@redhat.com> Signed-off-by: Nguyen Dinh Phi <phind.uet@gmail.com> Signed-off-by: Zack Buhman <zack@buhman.org> Signed-off-by: Keith Packard <keithp@keithp.com> Signed-off-by: Yuquan Wang wangyuquan1236@phytium.com.cn Signed-off-by: Matheus Tavares Bernardino <quic_mathbern@quicinc.com> Signed-off-by: Cindy Lu <lulu@redhat.com> Co-authored-by: Peter Maydell <peter.maydell@linaro.org> Co-authored-by: Fabiano Rosas <farosas@suse.de> Co-authored-by: Peter Xu <peterx@redhat.com> Co-authored-by: Thomas Huth <thuth@redhat.com> Co-authored-by: Cédric Le Goater <clg@redhat.com> Co-authored-by: Zheyu Ma <zheyuma97@gmail.com> Co-authored-by: Ido Plat <ido.plat@ibm.com> Co-authored-by: Ilya Leoshkevich <iii@linux.ibm.com> Co-authored-by: Markus Armbruster <armbru@redhat.com> Co-authored-by: Marc-André Lureau <marcandre.lureau@redhat.com> Co-authored-by: Paolo Bonzini <pbonzini@redhat.com> Co-authored-by: Vladimir Sementsov-Ogievskiy <vsementsov@yandex-team.ru> Co-authored-by: David Hildenbrand <david@redhat.com> 
Co-authored-by: Kevin Wolf <kwolf@redhat.com> Co-authored-by: Stefan Reiter <s.reiter@proxmox.com> Co-authored-by: Fiona Ebner <f.ebner@proxmox.com> Co-authored-by: Gregory Price <gregory.price@memverge.com> Co-authored-by: Lorenz Brun <lorenz@brun.one> Co-authored-by: Yao Xingtao <yaoxt.fnst@fujitsu.com> Co-authored-by: Philippe Mathieu-Daudé <philmd@linaro.org> Co-authored-by: Arnaud Minier <arnaud.minier@telecom-paris.fr> Co-authored-by: BALATON Zoltan <balaton@eik.bme.hu> Co-authored-by: Igor Mammedov <imammedo@redhat.com> Co-authored-by: Akihiko Odaki <akihiko.odaki@daynix.com> Co-authored-by: Richard Henderson <richard.henderson@linaro.org> Co-authored-by: Sven Schnelle <svens@stackframe.org> Co-authored-by: Daniel Henrique Barboza <dbarboza@ventanamicro.com> Co-authored-by: Helge Deller <deller@kernel.org> Co-authored-by: Harsh Prateek Bora <harshpb@linux.ibm.com> Co-authored-by: Benjamin Gray <bgray@linux.ibm.com> Co-authored-by: Nicholas Piggin <npiggin@gmail.com> Co-authored-by: Avihai Horon <avihaih@nvidia.com> Co-authored-by: Michael Tokarev <mjt@tls.msk.ru> Co-authored-by: Joonas Kankaala <joonas.a.kankaala@gmail.com> Co-authored-by: Marcin Juszkiewicz <marcin.juszkiewicz@linaro.org> Co-authored-by: Stefan Weil <sw@weilnetz.de> Co-authored-by: Dayu Liu <liu.dayu@zte.com.cn> Co-authored-by: Zhao Liu <zhao1.liu@intel.com> Co-authored-by: Glenn Miles <milesg@linux.vnet.ibm.com> Co-authored-by: Artem Chernyshev <artem.chernyshev@red-soft.ru> Co-authored-by: Yajun Wu <yajunw@nvidia.com> Co-authored-by: Mark Cave-Ayland <mark.cave-ayland@ilande.co.uk> Co-authored-by: Pierre-Clément Tosi <ptosi@google.com> Co-authored-by: Wei Wang <wei.w.wang@intel.com> Co-authored-by: Martin Hundebøll <martin@geanix.com> Co-authored-by: Michael S. 
Tsirkin <mst@redhat.com> Co-authored-by: Manos Pitsidianakis <manos.pitsidianakis@linaro.org> Co-authored-by: Wafer <wafer@jaguarmicro.com> Co-authored-by: lyx634449800 <yuxue.liu@jaguarmicro.com> Co-authored-by: Gerd Hoffmann <kraxel@redhat.com> Co-authored-by: Nguyen Dinh Phi <phind.uet@gmail.com> Co-authored-by: Zack Buhman <zack@buhman.org> Co-authored-by: Keith Packard <keithp@keithp.com> Co-authored-by: Yuquan Wang <wangyuquan1236@phytium.com.cn> Co-authored-by: Matheus Tavares Bernardino <quic_mathbern@quicinc.com> Co-authored-by: Cindy Lu <lulu@redhat.com>
353 lines
9.6 KiB
C
353 lines
9.6 KiB
C
/*
|
|
* QEMU sPAPR PCI host for VFIO
|
|
*
|
|
* Copyright (c) 2011-2014 Alexey Kardashevskiy, IBM Corporation.
|
|
*
|
|
* This program is free software; you can redistribute it and/or modify
|
|
* it under the terms of the GNU General Public License as published by
|
|
* the Free Software Foundation; either version 2 of the License,
|
|
* or (at your option) any later version.
|
|
*
|
|
* This program is distributed in the hope that it will be useful,
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
* GNU General Public License for more details.
|
|
*
|
|
* You should have received a copy of the GNU General Public License
|
|
* along with this program; if not, see <http://www.gnu.org/licenses/>.
|
|
*/
|
|
|
|
#include "qemu/osdep.h"
|
|
#include <sys/ioctl.h>
|
|
#include <linux/vfio.h>
|
|
#include "hw/ppc/spapr.h"
|
|
#include "hw/pci-host/spapr.h"
|
|
#include "hw/pci/msix.h"
|
|
#include "hw/pci/pci_device.h"
|
|
#include "hw/vfio/vfio-common.h"
|
|
#include "qemu/error-report.h"
|
|
#include CONFIG_DEVICES /* CONFIG_VFIO_PCI */
|
|
|
|
/*
|
|
* Interfaces for IBM EEH (Enhanced Error Handling)
|
|
*/
|
|
#ifdef CONFIG_VFIO_PCI
|
|
/*
 * Tell whether EEH operations may be issued on @container.
 *
 * As of 2016-03-04 (linux-4.5) the host kernel EEH/VFIO implementation
 * is broken if there are multiple groups in a container.  The hardware
 * works in units of Partitionable Endpoints (== IOMMU groups) and the
 * EEH operations naively iterate across all groups in the container,
 * without any logic to make sure the groups have their state
 * synchronized.  For certain operations (ENABLE) that might be ok,
 * until an error occurs, but for others (GET_STATE) it's clearly broken.
 *
 * XXX Once fixed kernels exist, test for them here
 *
 * Returns: true only if the container's group list holds exactly one
 * group, false if it is empty or holds more than one.
 */
static bool vfio_eeh_container_ok(VFIOContainer *container)
{
    /* The emptiness test short-circuits, so QLIST_FIRST() is never NULL. */
    return !QLIST_EMPTY(&container->group_list) &&
           !QLIST_NEXT(QLIST_FIRST(&container->group_list), container_next);
}
|
|
|
|
/*
 * Issue the VFIO_EEH_PE_OP ioctl with operation code @op on the file
 * descriptor of @container.
 *
 * The request is refused up front unless vfio_eeh_container_ok()
 * accepts the container.
 *
 * Returns: the non-negative ioctl() result on success, -EPERM if the
 * container is not acceptable, or the negated errno of the failed
 * ioctl().
 */
static int vfio_eeh_container_op(VFIOContainer *container, uint32_t op)
{
    struct vfio_eeh_pe_op pe_op = {
        .argsz = sizeof(pe_op),
        .op = op,
    };
    int ret;

    if (!vfio_eeh_container_ok(container)) {
        error_report("vfio/eeh: EEH_PE_OP 0x%x: "
                     "kernel requires a container with exactly one group", op);
        return -EPERM;
    }

    ret = ioctl(container->fd, VFIO_EEH_PE_OP, &pe_op);
    if (ret < 0) {
        /*
         * Capture errno before reporting: error_report() may call into
         * library code that overwrites it, which would corrupt the
         * value returned to the caller.
         */
        int saved_errno = errno;

        error_report("vfio/eeh: EEH_PE_OP 0x%x failed: %m", op);
        return -saved_errno;
    }

    return ret;
}
|
|
|
|
/*
 * Find the single VFIO container backing address space @as.
 *
 * The VFIO address space is looked up with vfio_get_address_space() and
 * handed back with vfio_put_address_space() before returning.
 *
 * Returns: the container if the address space has exactly one, or NULL
 * if it has none or more than one.
 */
static VFIOContainer *vfio_eeh_as_container(AddressSpace *as)
{
    VFIOAddressSpace *space = vfio_get_address_space(as);
    VFIOContainerBase *bcontainer = NULL;

    if (QLIST_EMPTY(&space->containers)) {
        /* No containers to act on */
        goto out;
    }

    bcontainer = QLIST_FIRST(&space->containers);

    if (QLIST_NEXT(bcontainer, next)) {
        /*
         * We don't yet have logic to synchronize EEH state across
         * multiple containers
         */
        bcontainer = NULL;
        goto out;
    }

out:
    vfio_put_address_space(space);

    /*
     * Do not feed NULL to container_of(): the result would only be NULL
     * if the embedded member sits at offset 0 of VFIOContainer, and
     * callers rely on a genuine NULL to detect "no usable container".
     */
    if (!bcontainer) {
        return NULL;
    }
    return container_of(bcontainer, VFIOContainer, bcontainer);
}
|
|
|
|
/*
 * Tell whether EEH can be used on address space @as: it must resolve to
 * a single container, and that container must pass
 * vfio_eeh_container_ok().
 */
static bool vfio_eeh_as_ok(AddressSpace *as)
{
    VFIOContainer *c = vfio_eeh_as_container(as);

    if (!c) {
        return false;
    }
    return vfio_eeh_container_ok(c);
}
|
|
|
|
/*
 * Run EEH operation @op on the single container behind address
 * space @as.
 *
 * Returns: -ENODEV if no usable container is found, otherwise whatever
 * vfio_eeh_container_op() returns.
 */
static int vfio_eeh_as_op(AddressSpace *as, uint32_t op)
{
    VFIOContainer *c = vfio_eeh_as_container(as);

    return c ? vfio_eeh_container_op(c, op) : -ENODEV;
}
|
|
|
|
/*
 * Report whether EEH is usable for the IOMMU address space of @sphb,
 * as decided by vfio_eeh_as_ok().
 */
bool spapr_phb_eeh_available(SpaprPhbState *sphb)
{
    bool available = vfio_eeh_as_ok(&sphb->iommu_as);

    return available;
}
|
|
|
|
/*
 * Issue VFIO_EEH_PE_ENABLE on the IOMMU address space of @sphb.
 * The result of the operation is not checked.
 */
static void spapr_phb_vfio_eeh_reenable(SpaprPhbState *sphb)
{
    vfio_eeh_as_op(&sphb->iommu_as, VFIO_EEH_PE_ENABLE);
}
|
|
|
|
/*
 * Reset hook for the sPAPR PCI host bridge @qdev.
 *
 * The PE might still be frozen at this point.  Re-enabling EEH on it
 * clears the frozen state, so that the PCI devices it contains work
 * properly after reboot.
 */
void spapr_phb_vfio_reset(DeviceState *qdev)
{
    spapr_phb_vfio_eeh_reenable(SPAPR_PCI_HOST_BRIDGE(qdev));
}
|
|
|
|
/*
 * Per-device callback: set the bool pointed to by @opaque to true when
 * @pdev is a "vfio-pci" object.  The flag is never cleared here, and
 * @bus is unused.
 */
static void spapr_eeh_pci_find_device(PCIBus *bus, PCIDevice *pdev,
                                      void *opaque)
{
    if (object_dynamic_cast(OBJECT(pdev), "vfio-pci") != NULL) {
        *(bool *)opaque = true;
    }
}
|
|
|
|
/*
 * Check whether a "vfio-pci" device is present on the bus of @sphb
 * selected by bits 16..23 of @addr.
 */
static bool spapr_phb_vfio_eeh_has_vfio_dev(SpaprPhbState *sphb,
                                            unsigned int addr)
{
    PCIHostState *phb = PCI_HOST_BRIDGE(sphb);
    bool found = false;

    pci_for_each_device(phb->bus, (addr >> 16) & 0xFF,
                        spapr_eeh_pci_find_device, &found);
    return found;
}

/*
 * Translate the RTAS EEH @option into the matching VFIO EEH PE
 * operation and run it on the IOMMU address space of @sphb.
 *
 * Returns: RTAS_OUT_SUCCESS on success, RTAS_OUT_PARAM_ERROR for an
 * unknown @option or when RTAS_EEH_ENABLE finds no vfio-pci device on
 * the addressed bus, RTAS_OUT_HW_ERROR if the VFIO operation fails.
 */
int spapr_phb_vfio_eeh_set_option(SpaprPhbState *sphb,
                                  unsigned int addr, int option)
{
    uint32_t op;

    switch (option) {
    case RTAS_EEH_DISABLE:
        op = VFIO_EEH_PE_DISABLE;
        break;
    case RTAS_EEH_ENABLE:
        /*
         * EEH is enabled at sphb level, not per PCI device.  This sphb
         * was already picked from the buid given to the
         * ibm,set-eeh-option rtas call, so all that is left is to
         * validate the PCI pass-through devices (vfio-pci) under this
         * sphb bus.  That every device under this sphb belongs to the
         * same iommu group (same PE) has been validated before we get
         * here.
         *
         * Prior to linux commit 98ba956f6a389 ("powerpc/pseries/eeh:
         * Rework device EEH PE determination") the kernel called
         * eeh-set-option once per device in the PE, passing the
         * device's config_address instead of the PE address.  Checking
         * that the supplied config_addr matches this PHB would
         * therefore break kernels v5.9 and older: if eeh-set-option
         * returns an error because the argument isn't a valid PE
         * address, those kernels take it to mean EEH is not supported.
         */
        if (!spapr_phb_vfio_eeh_has_vfio_dev(sphb, addr)) {
            return RTAS_OUT_PARAM_ERROR;
        }
        op = VFIO_EEH_PE_ENABLE;
        break;
    case RTAS_EEH_THAW_IO:
        op = VFIO_EEH_PE_UNFREEZE_IO;
        break;
    case RTAS_EEH_THAW_DMA:
        op = VFIO_EEH_PE_UNFREEZE_DMA;
        break;
    default:
        return RTAS_OUT_PARAM_ERROR;
    }

    if (vfio_eeh_as_op(&sphb->iommu_as, op) < 0) {
        return RTAS_OUT_HW_ERROR;
    }
    return RTAS_OUT_SUCCESS;
}
|
|
|
|
/*
 * Query the EEH PE state for @sphb via VFIO_EEH_PE_GET_STATE.
 *
 * On success the non-negative result of the operation is stored in
 * *@state and RTAS_OUT_SUCCESS is returned.  On failure *@state is left
 * untouched and RTAS_OUT_PARAM_ERROR is returned.
 */
int spapr_phb_vfio_eeh_get_state(SpaprPhbState *sphb, int *state)
{
    int pe_state = vfio_eeh_as_op(&sphb->iommu_as, VFIO_EEH_PE_GET_STATE);

    if (pe_state >= 0) {
        *state = pe_state;
        return RTAS_OUT_SUCCESS;
    }

    return RTAS_OUT_PARAM_ERROR;
}
|
|
|
|
static void spapr_phb_vfio_eeh_clear_dev_msix(PCIBus *bus,
|
|
PCIDevice *pdev,
|
|
void *opaque)
|
|
{
|
|
/* Check if the device is VFIO PCI device */
|
|
if (!object_dynamic_cast(OBJECT(pdev), "vfio-pci")) {
|
|
return;
|
|
}
|
|
|
|
/*
|
|
* The MSIx table will be cleaned out by reset. We need
|
|
* disable it so that it can be reenabled properly. Also,
|
|
* the cached MSIx table should be cleared as it's not
|
|
* reflecting the contents in hardware.
|
|
*/
|
|
if (msix_enabled(pdev)) {
|
|
uint16_t flags;
|
|
|
|
flags = pci_host_config_read_common(pdev,
|
|
pdev->msix_cap + PCI_MSIX_FLAGS,
|
|
pci_config_size(pdev), 2);
|
|
flags &= ~PCI_MSIX_FLAGS_ENABLE;
|
|
pci_host_config_write_common(pdev,
|
|
pdev->msix_cap + PCI_MSIX_FLAGS,
|
|
pci_config_size(pdev), flags, 2);
|
|
}
|
|
|
|
msix_reset(pdev);
|
|
}
|
|
|
|
/*
 * Per-bus callback: run spapr_phb_vfio_eeh_clear_dev_msix() on every
 * device under @bus.  @opaque is unused and no context is passed on to
 * the per-device callback.
 */
static void spapr_phb_vfio_eeh_clear_bus_msix(PCIBus *bus, void *opaque)
{
    pci_for_each_device_under_bus(bus,
                                  spapr_phb_vfio_eeh_clear_dev_msix,
                                  NULL);
}
|
|
|
|
/*
 * Prepare @sphb for a PE reset: walk the buses starting at the host
 * bridge's root bus and clear MSI-X state on the vfio-pci devices found
 * under them.
 */
static void spapr_phb_vfio_eeh_pre_reset(SpaprPhbState *sphb)
{
    pci_for_each_bus(PCI_HOST_BRIDGE(sphb)->bus,
                     spapr_phb_vfio_eeh_clear_bus_msix, NULL);
}
|
|
|
|
/*
 * Translate the RTAS slot reset @option into the matching VFIO EEH PE
 * reset operation and run it on the IOMMU address space of @sphb.
 *
 * For hot and fundamental resets, MSI-X state of the vfio-pci devices
 * is cleared first through spapr_phb_vfio_eeh_pre_reset().
 *
 * Returns: RTAS_OUT_SUCCESS on success, RTAS_OUT_PARAM_ERROR for an
 * unknown @option, RTAS_OUT_HW_ERROR if the VFIO operation fails.
 */
int spapr_phb_vfio_eeh_reset(SpaprPhbState *sphb, int option)
{
    uint32_t op;
    bool clear_msix = false;

    switch (option) {
    case RTAS_SLOT_RESET_DEACTIVATE:
        op = VFIO_EEH_PE_RESET_DEACTIVATE;
        break;
    case RTAS_SLOT_RESET_HOT:
        op = VFIO_EEH_PE_RESET_HOT;
        clear_msix = true;
        break;
    case RTAS_SLOT_RESET_FUNDAMENTAL:
        op = VFIO_EEH_PE_RESET_FUNDAMENTAL;
        clear_msix = true;
        break;
    default:
        return RTAS_OUT_PARAM_ERROR;
    }

    if (clear_msix) {
        spapr_phb_vfio_eeh_pre_reset(sphb);
    }

    if (vfio_eeh_as_op(&sphb->iommu_as, op) < 0) {
        return RTAS_OUT_HW_ERROR;
    }
    return RTAS_OUT_SUCCESS;
}
|
|
|
|
/*
 * Run VFIO_EEH_PE_CONFIGURE on the IOMMU address space of @sphb.
 *
 * Returns: RTAS_OUT_SUCCESS on success, RTAS_OUT_PARAM_ERROR if the
 * VFIO operation fails.
 */
int spapr_phb_vfio_eeh_configure(SpaprPhbState *sphb)
{
    int rc = vfio_eeh_as_op(&sphb->iommu_as, VFIO_EEH_PE_CONFIGURE);

    return rc < 0 ? RTAS_OUT_PARAM_ERROR : RTAS_OUT_SUCCESS;
}
|
|
|
|
#else
|
|
|
|
/*
 * Stub used when CONFIG_VFIO_PCI is not defined: EEH is never
 * available.
 */
bool spapr_phb_eeh_available(SpaprPhbState *sphb)
{
    return false;
}
|
|
|
|
/*
 * Stub used when CONFIG_VFIO_PCI is not defined: there is no EEH state
 * to restore on reset, so this does nothing.
 */
void spapr_phb_vfio_reset(DeviceState *qdev)
{
}
|
|
|
|
/*
 * Stub used when CONFIG_VFIO_PCI is not defined: every option is
 * rejected with RTAS_OUT_NOT_SUPPORTED.
 */
int spapr_phb_vfio_eeh_set_option(SpaprPhbState *sphb,
                                  unsigned int addr, int option)
{
    return RTAS_OUT_NOT_SUPPORTED;
}
|
|
|
|
/*
 * Stub used when CONFIG_VFIO_PCI is not defined: returns
 * RTAS_OUT_NOT_SUPPORTED and leaves *@state untouched.
 */
int spapr_phb_vfio_eeh_get_state(SpaprPhbState *sphb, int *state)
{
    return RTAS_OUT_NOT_SUPPORTED;
}
|
|
|
|
/*
 * Stub used when CONFIG_VFIO_PCI is not defined: no reset is performed
 * and RTAS_OUT_NOT_SUPPORTED is returned for every option.
 */
int spapr_phb_vfio_eeh_reset(SpaprPhbState *sphb, int option)
{
    return RTAS_OUT_NOT_SUPPORTED;
}
|
|
|
|
/*
 * Stub used when CONFIG_VFIO_PCI is not defined: always returns
 * RTAS_OUT_NOT_SUPPORTED.
 */
int spapr_phb_vfio_eeh_configure(SpaprPhbState *sphb)
{
    return RTAS_OUT_NOT_SUPPORTED;
}
|
|
|
|
#endif /* CONFIG_VFIO_PCI */
|