[Date Prev][Date Next][Thread Prev][Thread Next][Date Index][Thread Index] Re: [Xen-devel] [PATCH RFC] VT-d: honor firmware-first mode in XSA-59 workaround code
Jan Beulich wrote on 2014-05-22: > When firmware-first mode is being indicated by firmware, we shouldn't be > modifying AER registers - these ar considered to be owned by firmware in that > case. Violating this is being reported to result in SMI (or was it SCI?) > storms. > While circumventing the workaround means re-exposing affected hosts to the > XSA-59 issues, this in any event seems better than not booting at all. > Respective messages are being issued to the log, so the situation can be > diagnosed. > > The basic building blocks were taken from Linux 3.15-rc. > > Reported-by: Andrew Cooper <andrew.cooper3@xxxxxxxxxx> > Reported-by: Malcolm Crossley <malcolm.crossley@xxxxxxxxxx> > Signed-off-by: Jan Beulich <jbeulich@xxxxxxxx> > > --- a/xen/arch/x86/acpi/boot.c > +++ b/xen/arch/x86/acpi/boot.c > @@ -785,6 +785,8 @@ int __init acpi_boot_init(void) > > erst_init(); > > + acpi_hest_init(); > + > acpi_table_parse(ACPI_SIG_BGRT, acpi_invalidate_bgrt); > > return 0; > --- a/xen/drivers/acpi/apei/Makefile > +++ b/xen/drivers/acpi/apei/Makefile > @@ -1,3 +1,4 @@ > obj-y += erst.o > +obj-y += hest.o > obj-y += apei-base.o > obj-y += apei-io.o > --- /dev/null > +++ b/xen/drivers/acpi/apei/hest.c > @@ -0,0 +1,200 @@ > +/* > + * APEI Hardware Error Souce Table support > + * > + * HEST describes error sources in detail; communicates operational > + * parameters (i.e. severity levels, masking bits, and threshold > + * values) to Linux as necessary. It also allows the BIOS to report > + * non-standard error sources to Linux (for example, chipset-specific > + * error registers). > + * > + * For more information about HEST, please refer to ACPI Specification > + * version 4.0, section 17.3.2. > + * > + * Copyright 2009 Intel Corp. > + * Author: Huang Ying <ying.huang@xxxxxxxxx> > + * > + * This program is free software; you can redistribute it and/or > + * modify it under the terms of the GNU General Public License version > + * 2 as published by the Free Software Foundation; > + * > + * This program is distributed in the hope that it will be useful, > + * but WITHOUT ANY WARRANTY; without even the implied warranty of > + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the > + * GNU General Public License for more details. > + * > + * You should have received a copy of the GNU General Public License > + * along with this program; if not, write to the Free Software > + * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 > +USA */ > + > +#include <xen/errno.h> > +#include <xen/init.h> > +#include <xen/kernel.h> > +#include <xen/mm.h> > +#include <xen/pfn.h> > +#include <acpi/acpi.h> > +#include <acpi/apei.h> > + > +#include "apei-internal.h" > + > +#define HEST_PFX "HEST: " > + > +static bool_t hest_disable; > +boolean_param("hest_disable", hest_disable); > + > +/* HEST table parsing */ > + > +static struct acpi_table_hest *__read_mostly hest_tab; > + > +static const int hest_esrc_len_tab[ACPI_HEST_TYPE_RESERVED] = { > + [ACPI_HEST_TYPE_IA32_CHECK] = -1, /* need further calculation */ > + [ACPI_HEST_TYPE_IA32_CORRECTED_CHECK] = -1, > + [ACPI_HEST_TYPE_IA32_NMI] = sizeof(struct acpi_hest_ia_nmi), > + [ACPI_HEST_TYPE_AER_ROOT_PORT] = sizeof(struct acpi_hest_aer_root), > + [ACPI_HEST_TYPE_AER_ENDPOINT] = sizeof(struct acpi_hest_aer), > + [ACPI_HEST_TYPE_AER_BRIDGE] = sizeof(struct acpi_hest_aer_bridge), > + [ACPI_HEST_TYPE_GENERIC_ERROR] = sizeof(struct > acpi_hest_generic), }; > + > +static int hest_esrc_len(const struct acpi_hest_header *hest_hdr) { > + u16 hest_type = hest_hdr->type; > + int len; > + > + if (hest_type >= ACPI_HEST_TYPE_RESERVED) > + return 0; > + > + len = hest_esrc_len_tab[hest_type]; > + > + if (hest_type == ACPI_HEST_TYPE_IA32_CORRECTED_CHECK) { > + const struct acpi_hest_ia_corrected *cmc = > + container_of(hest_hdr, > + const struct acpi_hest_ia_corrected, > + header); > + > + len = sizeof(*cmc) + cmc->num_hardware_banks * > + sizeof(struct acpi_hest_ia_error_bank); > + } else if (hest_type == ACPI_HEST_TYPE_IA32_CHECK) { > + const struct acpi_hest_ia_machine_check *mc = > + container_of(hest_hdr, > + const struct acpi_hest_ia_machine_check, > + header); > + > + len = sizeof(*mc) + mc->num_hardware_banks * > + sizeof(struct acpi_hest_ia_error_bank); > + } > + BUG_ON(len == -1); > + > + return len; > +}; > + > +int apei_hest_parse(apei_hest_func_t func, void *data) { > + struct acpi_hest_header *hest_hdr; > + int i, rc, len; > + > + if (hest_disable || !hest_tab) > + return -EINVAL; > + > + hest_hdr = (struct acpi_hest_header *)(hest_tab + 1); > + for (i = 0; i < hest_tab->error_source_count; i++) { > + len = hest_esrc_len(hest_hdr); > + if (!len) { > + printk(XENLOG_WARNING HEST_PFX > + "Unknown or unused hardware error source " > + "type: %d for hardware error source: %d\n", > + hest_hdr->type, hest_hdr->source_id); > + return -EINVAL; > + } > + if ((void *)hest_hdr + len > > + (void *)hest_tab + hest_tab->header.length) { > + printk(XENLOG_WARNING HEST_PFX > + "Table contents overflow for hardware error > source: %d\n", > + hest_hdr->source_id); > + return -EINVAL; > + } > + > + rc = func(hest_hdr, data); > + if (rc) > + return rc; > + > + hest_hdr = (void *)hest_hdr + len; > + } > + > + return 0; > +} > + > +/* > + * Check if firmware advertises firmware first mode. We need FF bit to > +be set > + * along with a set of MC banks which work in FF mode. > + */ > +static int __init hest_parse_cmc(const struct acpi_hest_header *hest_hdr, > + void *data) > +{ > +#ifdef CONFIG_X86_MCE I didn't find where CONFIG_X86_MCE is defined. Do you have another patch to define it? > + unsigned int i; > + const struct acpi_hest_ia_corrected *cmc; > + const struct acpi_hest_ia_error_bank *mc_bank; > + > + if (hest_hdr->type != ACPI_HEST_TYPE_IA32_CORRECTED_CHECK) > + return 0; > + > + cmc = container_of(hest_hdr, const struct acpi_hest_ia_corrected, > header); > + if (!cmc->enabled) > + return 0; > + > + /* > + * We expect HEST to provide a list of MC banks that report errors > + * in firmware first mode. Otherwise, return non-zero value to > + * indicate that we are done parsing HEST. > + */ > + if (!(cmc->flags & ACPI_HEST_FIRMWARE_FIRST) > || !cmc->num_hardware_banks) > + return 1; > + > + printk(XENLOG_INFO HEST_PFX "Enabling Firmware First mode for > +corrected errors.\n"); > + > + mc_bank = (const struct acpi_hest_ia_error_bank *)(cmc + 1); > + for (i = 0; i < cmc->num_hardware_banks; i++, mc_bank++) > + mce_disable_bank(mc_bank->bank_number); Also no mce_diable_bak is founded. > +#else > +# define acpi_disable_cmcff 1 You didn't define acpi_disable_cmcff if defined CONFIG_X86_MCE. It will cause build error. > +#endif > + > + return 1; > +} > + > +void __init acpi_hest_init(void) > +{ > + acpi_status status; > + acpi_physical_address hest_addr; > + acpi_native_uint hest_len; > + > + if (acpi_disabled) > + return; > + > + if (hest_disable) { > + printk(XENLOG_INFO HEST_PFX "Table parsing disabled.\n"); > + return; > + } > + > + status = acpi_get_table_phys(ACPI_SIG_HEST, 0, &hest_addr, &hest_len); > + if (status == AE_NOT_FOUND) > + goto err; > + if (ACPI_FAILURE(status)) { > + printk(XENLOG_ERR HEST_PFX "Failed to get table, %s\n", > + acpi_format_exception(status)); > + goto err; > + } > + map_pages_to_xen((unsigned long)__va(hest_addr), > PFN_DOWN(hest_addr), > + PFN_UP(hest_addr + hest_len) - PFN_DOWN(hest_addr), > + PAGE_HYPERVISOR); > + hest_tab = __va(hest_addr); > + > + if (!acpi_disable_cmcff) > + apei_hest_parse(hest_parse_cmc, NULL); > + > + printk(XENLOG_INFO HEST_PFX "Table parsing has been initialized\n"); > + return; > +err: > + hest_disable = 1; > +} > --- a/xen/drivers/passthrough/pci.c > +++ b/xen/drivers/passthrough/pci.c > @@ -1066,6 +1066,105 @@ void __hwdom_init setup_hwdom_pci_device > spin_unlock(&pcidevs_lock); > } > > +#ifdef CONFIG_ACPI > +#include <acpi/acpi.h> > +#include <acpi/apei.h> > + > +static int hest_match_pci(const struct acpi_hest_aer_common *p, > + const struct pci_dev *pdev) { > + return ACPI_HEST_SEGMENT(p->bus) == pdev->seg && > + ACPI_HEST_BUS(p->bus) == pdev->bus && > + p->device == PCI_SLOT(pdev->devfn) && > + p->function == PCI_FUNC(pdev->devfn); > +} > + > +static bool_t hest_match_type(const struct acpi_hest_header *hest_hdr, > + const struct pci_dev *pdev) { > + unsigned int pos = pci_find_cap_offset(pdev->seg, pdev->bus, > + PCI_SLOT(pdev->devfn), > + PCI_FUNC(pdev->devfn), > + PCI_CAP_ID_EXP); > + u8 pcie = (pci_conf_read16(pdev->seg, pdev->bus, > PCI_SLOT(pdev->devfn), > + PCI_FUNC(pdev->devfn), pos + > PCI_EXP_FLAGS) & > + PCI_EXP_FLAGS_TYPE) / > + (PCI_EXP_FLAGS_TYPE & -PCI_EXP_FLAGS_TYPE); I think right shift is much intuitively. u8 pcie = (pci_conf_read16(pdev->seg, pdev->bus,PCI_SLOT(pdev->devfn),PCI_FUNC(pdev->devfn), pos + PCI_EXP_FLAGS) & PCI_EXP_FLAGS_TYPE) >> 4; > + > + switch ( hest_hdr->type ) > + { > + case ACPI_HEST_TYPE_AER_ROOT_PORT: > + return pcie == PCI_EXP_TYPE_ROOT_PORT; > + case ACPI_HEST_TYPE_AER_ENDPOINT: > + return pcie == PCI_EXP_TYPE_ENDPOINT; > + case ACPI_HEST_TYPE_AER_BRIDGE: > + return pci_conf_read16(pdev->seg, pdev->bus, > PCI_SLOT(pdev->devfn), > + PCI_FUNC(pdev->devfn), > PCI_CLASS_DEVICE) == > + PCI_CLASS_BRIDGE_PCI; > + } > + > + return 0; > +} > + > +struct aer_hest_parse_info { > + const struct pci_dev *pdev; > + bool_t firmware_first; > +}; > + > +static bool_t hest_source_is_pcie_aer(const struct acpi_hest_header > +*hest_hdr) { > + if ( hest_hdr->type == ACPI_HEST_TYPE_AER_ROOT_PORT || > + hest_hdr->type == ACPI_HEST_TYPE_AER_ENDPOINT || > + hest_hdr->type == ACPI_HEST_TYPE_AER_BRIDGE ) > + return 1; > + return 0; > +} > + > +static int aer_hest_parse(const struct acpi_hest_header *hest_hdr, void > +*data) { > + struct aer_hest_parse_info *info = data; > + const struct acpi_hest_aer_common *p; > + bool_t ff; > + > + if ( !hest_source_is_pcie_aer(hest_hdr) ) > + return 0; > + > + p = (const struct acpi_hest_aer_common *)(hest_hdr + 1); > + ff = !!(p->flags & ACPI_HEST_FIRMWARE_FIRST); > + > + /* > + * If no specific device is supplied, determine whether > + * FIRMWARE_FIRST is set for *any* PCIe device. > + */ > + if ( !info->pdev ) > + { > + info->firmware_first |= ff; > + return 0; > + } > + > + /* Otherwise, check the specific device */ > + if ( p->flags & ACPI_HEST_GLOBAL ? > + hest_match_type(hest_hdr, info->pdev) : > + hest_match_pci(p, info->pdev) ) > + { > + info->firmware_first = ff; > + return 1; > + } > + > + return 0; > +} > + > +bool_t pcie_aer_get_firmware_first(const struct pci_dev *pdev) { > + struct aer_hest_parse_info info = { .pdev = pdev }; > + > + return pci_find_cap_offset(pdev->seg, pdev->bus, > PCI_SLOT(pdev->devfn), > + PCI_FUNC(pdev->devfn), > PCI_CAP_ID_EXP) && > + apei_hest_parse(aer_hest_parse, &info) >= 0 && > + info.firmware_first; > +} > +#endif > + > static int _dump_pci_devices(struct pci_seg *pseg, void *arg) { > struct pci_dev *pdev; > --- a/xen/drivers/passthrough/vtd/quirks.c > +++ b/xen/drivers/passthrough/vtd/quirks.c > @@ -386,9 +386,10 @@ void pci_vtd_quirk(const struct pci_dev > int dev = PCI_SLOT(pdev->devfn); > int func = PCI_FUNC(pdev->devfn); > int pos; > - u32 val; > + u32 val, val2; > u64 bar; > paddr_t pa; > + const char *action; > > if ( pci_conf_read16(seg, bus, dev, func, PCI_VENDOR_ID) != > PCI_VENDOR_ID_INTEL ) > @@ -447,18 +448,26 @@ void pci_vtd_quirk(const struct pci_dev > } > > val = pci_conf_read32(seg, bus, dev, func, pos + > PCI_ERR_UNCOR_MASK); > - pci_conf_write32(seg, bus, dev, func, pos + PCI_ERR_UNCOR_MASK, > - val | PCI_ERR_UNC_UNSUP); > - val = pci_conf_read32(seg, bus, dev, func, pos + > PCI_ERR_COR_MASK); > - pci_conf_write32(seg, bus, dev, func, pos + PCI_ERR_COR_MASK, > - val | PCI_ERR_COR_ADV_NFAT); > + val2 = pci_conf_read32(seg, bus, dev, func, pos + > PCI_ERR_COR_MASK); > + if ( (val & PCI_ERR_UNC_UNSUP) && (val2 & > PCI_ERR_COR_ADV_NFAT) ) > + action = "Found masked"; What happened if dom0 unmasked it later? > + else if ( !pcie_aer_get_firmware_first(pdev) ) > + { > + pci_conf_write32(seg, bus, dev, func, pos + > PCI_ERR_UNCOR_MASK, > + val | PCI_ERR_UNC_UNSUP); > + pci_conf_write32(seg, bus, dev, func, pos + > PCI_ERR_COR_MASK, > + val2 | PCI_ERR_COR_ADV_NFAT); > + action = "Masked"; > + } > + else > + action = "Cannot mask"; > > /* XPUNCERRMSK Send Completion with Unsupported Request */ > val = pci_conf_read32(seg, bus, dev, func, 0x20c); > pci_conf_write32(seg, bus, dev, func, 0x20c, val | (1 << 4)); > > - printk(XENLOG_INFO "Masked UR signaling > on %04x:%02x:%02x.%u\n", > - seg, bus, dev, func); > + printk(XENLOG_INFO "%s UR signaling on %04x:%02x:%02x.%u\n", > + action, seg, bus, dev, func); > break; > > case 0x100: case 0x104: case 0x108: /* Sandybridge */ > --- a/xen/include/acpi/actbl1.h > +++ b/xen/include/acpi/actbl1.h > @@ -445,6 +445,14 @@ struct acpi_hest_aer_common { > #define ACPI_HEST_FIRMWARE_FIRST (1) > #define ACPI_HEST_GLOBAL (1<<1) > > +/* > + * Macros to access the bus/segment numbers in Bus field above: > + * Bus number is encoded in bits 7:0 > + * Segment number is encoded in bits 23:8 */ > +#define ACPI_HEST_BUS(bus) ((bus) & 0xFF) > +#define ACPI_HEST_SEGMENT(bus) (((bus) >> 8) & 0xFFFF) > + > /* Hardware Error Notification */ > > struct acpi_hest_notify { > --- a/xen/include/acpi/apei.h > +++ b/xen/include/acpi/apei.h > @@ -12,6 +12,9 @@ > > #define FIX_APEI_RANGE_MAX 64 > > +typedef int (*apei_hest_func_t)(const struct acpi_hest_header *, void > +*); int apei_hest_parse(apei_hest_func_t, void *); > + > int erst_write(const struct cper_record_header *record); ssize_t > erst_get_record_count(void); int erst_get_next_record_id(u64 *record_id); > --- a/xen/include/xen/acpi.h > +++ b/xen/include/xen/acpi.h > @@ -61,6 +61,7 @@ int acpi_boot_init (void); int acpi_boot_table_init (void); > int acpi_numa_init (void); int erst_init(void); > +void acpi_hest_init(void); > > int acpi_table_init (void); > int acpi_table_parse(char *id, acpi_table_handler handler); > --- a/xen/include/xen/pci.h > +++ b/xen/include/xen/pci.h > @@ -144,6 +144,8 @@ int pci_find_next_ext_capability(int seg const char > *parse_pci(const char *, unsigned int *seg, unsigned int *bus, > unsigned int *dev, unsigned int *func); > > +bool_t pcie_aer_get_firmware_first(const struct pci_dev *); > + > struct pirq; > int msixtbl_pt_register(struct domain *, struct pirq *, uint64_t gtable); > void > msixtbl_pt_unregister(struct domain *, struct pirq *); > Best regards, Yang _______________________________________________ Xen-devel mailing list Xen-devel@xxxxxxxxxxxxx http://lists.xen.org/xen-devel
|
Lists.xenproject.org is hosted with RackSpace, monitoring our |