0e180d9c8a
The Advanced Error Interrupt Message Number (bits 31:27 of the Root Error Status Register) is updated when the number of msi messages assigned to a device changes. Migration of windows 7 on q35 chipset failed because the check in get_pci_config_device() fails due to cmask being set on these bits. Its valid to update these bits and we must restore this state across migration. Signed-off-by: Jason Baron <jbaron@redhat.com> Signed-off-by: Michael S. Tsirkin <mst@redhat.com>
1033 lines
32 KiB
C
1033 lines
32 KiB
C
/*
|
|
* pcie_aer.c
|
|
*
|
|
* Copyright (c) 2010 Isaku Yamahata <yamahata at valinux co jp>
|
|
* VA Linux Systems Japan K.K.
|
|
*
|
|
* This program is free software; you can redistribute it and/or modify
|
|
* it under the terms of the GNU General Public License as published by
|
|
* the Free Software Foundation; either version 2 of the License, or
|
|
* (at your option) any later version.
|
|
*
|
|
* This program is distributed in the hope that it will be useful,
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
* GNU General Public License for more details.
|
|
*
|
|
* You should have received a copy of the GNU General Public License along
|
|
* with this program; if not, see <http://www.gnu.org/licenses/>.
|
|
*/
|
|
|
|
#include "sysemu.h"
|
|
#include "qemu-objects.h"
|
|
#include "monitor.h"
|
|
#include "pci_bridge.h"
|
|
#include "pcie.h"
|
|
#include "msix.h"
|
|
#include "msi.h"
|
|
#include "pci_internals.h"
|
|
#include "pcie_regs.h"
|
|
|
|
//#define DEBUG_PCIE
|
|
#ifdef DEBUG_PCIE
|
|
# define PCIE_DPRINTF(fmt, ...) \
|
|
fprintf(stderr, "%s:%d " fmt, __func__, __LINE__, ## __VA_ARGS__)
|
|
#else
|
|
# define PCIE_DPRINTF(fmt, ...) do {} while (0)
|
|
#endif
|
|
#define PCIE_DEV_PRINTF(dev, fmt, ...) \
|
|
PCIE_DPRINTF("%s:%x "fmt, (dev)->name, (dev)->devfn, ## __VA_ARGS__)
|
|
|
|
#define PCI_ERR_SRC_COR_OFFS 0
|
|
#define PCI_ERR_SRC_UNCOR_OFFS 2
|
|
|
|
/* From 6.2.7 Error Listing and Rules. Table 6-2, 6-3 and 6-4 */
|
|
static uint32_t pcie_aer_uncor_default_severity(uint32_t status)
|
|
{
|
|
switch (status) {
|
|
case PCI_ERR_UNC_INTN:
|
|
case PCI_ERR_UNC_DLP:
|
|
case PCI_ERR_UNC_SDN:
|
|
case PCI_ERR_UNC_RX_OVER:
|
|
case PCI_ERR_UNC_FCP:
|
|
case PCI_ERR_UNC_MALF_TLP:
|
|
return PCI_ERR_ROOT_CMD_FATAL_EN;
|
|
case PCI_ERR_UNC_POISON_TLP:
|
|
case PCI_ERR_UNC_ECRC:
|
|
case PCI_ERR_UNC_UNSUP:
|
|
case PCI_ERR_UNC_COMP_TIME:
|
|
case PCI_ERR_UNC_COMP_ABORT:
|
|
case PCI_ERR_UNC_UNX_COMP:
|
|
case PCI_ERR_UNC_ACSV:
|
|
case PCI_ERR_UNC_MCBTLP:
|
|
case PCI_ERR_UNC_ATOP_EBLOCKED:
|
|
case PCI_ERR_UNC_TLP_PRF_BLOCKED:
|
|
return PCI_ERR_ROOT_CMD_NONFATAL_EN;
|
|
default:
|
|
abort();
|
|
break;
|
|
}
|
|
return PCI_ERR_ROOT_CMD_FATAL_EN;
|
|
}
|
|
|
|
static int aer_log_add_err(PCIEAERLog *aer_log, const PCIEAERErr *err)
|
|
{
|
|
if (aer_log->log_num == aer_log->log_max) {
|
|
return -1;
|
|
}
|
|
memcpy(&aer_log->log[aer_log->log_num], err, sizeof *err);
|
|
aer_log->log_num++;
|
|
return 0;
|
|
}
|
|
|
|
static void aer_log_del_err(PCIEAERLog *aer_log, PCIEAERErr *err)
|
|
{
|
|
assert(aer_log->log_num);
|
|
*err = aer_log->log[0];
|
|
aer_log->log_num--;
|
|
memmove(&aer_log->log[0], &aer_log->log[1],
|
|
aer_log->log_num * sizeof *err);
|
|
}
|
|
|
|
static void aer_log_clear_all_err(PCIEAERLog *aer_log)
|
|
{
|
|
aer_log->log_num = 0;
|
|
}
|
|
|
|
int pcie_aer_init(PCIDevice *dev, uint16_t offset)
|
|
{
|
|
PCIExpressDevice *exp;
|
|
|
|
pcie_add_capability(dev, PCI_EXT_CAP_ID_ERR, PCI_ERR_VER,
|
|
offset, PCI_ERR_SIZEOF);
|
|
exp = &dev->exp;
|
|
exp->aer_cap = offset;
|
|
|
|
/* log_max is property */
|
|
if (dev->exp.aer_log.log_max == PCIE_AER_LOG_MAX_UNSET) {
|
|
dev->exp.aer_log.log_max = PCIE_AER_LOG_MAX_DEFAULT;
|
|
}
|
|
/* clip down the value to avoid unreasobale memory usage */
|
|
if (dev->exp.aer_log.log_max > PCIE_AER_LOG_MAX_LIMIT) {
|
|
return -EINVAL;
|
|
}
|
|
dev->exp.aer_log.log = g_malloc0(sizeof dev->exp.aer_log.log[0] *
|
|
dev->exp.aer_log.log_max);
|
|
|
|
pci_set_long(dev->w1cmask + offset + PCI_ERR_UNCOR_STATUS,
|
|
PCI_ERR_UNC_SUPPORTED);
|
|
|
|
pci_set_long(dev->config + offset + PCI_ERR_UNCOR_SEVER,
|
|
PCI_ERR_UNC_SEVERITY_DEFAULT);
|
|
pci_set_long(dev->wmask + offset + PCI_ERR_UNCOR_SEVER,
|
|
PCI_ERR_UNC_SUPPORTED);
|
|
|
|
pci_long_test_and_set_mask(dev->w1cmask + offset + PCI_ERR_COR_STATUS,
|
|
PCI_ERR_COR_STATUS);
|
|
|
|
pci_set_long(dev->config + offset + PCI_ERR_COR_MASK,
|
|
PCI_ERR_COR_MASK_DEFAULT);
|
|
pci_set_long(dev->wmask + offset + PCI_ERR_COR_MASK,
|
|
PCI_ERR_COR_SUPPORTED);
|
|
|
|
/* capabilities and control. multiple header logging is supported */
|
|
if (dev->exp.aer_log.log_max > 0) {
|
|
pci_set_long(dev->config + offset + PCI_ERR_CAP,
|
|
PCI_ERR_CAP_ECRC_GENC | PCI_ERR_CAP_ECRC_CHKC |
|
|
PCI_ERR_CAP_MHRC);
|
|
pci_set_long(dev->wmask + offset + PCI_ERR_CAP,
|
|
PCI_ERR_CAP_ECRC_GENE | PCI_ERR_CAP_ECRC_CHKE |
|
|
PCI_ERR_CAP_MHRE);
|
|
} else {
|
|
pci_set_long(dev->config + offset + PCI_ERR_CAP,
|
|
PCI_ERR_CAP_ECRC_GENC | PCI_ERR_CAP_ECRC_CHKC);
|
|
pci_set_long(dev->wmask + offset + PCI_ERR_CAP,
|
|
PCI_ERR_CAP_ECRC_GENE | PCI_ERR_CAP_ECRC_CHKE);
|
|
}
|
|
|
|
switch (pcie_cap_get_type(dev)) {
|
|
case PCI_EXP_TYPE_ROOT_PORT:
|
|
/* this case will be set by pcie_aer_root_init() */
|
|
/* fallthrough */
|
|
case PCI_EXP_TYPE_DOWNSTREAM:
|
|
case PCI_EXP_TYPE_UPSTREAM:
|
|
pci_word_test_and_set_mask(dev->wmask + PCI_BRIDGE_CONTROL,
|
|
PCI_BRIDGE_CTL_SERR);
|
|
pci_long_test_and_set_mask(dev->w1cmask + PCI_STATUS,
|
|
PCI_SEC_STATUS_RCV_SYSTEM_ERROR);
|
|
break;
|
|
default:
|
|
/* nothing */
|
|
break;
|
|
}
|
|
return 0;
|
|
}
|
|
|
|
void pcie_aer_exit(PCIDevice *dev)
|
|
{
|
|
g_free(dev->exp.aer_log.log);
|
|
}
|
|
|
|
static void pcie_aer_update_uncor_status(PCIDevice *dev)
|
|
{
|
|
uint8_t *aer_cap = dev->config + dev->exp.aer_cap;
|
|
PCIEAERLog *aer_log = &dev->exp.aer_log;
|
|
|
|
uint16_t i;
|
|
for (i = 0; i < aer_log->log_num; i++) {
|
|
pci_long_test_and_set_mask(aer_cap + PCI_ERR_UNCOR_STATUS,
|
|
dev->exp.aer_log.log[i].status);
|
|
}
|
|
}
|
|
|
|
/*
|
|
* return value:
|
|
* true: error message needs to be sent up
|
|
* false: error message is masked
|
|
*
|
|
* 6.2.6 Error Message Control
|
|
* Figure 6-3
|
|
* all pci express devices part
|
|
*/
|
|
static bool
|
|
pcie_aer_msg_alldev(PCIDevice *dev, const PCIEAERMsg *msg)
|
|
{
|
|
if (!(pcie_aer_msg_is_uncor(msg) &&
|
|
(pci_get_word(dev->config + PCI_COMMAND) & PCI_COMMAND_SERR))) {
|
|
return false;
|
|
}
|
|
|
|
/* Signaled System Error
|
|
*
|
|
* 7.5.1.1 Command register
|
|
* Bit 8 SERR# Enable
|
|
*
|
|
* When Set, this bit enables reporting of Non-fatal and Fatal
|
|
* errors detected by the Function to the Root Complex. Note that
|
|
* errors are reported if enabled either through this bit or through
|
|
* the PCI Express specific bits in the Device Control register (see
|
|
* Section 7.8.4).
|
|
*/
|
|
pci_word_test_and_set_mask(dev->config + PCI_STATUS,
|
|
PCI_STATUS_SIG_SYSTEM_ERROR);
|
|
|
|
if (!(msg->severity &
|
|
pci_get_word(dev->config + dev->exp.exp_cap + PCI_EXP_DEVCTL))) {
|
|
return false;
|
|
}
|
|
|
|
/* send up error message */
|
|
return true;
|
|
}
|
|
|
|
/*
|
|
* return value:
|
|
* true: error message is sent up
|
|
* false: error message is masked
|
|
*
|
|
* 6.2.6 Error Message Control
|
|
* Figure 6-3
|
|
* virtual pci bridge part
|
|
*/
|
|
static bool pcie_aer_msg_vbridge(PCIDevice *dev, const PCIEAERMsg *msg)
|
|
{
|
|
uint16_t bridge_control = pci_get_word(dev->config + PCI_BRIDGE_CONTROL);
|
|
|
|
if (pcie_aer_msg_is_uncor(msg)) {
|
|
/* Received System Error */
|
|
pci_word_test_and_set_mask(dev->config + PCI_SEC_STATUS,
|
|
PCI_SEC_STATUS_RCV_SYSTEM_ERROR);
|
|
}
|
|
|
|
if (!(bridge_control & PCI_BRIDGE_CTL_SERR)) {
|
|
return false;
|
|
}
|
|
return true;
|
|
}
|
|
|
|
void pcie_aer_root_set_vector(PCIDevice *dev, unsigned int vector)
|
|
{
|
|
uint8_t *aer_cap = dev->config + dev->exp.aer_cap;
|
|
assert(vector < PCI_ERR_ROOT_IRQ_MAX);
|
|
pci_long_test_and_clear_mask(aer_cap + PCI_ERR_ROOT_STATUS,
|
|
PCI_ERR_ROOT_IRQ);
|
|
pci_long_test_and_set_mask(aer_cap + PCI_ERR_ROOT_STATUS,
|
|
vector << PCI_ERR_ROOT_IRQ_SHIFT);
|
|
}
|
|
|
|
static unsigned int pcie_aer_root_get_vector(PCIDevice *dev)
|
|
{
|
|
uint8_t *aer_cap = dev->config + dev->exp.aer_cap;
|
|
uint32_t root_status = pci_get_long(aer_cap + PCI_ERR_ROOT_STATUS);
|
|
return (root_status & PCI_ERR_ROOT_IRQ) >> PCI_ERR_ROOT_IRQ_SHIFT;
|
|
}
|
|
|
|
/* Given a status register, get corresponding bits in the command register */
|
|
static uint32_t pcie_aer_status_to_cmd(uint32_t status)
|
|
{
|
|
uint32_t cmd = 0;
|
|
if (status & PCI_ERR_ROOT_COR_RCV) {
|
|
cmd |= PCI_ERR_ROOT_CMD_COR_EN;
|
|
}
|
|
if (status & PCI_ERR_ROOT_NONFATAL_RCV) {
|
|
cmd |= PCI_ERR_ROOT_CMD_NONFATAL_EN;
|
|
}
|
|
if (status & PCI_ERR_ROOT_FATAL_RCV) {
|
|
cmd |= PCI_ERR_ROOT_CMD_FATAL_EN;
|
|
}
|
|
return cmd;
|
|
}
|
|
|
|
static void pcie_aer_root_notify(PCIDevice *dev)
|
|
{
|
|
if (msix_enabled(dev)) {
|
|
msix_notify(dev, pcie_aer_root_get_vector(dev));
|
|
} else if (msi_enabled(dev)) {
|
|
msi_notify(dev, pcie_aer_root_get_vector(dev));
|
|
} else {
|
|
qemu_set_irq(dev->irq[dev->exp.aer_intx], 1);
|
|
}
|
|
}
|
|
|
|
/*
|
|
* 6.2.6 Error Message Control
|
|
* Figure 6-3
|
|
* root port part
|
|
*/
|
|
static void pcie_aer_msg_root_port(PCIDevice *dev, const PCIEAERMsg *msg)
|
|
{
|
|
uint16_t cmd;
|
|
uint8_t *aer_cap;
|
|
uint32_t root_cmd;
|
|
uint32_t root_status, prev_status;
|
|
|
|
cmd = pci_get_word(dev->config + PCI_COMMAND);
|
|
aer_cap = dev->config + dev->exp.aer_cap;
|
|
root_cmd = pci_get_long(aer_cap + PCI_ERR_ROOT_COMMAND);
|
|
prev_status = root_status = pci_get_long(aer_cap + PCI_ERR_ROOT_STATUS);
|
|
|
|
if (cmd & PCI_COMMAND_SERR) {
|
|
/* System Error.
|
|
*
|
|
* The way to report System Error is platform specific and
|
|
* it isn't implemented in qemu right now.
|
|
* So just discard the error for now.
|
|
* OS which cares of aer would receive errors via
|
|
* native aer mechanims, so this wouldn't matter.
|
|
*/
|
|
}
|
|
|
|
/* Errro Message Received: Root Error Status register */
|
|
switch (msg->severity) {
|
|
case PCI_ERR_ROOT_CMD_COR_EN:
|
|
if (root_status & PCI_ERR_ROOT_COR_RCV) {
|
|
root_status |= PCI_ERR_ROOT_MULTI_COR_RCV;
|
|
} else {
|
|
pci_set_word(aer_cap + PCI_ERR_ROOT_ERR_SRC + PCI_ERR_SRC_COR_OFFS,
|
|
msg->source_id);
|
|
}
|
|
root_status |= PCI_ERR_ROOT_COR_RCV;
|
|
break;
|
|
case PCI_ERR_ROOT_CMD_NONFATAL_EN:
|
|
root_status |= PCI_ERR_ROOT_NONFATAL_RCV;
|
|
break;
|
|
case PCI_ERR_ROOT_CMD_FATAL_EN:
|
|
if (!(root_status & PCI_ERR_ROOT_UNCOR_RCV)) {
|
|
root_status |= PCI_ERR_ROOT_FIRST_FATAL;
|
|
}
|
|
root_status |= PCI_ERR_ROOT_FATAL_RCV;
|
|
break;
|
|
default:
|
|
abort();
|
|
break;
|
|
}
|
|
if (pcie_aer_msg_is_uncor(msg)) {
|
|
if (root_status & PCI_ERR_ROOT_UNCOR_RCV) {
|
|
root_status |= PCI_ERR_ROOT_MULTI_UNCOR_RCV;
|
|
} else {
|
|
pci_set_word(aer_cap + PCI_ERR_ROOT_ERR_SRC +
|
|
PCI_ERR_SRC_UNCOR_OFFS, msg->source_id);
|
|
}
|
|
root_status |= PCI_ERR_ROOT_UNCOR_RCV;
|
|
}
|
|
pci_set_long(aer_cap + PCI_ERR_ROOT_STATUS, root_status);
|
|
|
|
/* 6.2.4.1.2 Interrupt Generation */
|
|
/* All the above did was set some bits in the status register.
|
|
* Specifically these that match message severity.
|
|
* The below code relies on this fact. */
|
|
if (!(root_cmd & msg->severity) ||
|
|
(pcie_aer_status_to_cmd(prev_status) & root_cmd)) {
|
|
/* Condition is not being set or was already true so nothing to do. */
|
|
return;
|
|
}
|
|
|
|
pcie_aer_root_notify(dev);
|
|
}
|
|
|
|
/*
|
|
* 6.2.6 Error Message Control Figure 6-3
|
|
*
|
|
* Walk up the bus tree from the device, propagate the error message.
|
|
*/
|
|
static void pcie_aer_msg(PCIDevice *dev, const PCIEAERMsg *msg)
|
|
{
|
|
uint8_t type;
|
|
|
|
while (dev) {
|
|
if (!pci_is_express(dev)) {
|
|
/* just ignore it */
|
|
/* TODO: Shouldn't we set PCI_STATUS_SIG_SYSTEM_ERROR?
|
|
* Consider e.g. a PCI bridge above a PCI Express device. */
|
|
return;
|
|
}
|
|
|
|
type = pcie_cap_get_type(dev);
|
|
if ((type == PCI_EXP_TYPE_ROOT_PORT ||
|
|
type == PCI_EXP_TYPE_UPSTREAM ||
|
|
type == PCI_EXP_TYPE_DOWNSTREAM) &&
|
|
!pcie_aer_msg_vbridge(dev, msg)) {
|
|
return;
|
|
}
|
|
if (!pcie_aer_msg_alldev(dev, msg)) {
|
|
return;
|
|
}
|
|
if (type == PCI_EXP_TYPE_ROOT_PORT) {
|
|
pcie_aer_msg_root_port(dev, msg);
|
|
/* Root port can notify system itself,
|
|
or send the error message to root complex event collector. */
|
|
/*
|
|
* if root port is associated with an event collector,
|
|
* return the root complex event collector here.
|
|
* For now root complex event collector isn't supported.
|
|
*/
|
|
return;
|
|
}
|
|
dev = pci_bridge_get_device(dev->bus);
|
|
}
|
|
}
|
|
|
|
static void pcie_aer_update_log(PCIDevice *dev, const PCIEAERErr *err)
|
|
{
|
|
uint8_t *aer_cap = dev->config + dev->exp.aer_cap;
|
|
uint8_t first_bit = ffs(err->status) - 1;
|
|
uint32_t errcap = pci_get_long(aer_cap + PCI_ERR_CAP);
|
|
int i;
|
|
|
|
assert(err->status);
|
|
assert(!(err->status & (err->status - 1)));
|
|
|
|
errcap &= ~(PCI_ERR_CAP_FEP_MASK | PCI_ERR_CAP_TLP);
|
|
errcap |= PCI_ERR_CAP_FEP(first_bit);
|
|
|
|
if (err->flags & PCIE_AER_ERR_HEADER_VALID) {
|
|
for (i = 0; i < ARRAY_SIZE(err->header); ++i) {
|
|
/* 7.10.8 Header Log Register */
|
|
uint8_t *header_log =
|
|
aer_cap + PCI_ERR_HEADER_LOG + i * sizeof err->header[0];
|
|
cpu_to_be32wu((uint32_t*)header_log, err->header[i]);
|
|
}
|
|
} else {
|
|
assert(!(err->flags & PCIE_AER_ERR_TLP_PREFIX_PRESENT));
|
|
memset(aer_cap + PCI_ERR_HEADER_LOG, 0, PCI_ERR_HEADER_LOG_SIZE);
|
|
}
|
|
|
|
if ((err->flags & PCIE_AER_ERR_TLP_PREFIX_PRESENT) &&
|
|
(pci_get_long(dev->config + dev->exp.exp_cap + PCI_EXP_DEVCTL2) &
|
|
PCI_EXP_DEVCAP2_EETLPP)) {
|
|
for (i = 0; i < ARRAY_SIZE(err->prefix); ++i) {
|
|
/* 7.10.12 tlp prefix log register */
|
|
uint8_t *prefix_log =
|
|
aer_cap + PCI_ERR_TLP_PREFIX_LOG + i * sizeof err->prefix[0];
|
|
cpu_to_be32wu((uint32_t*)prefix_log, err->prefix[i]);
|
|
}
|
|
errcap |= PCI_ERR_CAP_TLP;
|
|
} else {
|
|
memset(aer_cap + PCI_ERR_TLP_PREFIX_LOG, 0,
|
|
PCI_ERR_TLP_PREFIX_LOG_SIZE);
|
|
}
|
|
pci_set_long(aer_cap + PCI_ERR_CAP, errcap);
|
|
}
|
|
|
|
static void pcie_aer_clear_log(PCIDevice *dev)
|
|
{
|
|
uint8_t *aer_cap = dev->config + dev->exp.aer_cap;
|
|
|
|
pci_long_test_and_clear_mask(aer_cap + PCI_ERR_CAP,
|
|
PCI_ERR_CAP_FEP_MASK | PCI_ERR_CAP_TLP);
|
|
|
|
memset(aer_cap + PCI_ERR_HEADER_LOG, 0, PCI_ERR_HEADER_LOG_SIZE);
|
|
memset(aer_cap + PCI_ERR_TLP_PREFIX_LOG, 0, PCI_ERR_TLP_PREFIX_LOG_SIZE);
|
|
}
|
|
|
|
static void pcie_aer_clear_error(PCIDevice *dev)
|
|
{
|
|
uint8_t *aer_cap = dev->config + dev->exp.aer_cap;
|
|
uint32_t errcap = pci_get_long(aer_cap + PCI_ERR_CAP);
|
|
PCIEAERLog *aer_log = &dev->exp.aer_log;
|
|
PCIEAERErr err;
|
|
|
|
if (!(errcap & PCI_ERR_CAP_MHRE) || !aer_log->log_num) {
|
|
pcie_aer_clear_log(dev);
|
|
return;
|
|
}
|
|
|
|
/*
|
|
* If more errors are queued, set corresponding bits in uncorrectable
|
|
* error status.
|
|
* We emulate uncorrectable error status register as W1CS.
|
|
* So set bit in uncorrectable error status here again for multiple
|
|
* error recording support.
|
|
*
|
|
* 6.2.4.2 Multiple Error Handling(Advanced Error Reporting Capability)
|
|
*/
|
|
pcie_aer_update_uncor_status(dev);
|
|
|
|
aer_log_del_err(aer_log, &err);
|
|
pcie_aer_update_log(dev, &err);
|
|
}
|
|
|
|
static int pcie_aer_record_error(PCIDevice *dev,
|
|
const PCIEAERErr *err)
|
|
{
|
|
uint8_t *aer_cap = dev->config + dev->exp.aer_cap;
|
|
uint32_t errcap = pci_get_long(aer_cap + PCI_ERR_CAP);
|
|
int fep = PCI_ERR_CAP_FEP(errcap);
|
|
|
|
assert(err->status);
|
|
assert(!(err->status & (err->status - 1)));
|
|
|
|
if (errcap & PCI_ERR_CAP_MHRE &&
|
|
(pci_get_long(aer_cap + PCI_ERR_UNCOR_STATUS) & (1U << fep))) {
|
|
/* Not first error. queue error */
|
|
if (aer_log_add_err(&dev->exp.aer_log, err) < 0) {
|
|
/* overflow */
|
|
return -1;
|
|
}
|
|
return 0;
|
|
}
|
|
|
|
pcie_aer_update_log(dev, err);
|
|
return 0;
|
|
}
|
|
|
|
typedef struct PCIEAERInject {
|
|
PCIDevice *dev;
|
|
uint8_t *aer_cap;
|
|
const PCIEAERErr *err;
|
|
uint16_t devctl;
|
|
uint16_t devsta;
|
|
uint32_t error_status;
|
|
bool unsupported_request;
|
|
bool log_overflow;
|
|
PCIEAERMsg msg;
|
|
} PCIEAERInject;
|
|
|
|
static bool pcie_aer_inject_cor_error(PCIEAERInject *inj,
|
|
uint32_t uncor_status,
|
|
bool is_advisory_nonfatal)
|
|
{
|
|
PCIDevice *dev = inj->dev;
|
|
|
|
inj->devsta |= PCI_EXP_DEVSTA_CED;
|
|
if (inj->unsupported_request) {
|
|
inj->devsta |= PCI_EXP_DEVSTA_URD;
|
|
}
|
|
pci_set_word(dev->config + dev->exp.exp_cap + PCI_EXP_DEVSTA, inj->devsta);
|
|
|
|
if (inj->aer_cap) {
|
|
uint32_t mask;
|
|
pci_long_test_and_set_mask(inj->aer_cap + PCI_ERR_COR_STATUS,
|
|
inj->error_status);
|
|
mask = pci_get_long(inj->aer_cap + PCI_ERR_COR_MASK);
|
|
if (mask & inj->error_status) {
|
|
return false;
|
|
}
|
|
if (is_advisory_nonfatal) {
|
|
uint32_t uncor_mask =
|
|
pci_get_long(inj->aer_cap + PCI_ERR_UNCOR_MASK);
|
|
if (!(uncor_mask & uncor_status)) {
|
|
inj->log_overflow = !!pcie_aer_record_error(dev, inj->err);
|
|
}
|
|
pci_long_test_and_set_mask(inj->aer_cap + PCI_ERR_UNCOR_STATUS,
|
|
uncor_status);
|
|
}
|
|
}
|
|
|
|
if (inj->unsupported_request && !(inj->devctl & PCI_EXP_DEVCTL_URRE)) {
|
|
return false;
|
|
}
|
|
if (!(inj->devctl & PCI_EXP_DEVCTL_CERE)) {
|
|
return false;
|
|
}
|
|
|
|
inj->msg.severity = PCI_ERR_ROOT_CMD_COR_EN;
|
|
return true;
|
|
}
|
|
|
|
static bool pcie_aer_inject_uncor_error(PCIEAERInject *inj, bool is_fatal)
|
|
{
|
|
PCIDevice *dev = inj->dev;
|
|
uint16_t cmd;
|
|
|
|
if (is_fatal) {
|
|
inj->devsta |= PCI_EXP_DEVSTA_FED;
|
|
} else {
|
|
inj->devsta |= PCI_EXP_DEVSTA_NFED;
|
|
}
|
|
if (inj->unsupported_request) {
|
|
inj->devsta |= PCI_EXP_DEVSTA_URD;
|
|
}
|
|
pci_set_long(dev->config + dev->exp.exp_cap + PCI_EXP_DEVSTA, inj->devsta);
|
|
|
|
if (inj->aer_cap) {
|
|
uint32_t mask = pci_get_long(inj->aer_cap + PCI_ERR_UNCOR_MASK);
|
|
if (mask & inj->error_status) {
|
|
pci_long_test_and_set_mask(inj->aer_cap + PCI_ERR_UNCOR_STATUS,
|
|
inj->error_status);
|
|
return false;
|
|
}
|
|
|
|
inj->log_overflow = !!pcie_aer_record_error(dev, inj->err);
|
|
pci_long_test_and_set_mask(inj->aer_cap + PCI_ERR_UNCOR_STATUS,
|
|
inj->error_status);
|
|
}
|
|
|
|
cmd = pci_get_word(dev->config + PCI_COMMAND);
|
|
if (inj->unsupported_request &&
|
|
!(inj->devctl & PCI_EXP_DEVCTL_URRE) && !(cmd & PCI_COMMAND_SERR)) {
|
|
return false;
|
|
}
|
|
if (is_fatal) {
|
|
if (!((cmd & PCI_COMMAND_SERR) ||
|
|
(inj->devctl & PCI_EXP_DEVCTL_FERE))) {
|
|
return false;
|
|
}
|
|
inj->msg.severity = PCI_ERR_ROOT_CMD_FATAL_EN;
|
|
} else {
|
|
if (!((cmd & PCI_COMMAND_SERR) ||
|
|
(inj->devctl & PCI_EXP_DEVCTL_NFERE))) {
|
|
return false;
|
|
}
|
|
inj->msg.severity = PCI_ERR_ROOT_CMD_NONFATAL_EN;
|
|
}
|
|
return true;
|
|
}
|
|
|
|
/*
|
|
* non-Function specific error must be recorded in all functions.
|
|
* It is the responsibility of the caller of this function.
|
|
* It is also caller's responsibility to determine which function should
|
|
* report the rerror.
|
|
*
|
|
* 6.2.4 Error Logging
|
|
* 6.2.5 Sqeunce of Device Error Signaling and Logging Operations
|
|
* table 6-2: Flowchard Showing Sequence of Device Error Signaling and Logging
|
|
* Operations
|
|
*/
|
|
int pcie_aer_inject_error(PCIDevice *dev, const PCIEAERErr *err)
|
|
{
|
|
uint8_t *aer_cap = NULL;
|
|
uint16_t devctl = 0;
|
|
uint16_t devsta = 0;
|
|
uint32_t error_status = err->status;
|
|
PCIEAERInject inj;
|
|
|
|
if (!pci_is_express(dev)) {
|
|
return -ENOSYS;
|
|
}
|
|
|
|
if (err->flags & PCIE_AER_ERR_IS_CORRECTABLE) {
|
|
error_status &= PCI_ERR_COR_SUPPORTED;
|
|
} else {
|
|
error_status &= PCI_ERR_UNC_SUPPORTED;
|
|
}
|
|
|
|
/* invalid status bit. one and only one bit must be set */
|
|
if (!error_status || (error_status & (error_status - 1))) {
|
|
return -EINVAL;
|
|
}
|
|
|
|
if (dev->exp.aer_cap) {
|
|
uint8_t *exp_cap = dev->config + dev->exp.exp_cap;
|
|
aer_cap = dev->config + dev->exp.aer_cap;
|
|
devctl = pci_get_long(exp_cap + PCI_EXP_DEVCTL);
|
|
devsta = pci_get_long(exp_cap + PCI_EXP_DEVSTA);
|
|
}
|
|
|
|
inj.dev = dev;
|
|
inj.aer_cap = aer_cap;
|
|
inj.err = err;
|
|
inj.devctl = devctl;
|
|
inj.devsta = devsta;
|
|
inj.error_status = error_status;
|
|
inj.unsupported_request = !(err->flags & PCIE_AER_ERR_IS_CORRECTABLE) &&
|
|
err->status == PCI_ERR_UNC_UNSUP;
|
|
inj.log_overflow = false;
|
|
|
|
if (err->flags & PCIE_AER_ERR_IS_CORRECTABLE) {
|
|
if (!pcie_aer_inject_cor_error(&inj, 0, false)) {
|
|
return 0;
|
|
}
|
|
} else {
|
|
bool is_fatal =
|
|
pcie_aer_uncor_default_severity(error_status) ==
|
|
PCI_ERR_ROOT_CMD_FATAL_EN;
|
|
if (aer_cap) {
|
|
is_fatal =
|
|
error_status & pci_get_long(aer_cap + PCI_ERR_UNCOR_SEVER);
|
|
}
|
|
if (!is_fatal && (err->flags & PCIE_AER_ERR_MAYBE_ADVISORY)) {
|
|
inj.error_status = PCI_ERR_COR_ADV_NONFATAL;
|
|
if (!pcie_aer_inject_cor_error(&inj, error_status, true)) {
|
|
return 0;
|
|
}
|
|
} else {
|
|
if (!pcie_aer_inject_uncor_error(&inj, is_fatal)) {
|
|
return 0;
|
|
}
|
|
}
|
|
}
|
|
|
|
/* send up error message */
|
|
inj.msg.source_id = err->source_id;
|
|
pcie_aer_msg(dev, &inj.msg);
|
|
|
|
if (inj.log_overflow) {
|
|
PCIEAERErr header_log_overflow = {
|
|
.status = PCI_ERR_COR_HL_OVERFLOW,
|
|
.flags = PCIE_AER_ERR_IS_CORRECTABLE,
|
|
};
|
|
int ret = pcie_aer_inject_error(dev, &header_log_overflow);
|
|
assert(!ret);
|
|
}
|
|
return 0;
|
|
}
|
|
|
|
void pcie_aer_write_config(PCIDevice *dev,
|
|
uint32_t addr, uint32_t val, int len)
|
|
{
|
|
uint8_t *aer_cap = dev->config + dev->exp.aer_cap;
|
|
uint32_t errcap = pci_get_long(aer_cap + PCI_ERR_CAP);
|
|
uint32_t first_error = 1U << PCI_ERR_CAP_FEP(errcap);
|
|
uint32_t uncorsta = pci_get_long(aer_cap + PCI_ERR_UNCOR_STATUS);
|
|
|
|
/* uncorrectable error */
|
|
if (!(uncorsta & first_error)) {
|
|
/* the bit that corresponds to the first error is cleared */
|
|
pcie_aer_clear_error(dev);
|
|
} else if (errcap & PCI_ERR_CAP_MHRE) {
|
|
/* When PCI_ERR_CAP_MHRE is enabled and the first error isn't cleared
|
|
* nothing should happen. So we have to revert the modification to
|
|
* the register.
|
|
*/
|
|
pcie_aer_update_uncor_status(dev);
|
|
} else {
|
|
/* capability & control
|
|
* PCI_ERR_CAP_MHRE might be cleared, so clear of header log.
|
|
*/
|
|
aer_log_clear_all_err(&dev->exp.aer_log);
|
|
}
|
|
}
|
|
|
|
void pcie_aer_root_init(PCIDevice *dev)
|
|
{
|
|
uint16_t pos = dev->exp.aer_cap;
|
|
|
|
pci_set_long(dev->wmask + pos + PCI_ERR_ROOT_COMMAND,
|
|
PCI_ERR_ROOT_CMD_EN_MASK);
|
|
pci_set_long(dev->w1cmask + pos + PCI_ERR_ROOT_STATUS,
|
|
PCI_ERR_ROOT_STATUS_REPORT_MASK);
|
|
/* PCI_ERR_ROOT_IRQ is RO but devices change it using a
|
|
* device-specific method.
|
|
*/
|
|
pci_set_long(dev->cmask + pos + PCI_ERR_ROOT_STATUS,
|
|
~PCI_ERR_ROOT_IRQ);
|
|
}
|
|
|
|
void pcie_aer_root_reset(PCIDevice *dev)
|
|
{
|
|
uint8_t* aer_cap = dev->config + dev->exp.aer_cap;
|
|
|
|
pci_set_long(aer_cap + PCI_ERR_ROOT_COMMAND, 0);
|
|
|
|
/*
|
|
* Advanced Error Interrupt Message Number in Root Error Status Register
|
|
* must be updated by chip dependent code because it's chip dependent
|
|
* which number is used.
|
|
*/
|
|
}
|
|
|
|
void pcie_aer_root_write_config(PCIDevice *dev,
|
|
uint32_t addr, uint32_t val, int len,
|
|
uint32_t root_cmd_prev)
|
|
{
|
|
uint8_t *aer_cap = dev->config + dev->exp.aer_cap;
|
|
uint32_t root_status = pci_get_long(aer_cap + PCI_ERR_ROOT_STATUS);
|
|
uint32_t enabled_cmd = pcie_aer_status_to_cmd(root_status);
|
|
uint32_t root_cmd = pci_get_long(aer_cap + PCI_ERR_ROOT_COMMAND);
|
|
/* 6.2.4.1.2 Interrupt Generation */
|
|
if (!msix_enabled(dev) && !msi_enabled(dev)) {
|
|
qemu_set_irq(dev->irq[dev->exp.aer_intx], !!(root_cmd & enabled_cmd));
|
|
return;
|
|
}
|
|
|
|
if ((root_cmd_prev & enabled_cmd) || !(root_cmd & enabled_cmd)) {
|
|
/* Send MSI on transition from false to true. */
|
|
return;
|
|
}
|
|
|
|
pcie_aer_root_notify(dev);
|
|
}
|
|
|
|
static const VMStateDescription vmstate_pcie_aer_err = {
|
|
.name = "PCIE_AER_ERROR",
|
|
.version_id = 1,
|
|
.minimum_version_id = 1,
|
|
.minimum_version_id_old = 1,
|
|
.fields = (VMStateField[]) {
|
|
VMSTATE_UINT32(status, PCIEAERErr),
|
|
VMSTATE_UINT16(source_id, PCIEAERErr),
|
|
VMSTATE_UINT16(flags, PCIEAERErr),
|
|
VMSTATE_UINT32_ARRAY(header, PCIEAERErr, 4),
|
|
VMSTATE_UINT32_ARRAY(prefix, PCIEAERErr, 4),
|
|
VMSTATE_END_OF_LIST()
|
|
}
|
|
};
|
|
|
|
const VMStateDescription vmstate_pcie_aer_log = {
|
|
.name = "PCIE_AER_ERROR_LOG",
|
|
.version_id = 1,
|
|
.minimum_version_id = 1,
|
|
.minimum_version_id_old = 1,
|
|
.fields = (VMStateField[]) {
|
|
VMSTATE_UINT16(log_num, PCIEAERLog),
|
|
VMSTATE_UINT16(log_max, PCIEAERLog),
|
|
VMSTATE_STRUCT_VARRAY_POINTER_UINT16(log, PCIEAERLog, log_num,
|
|
vmstate_pcie_aer_err, PCIEAERErr),
|
|
VMSTATE_END_OF_LIST()
|
|
}
|
|
};
|
|
|
|
void pcie_aer_inject_error_print(Monitor *mon, const QObject *data)
|
|
{
|
|
QDict *qdict;
|
|
int devfn;
|
|
assert(qobject_type(data) == QTYPE_QDICT);
|
|
qdict = qobject_to_qdict(data);
|
|
|
|
devfn = (int)qdict_get_int(qdict, "devfn");
|
|
monitor_printf(mon, "OK id: %s domain: %x, bus: %x devfn: %x.%x\n",
|
|
qdict_get_str(qdict, "id"),
|
|
(int) qdict_get_int(qdict, "domain"),
|
|
(int) qdict_get_int(qdict, "bus"),
|
|
PCI_SLOT(devfn), PCI_FUNC(devfn));
|
|
}
|
|
|
|
typedef struct PCIEAERErrorName {
|
|
const char *name;
|
|
uint32_t val;
|
|
bool correctable;
|
|
} PCIEAERErrorName;
|
|
|
|
/*
|
|
* AER error name -> value conversion table
|
|
* This naming scheme is same to linux aer-injection tool.
|
|
*/
|
|
static const struct PCIEAERErrorName pcie_aer_error_list[] = {
|
|
{
|
|
.name = "TRAIN",
|
|
.val = PCI_ERR_UNC_TRAIN,
|
|
.correctable = false,
|
|
}, {
|
|
.name = "DLP",
|
|
.val = PCI_ERR_UNC_DLP,
|
|
.correctable = false,
|
|
}, {
|
|
.name = "SDN",
|
|
.val = PCI_ERR_UNC_SDN,
|
|
.correctable = false,
|
|
}, {
|
|
.name = "POISON_TLP",
|
|
.val = PCI_ERR_UNC_POISON_TLP,
|
|
.correctable = false,
|
|
}, {
|
|
.name = "FCP",
|
|
.val = PCI_ERR_UNC_FCP,
|
|
.correctable = false,
|
|
}, {
|
|
.name = "COMP_TIME",
|
|
.val = PCI_ERR_UNC_COMP_TIME,
|
|
.correctable = false,
|
|
}, {
|
|
.name = "COMP_ABORT",
|
|
.val = PCI_ERR_UNC_COMP_ABORT,
|
|
.correctable = false,
|
|
}, {
|
|
.name = "UNX_COMP",
|
|
.val = PCI_ERR_UNC_UNX_COMP,
|
|
.correctable = false,
|
|
}, {
|
|
.name = "RX_OVER",
|
|
.val = PCI_ERR_UNC_RX_OVER,
|
|
.correctable = false,
|
|
}, {
|
|
.name = "MALF_TLP",
|
|
.val = PCI_ERR_UNC_MALF_TLP,
|
|
.correctable = false,
|
|
}, {
|
|
.name = "ECRC",
|
|
.val = PCI_ERR_UNC_ECRC,
|
|
.correctable = false,
|
|
}, {
|
|
.name = "UNSUP",
|
|
.val = PCI_ERR_UNC_UNSUP,
|
|
.correctable = false,
|
|
}, {
|
|
.name = "ACSV",
|
|
.val = PCI_ERR_UNC_ACSV,
|
|
.correctable = false,
|
|
}, {
|
|
.name = "INTN",
|
|
.val = PCI_ERR_UNC_INTN,
|
|
.correctable = false,
|
|
}, {
|
|
.name = "MCBTLP",
|
|
.val = PCI_ERR_UNC_MCBTLP,
|
|
.correctable = false,
|
|
}, {
|
|
.name = "ATOP_EBLOCKED",
|
|
.val = PCI_ERR_UNC_ATOP_EBLOCKED,
|
|
.correctable = false,
|
|
}, {
|
|
.name = "TLP_PRF_BLOCKED",
|
|
.val = PCI_ERR_UNC_TLP_PRF_BLOCKED,
|
|
.correctable = false,
|
|
}, {
|
|
.name = "RCVR",
|
|
.val = PCI_ERR_COR_RCVR,
|
|
.correctable = true,
|
|
}, {
|
|
.name = "BAD_TLP",
|
|
.val = PCI_ERR_COR_BAD_TLP,
|
|
.correctable = true,
|
|
}, {
|
|
.name = "BAD_DLLP",
|
|
.val = PCI_ERR_COR_BAD_DLLP,
|
|
.correctable = true,
|
|
}, {
|
|
.name = "REP_ROLL",
|
|
.val = PCI_ERR_COR_REP_ROLL,
|
|
.correctable = true,
|
|
}, {
|
|
.name = "REP_TIMER",
|
|
.val = PCI_ERR_COR_REP_TIMER,
|
|
.correctable = true,
|
|
}, {
|
|
.name = "ADV_NONFATAL",
|
|
.val = PCI_ERR_COR_ADV_NONFATAL,
|
|
.correctable = true,
|
|
}, {
|
|
.name = "INTERNAL",
|
|
.val = PCI_ERR_COR_INTERNAL,
|
|
.correctable = true,
|
|
}, {
|
|
.name = "HL_OVERFLOW",
|
|
.val = PCI_ERR_COR_HL_OVERFLOW,
|
|
.correctable = true,
|
|
},
|
|
};
|
|
|
|
static int pcie_aer_parse_error_string(const char *error_name,
|
|
uint32_t *status, bool *correctable)
|
|
{
|
|
int i;
|
|
|
|
for (i = 0; i < ARRAY_SIZE(pcie_aer_error_list); i++) {
|
|
const PCIEAERErrorName *e = &pcie_aer_error_list[i];
|
|
if (strcmp(error_name, e->name)) {
|
|
continue;
|
|
}
|
|
|
|
*status = e->val;
|
|
*correctable = e->correctable;
|
|
return 0;
|
|
}
|
|
return -EINVAL;
|
|
}
|
|
|
|
int do_pcie_aer_inject_error(Monitor *mon,
|
|
const QDict *qdict, QObject **ret_data)
|
|
{
|
|
const char *id = qdict_get_str(qdict, "id");
|
|
const char *error_name;
|
|
uint32_t error_status;
|
|
bool correctable;
|
|
PCIDevice *dev;
|
|
PCIEAERErr err;
|
|
int ret;
|
|
|
|
ret = pci_qdev_find_device(id, &dev);
|
|
if (ret < 0) {
|
|
monitor_printf(mon,
|
|
"id or pci device path is invalid or device not "
|
|
"found. %s\n", id);
|
|
return ret;
|
|
}
|
|
if (!pci_is_express(dev)) {
|
|
monitor_printf(mon, "the device doesn't support pci express. %s\n",
|
|
id);
|
|
return -ENOSYS;
|
|
}
|
|
|
|
error_name = qdict_get_str(qdict, "error_status");
|
|
if (pcie_aer_parse_error_string(error_name, &error_status, &correctable)) {
|
|
char *e = NULL;
|
|
error_status = strtoul(error_name, &e, 0);
|
|
correctable = qdict_get_try_bool(qdict, "correctable", 0);
|
|
if (!e || *e != '\0') {
|
|
monitor_printf(mon, "invalid error status value. \"%s\"",
|
|
error_name);
|
|
return -EINVAL;
|
|
}
|
|
}
|
|
err.status = error_status;
|
|
err.source_id = (pci_bus_num(dev->bus) << 8) | dev->devfn;
|
|
|
|
err.flags = 0;
|
|
if (correctable) {
|
|
err.flags |= PCIE_AER_ERR_IS_CORRECTABLE;
|
|
}
|
|
if (qdict_get_try_bool(qdict, "advisory_non_fatal", 0)) {
|
|
err.flags |= PCIE_AER_ERR_MAYBE_ADVISORY;
|
|
}
|
|
if (qdict_haskey(qdict, "header0")) {
|
|
err.flags |= PCIE_AER_ERR_HEADER_VALID;
|
|
}
|
|
if (qdict_haskey(qdict, "prefix0")) {
|
|
err.flags |= PCIE_AER_ERR_TLP_PREFIX_PRESENT;
|
|
}
|
|
|
|
err.header[0] = qdict_get_try_int(qdict, "header0", 0);
|
|
err.header[1] = qdict_get_try_int(qdict, "header1", 0);
|
|
err.header[2] = qdict_get_try_int(qdict, "header2", 0);
|
|
err.header[3] = qdict_get_try_int(qdict, "header3", 0);
|
|
|
|
err.prefix[0] = qdict_get_try_int(qdict, "prefix0", 0);
|
|
err.prefix[1] = qdict_get_try_int(qdict, "prefix1", 0);
|
|
err.prefix[2] = qdict_get_try_int(qdict, "prefix2", 0);
|
|
err.prefix[3] = qdict_get_try_int(qdict, "prefix3", 0);
|
|
|
|
ret = pcie_aer_inject_error(dev, &err);
|
|
*ret_data = qobject_from_jsonf("{'id': %s, "
|
|
"'domain': %d, 'bus': %d, 'devfn': %d, "
|
|
"'ret': %d}",
|
|
id,
|
|
pci_find_domain(dev->bus),
|
|
pci_bus_num(dev->bus), dev->devfn,
|
|
ret);
|
|
assert(*ret_data);
|
|
|
|
return 0;
|
|
}
|