mirror: clarify mirror_do_read return code
[qemu.git] / hw / pci / pcie_aer.c
blobe2d4e68ba3db2b8a048c8cead7ef082612b24fcd
1 /*
2 * pcie_aer.c
4 * Copyright (c) 2010 Isaku Yamahata <yamahata at valinux co jp>
5 * VA Linux Systems Japan K.K.
7 * This program is free software; you can redistribute it and/or modify
8 * it under the terms of the GNU General Public License as published by
9 * the Free Software Foundation; either version 2 of the License, or
10 * (at your option) any later version.
12 * This program is distributed in the hope that it will be useful,
13 * but WITHOUT ANY WARRANTY; without even the implied warranty of
14 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
15 * GNU General Public License for more details.
17 * You should have received a copy of the GNU General Public License along
18 * with this program; if not, see <http://www.gnu.org/licenses/>.
21 #include "qemu/osdep.h"
22 #include "sysemu/sysemu.h"
23 #include "qapi/qmp/types.h"
24 #include "monitor/monitor.h"
25 #include "hw/pci/pci_bridge.h"
26 #include "hw/pci/pcie.h"
27 #include "hw/pci/msix.h"
28 #include "hw/pci/msi.h"
29 #include "hw/pci/pci_bus.h"
30 #include "hw/pci/pcie_regs.h"
32 //#define DEBUG_PCIE
33 #ifdef DEBUG_PCIE
34 # define PCIE_DPRINTF(fmt, ...) \
35 fprintf(stderr, "%s:%d " fmt, __func__, __LINE__, ## __VA_ARGS__)
36 #else
37 # define PCIE_DPRINTF(fmt, ...) do {} while (0)
38 #endif
39 #define PCIE_DEV_PRINTF(dev, fmt, ...) \
40 PCIE_DPRINTF("%s:%x "fmt, (dev)->name, (dev)->devfn, ## __VA_ARGS__)
42 #define PCI_ERR_SRC_COR_OFFS 0
43 #define PCI_ERR_SRC_UNCOR_OFFS 2
45 /* From 6.2.7 Error Listing and Rules. Table 6-2, 6-3 and 6-4 */
46 static uint32_t pcie_aer_uncor_default_severity(uint32_t status)
48 switch (status) {
49 case PCI_ERR_UNC_INTN:
50 case PCI_ERR_UNC_DLP:
51 case PCI_ERR_UNC_SDN:
52 case PCI_ERR_UNC_RX_OVER:
53 case PCI_ERR_UNC_FCP:
54 case PCI_ERR_UNC_MALF_TLP:
55 return PCI_ERR_ROOT_CMD_FATAL_EN;
56 case PCI_ERR_UNC_POISON_TLP:
57 case PCI_ERR_UNC_ECRC:
58 case PCI_ERR_UNC_UNSUP:
59 case PCI_ERR_UNC_COMP_TIME:
60 case PCI_ERR_UNC_COMP_ABORT:
61 case PCI_ERR_UNC_UNX_COMP:
62 case PCI_ERR_UNC_ACSV:
63 case PCI_ERR_UNC_MCBTLP:
64 case PCI_ERR_UNC_ATOP_EBLOCKED:
65 case PCI_ERR_UNC_TLP_PRF_BLOCKED:
66 return PCI_ERR_ROOT_CMD_NONFATAL_EN;
67 default:
68 abort();
69 break;
71 return PCI_ERR_ROOT_CMD_FATAL_EN;
74 static int aer_log_add_err(PCIEAERLog *aer_log, const PCIEAERErr *err)
76 if (aer_log->log_num == aer_log->log_max) {
77 return -1;
79 memcpy(&aer_log->log[aer_log->log_num], err, sizeof *err);
80 aer_log->log_num++;
81 return 0;
84 static void aer_log_del_err(PCIEAERLog *aer_log, PCIEAERErr *err)
86 assert(aer_log->log_num);
87 *err = aer_log->log[0];
88 aer_log->log_num--;
89 memmove(&aer_log->log[0], &aer_log->log[1],
90 aer_log->log_num * sizeof *err);
93 static void aer_log_clear_all_err(PCIEAERLog *aer_log)
95 aer_log->log_num = 0;
98 int pcie_aer_init(PCIDevice *dev, uint16_t offset, uint16_t size)
100 PCIExpressDevice *exp;
102 pcie_add_capability(dev, PCI_EXT_CAP_ID_ERR, PCI_ERR_VER,
103 offset, size);
104 exp = &dev->exp;
105 exp->aer_cap = offset;
107 /* log_max is property */
108 if (dev->exp.aer_log.log_max == PCIE_AER_LOG_MAX_UNSET) {
109 dev->exp.aer_log.log_max = PCIE_AER_LOG_MAX_DEFAULT;
111 /* clip down the value to avoid unreasobale memory usage */
112 if (dev->exp.aer_log.log_max > PCIE_AER_LOG_MAX_LIMIT) {
113 return -EINVAL;
115 dev->exp.aer_log.log = g_malloc0(sizeof dev->exp.aer_log.log[0] *
116 dev->exp.aer_log.log_max);
118 pci_set_long(dev->w1cmask + offset + PCI_ERR_UNCOR_STATUS,
119 PCI_ERR_UNC_SUPPORTED);
121 pci_set_long(dev->config + offset + PCI_ERR_UNCOR_SEVER,
122 PCI_ERR_UNC_SEVERITY_DEFAULT);
123 pci_set_long(dev->wmask + offset + PCI_ERR_UNCOR_SEVER,
124 PCI_ERR_UNC_SUPPORTED);
126 pci_long_test_and_set_mask(dev->w1cmask + offset + PCI_ERR_COR_STATUS,
127 PCI_ERR_COR_SUPPORTED);
129 pci_set_long(dev->config + offset + PCI_ERR_COR_MASK,
130 PCI_ERR_COR_MASK_DEFAULT);
131 pci_set_long(dev->wmask + offset + PCI_ERR_COR_MASK,
132 PCI_ERR_COR_SUPPORTED);
134 /* capabilities and control. multiple header logging is supported */
135 if (dev->exp.aer_log.log_max > 0) {
136 pci_set_long(dev->config + offset + PCI_ERR_CAP,
137 PCI_ERR_CAP_ECRC_GENC | PCI_ERR_CAP_ECRC_CHKC |
138 PCI_ERR_CAP_MHRC);
139 pci_set_long(dev->wmask + offset + PCI_ERR_CAP,
140 PCI_ERR_CAP_ECRC_GENE | PCI_ERR_CAP_ECRC_CHKE |
141 PCI_ERR_CAP_MHRE);
142 } else {
143 pci_set_long(dev->config + offset + PCI_ERR_CAP,
144 PCI_ERR_CAP_ECRC_GENC | PCI_ERR_CAP_ECRC_CHKC);
145 pci_set_long(dev->wmask + offset + PCI_ERR_CAP,
146 PCI_ERR_CAP_ECRC_GENE | PCI_ERR_CAP_ECRC_CHKE);
149 switch (pcie_cap_get_type(dev)) {
150 case PCI_EXP_TYPE_ROOT_PORT:
151 /* this case will be set by pcie_aer_root_init() */
152 /* fallthrough */
153 case PCI_EXP_TYPE_DOWNSTREAM:
154 case PCI_EXP_TYPE_UPSTREAM:
155 pci_word_test_and_set_mask(dev->wmask + PCI_BRIDGE_CONTROL,
156 PCI_BRIDGE_CTL_SERR);
157 pci_long_test_and_set_mask(dev->w1cmask + PCI_STATUS,
158 PCI_SEC_STATUS_RCV_SYSTEM_ERROR);
159 break;
160 default:
161 /* nothing */
162 break;
164 return 0;
167 void pcie_aer_exit(PCIDevice *dev)
169 g_free(dev->exp.aer_log.log);
172 static void pcie_aer_update_uncor_status(PCIDevice *dev)
174 uint8_t *aer_cap = dev->config + dev->exp.aer_cap;
175 PCIEAERLog *aer_log = &dev->exp.aer_log;
177 uint16_t i;
178 for (i = 0; i < aer_log->log_num; i++) {
179 pci_long_test_and_set_mask(aer_cap + PCI_ERR_UNCOR_STATUS,
180 dev->exp.aer_log.log[i].status);
185 * return value:
186 * true: error message needs to be sent up
187 * false: error message is masked
189 * 6.2.6 Error Message Control
190 * Figure 6-3
191 * all pci express devices part
193 static bool
194 pcie_aer_msg_alldev(PCIDevice *dev, const PCIEAERMsg *msg)
196 if (!(pcie_aer_msg_is_uncor(msg) &&
197 (pci_get_word(dev->config + PCI_COMMAND) & PCI_COMMAND_SERR))) {
198 return false;
201 /* Signaled System Error
203 * 7.5.1.1 Command register
204 * Bit 8 SERR# Enable
206 * When Set, this bit enables reporting of Non-fatal and Fatal
207 * errors detected by the Function to the Root Complex. Note that
208 * errors are reported if enabled either through this bit or through
209 * the PCI Express specific bits in the Device Control register (see
210 * Section 7.8.4).
212 pci_word_test_and_set_mask(dev->config + PCI_STATUS,
213 PCI_STATUS_SIG_SYSTEM_ERROR);
215 if (!(msg->severity &
216 pci_get_word(dev->config + dev->exp.exp_cap + PCI_EXP_DEVCTL))) {
217 return false;
220 /* send up error message */
221 return true;
225 * return value:
226 * true: error message is sent up
227 * false: error message is masked
229 * 6.2.6 Error Message Control
230 * Figure 6-3
231 * virtual pci bridge part
233 static bool pcie_aer_msg_vbridge(PCIDevice *dev, const PCIEAERMsg *msg)
235 uint16_t bridge_control = pci_get_word(dev->config + PCI_BRIDGE_CONTROL);
237 if (pcie_aer_msg_is_uncor(msg)) {
238 /* Received System Error */
239 pci_word_test_and_set_mask(dev->config + PCI_SEC_STATUS,
240 PCI_SEC_STATUS_RCV_SYSTEM_ERROR);
243 if (!(bridge_control & PCI_BRIDGE_CTL_SERR)) {
244 return false;
246 return true;
249 void pcie_aer_root_set_vector(PCIDevice *dev, unsigned int vector)
251 uint8_t *aer_cap = dev->config + dev->exp.aer_cap;
252 assert(vector < PCI_ERR_ROOT_IRQ_MAX);
253 pci_long_test_and_clear_mask(aer_cap + PCI_ERR_ROOT_STATUS,
254 PCI_ERR_ROOT_IRQ);
255 pci_long_test_and_set_mask(aer_cap + PCI_ERR_ROOT_STATUS,
256 vector << PCI_ERR_ROOT_IRQ_SHIFT);
259 static unsigned int pcie_aer_root_get_vector(PCIDevice *dev)
261 uint8_t *aer_cap = dev->config + dev->exp.aer_cap;
262 uint32_t root_status = pci_get_long(aer_cap + PCI_ERR_ROOT_STATUS);
263 return (root_status & PCI_ERR_ROOT_IRQ) >> PCI_ERR_ROOT_IRQ_SHIFT;
266 /* Given a status register, get corresponding bits in the command register */
267 static uint32_t pcie_aer_status_to_cmd(uint32_t status)
269 uint32_t cmd = 0;
270 if (status & PCI_ERR_ROOT_COR_RCV) {
271 cmd |= PCI_ERR_ROOT_CMD_COR_EN;
273 if (status & PCI_ERR_ROOT_NONFATAL_RCV) {
274 cmd |= PCI_ERR_ROOT_CMD_NONFATAL_EN;
276 if (status & PCI_ERR_ROOT_FATAL_RCV) {
277 cmd |= PCI_ERR_ROOT_CMD_FATAL_EN;
279 return cmd;
282 static void pcie_aer_root_notify(PCIDevice *dev)
284 if (msix_enabled(dev)) {
285 msix_notify(dev, pcie_aer_root_get_vector(dev));
286 } else if (msi_enabled(dev)) {
287 msi_notify(dev, pcie_aer_root_get_vector(dev));
288 } else {
289 pci_irq_assert(dev);
294 * 6.2.6 Error Message Control
295 * Figure 6-3
296 * root port part
298 static void pcie_aer_msg_root_port(PCIDevice *dev, const PCIEAERMsg *msg)
300 uint16_t cmd;
301 uint8_t *aer_cap;
302 uint32_t root_cmd;
303 uint32_t root_status, prev_status;
305 cmd = pci_get_word(dev->config + PCI_COMMAND);
306 aer_cap = dev->config + dev->exp.aer_cap;
307 root_cmd = pci_get_long(aer_cap + PCI_ERR_ROOT_COMMAND);
308 prev_status = root_status = pci_get_long(aer_cap + PCI_ERR_ROOT_STATUS);
310 if (cmd & PCI_COMMAND_SERR) {
311 /* System Error.
313 * The way to report System Error is platform specific and
314 * it isn't implemented in qemu right now.
315 * So just discard the error for now.
316 * OS which cares of aer would receive errors via
317 * native aer mechanims, so this wouldn't matter.
321 /* Errro Message Received: Root Error Status register */
322 switch (msg->severity) {
323 case PCI_ERR_ROOT_CMD_COR_EN:
324 if (root_status & PCI_ERR_ROOT_COR_RCV) {
325 root_status |= PCI_ERR_ROOT_MULTI_COR_RCV;
326 } else {
327 pci_set_word(aer_cap + PCI_ERR_ROOT_ERR_SRC + PCI_ERR_SRC_COR_OFFS,
328 msg->source_id);
330 root_status |= PCI_ERR_ROOT_COR_RCV;
331 break;
332 case PCI_ERR_ROOT_CMD_NONFATAL_EN:
333 root_status |= PCI_ERR_ROOT_NONFATAL_RCV;
334 break;
335 case PCI_ERR_ROOT_CMD_FATAL_EN:
336 if (!(root_status & PCI_ERR_ROOT_UNCOR_RCV)) {
337 root_status |= PCI_ERR_ROOT_FIRST_FATAL;
339 root_status |= PCI_ERR_ROOT_FATAL_RCV;
340 break;
341 default:
342 abort();
343 break;
345 if (pcie_aer_msg_is_uncor(msg)) {
346 if (root_status & PCI_ERR_ROOT_UNCOR_RCV) {
347 root_status |= PCI_ERR_ROOT_MULTI_UNCOR_RCV;
348 } else {
349 pci_set_word(aer_cap + PCI_ERR_ROOT_ERR_SRC +
350 PCI_ERR_SRC_UNCOR_OFFS, msg->source_id);
352 root_status |= PCI_ERR_ROOT_UNCOR_RCV;
354 pci_set_long(aer_cap + PCI_ERR_ROOT_STATUS, root_status);
356 /* 6.2.4.1.2 Interrupt Generation */
357 /* All the above did was set some bits in the status register.
358 * Specifically these that match message severity.
359 * The below code relies on this fact. */
360 if (!(root_cmd & msg->severity) ||
361 (pcie_aer_status_to_cmd(prev_status) & root_cmd)) {
362 /* Condition is not being set or was already true so nothing to do. */
363 return;
366 pcie_aer_root_notify(dev);
370 * 6.2.6 Error Message Control Figure 6-3
372 * Walk up the bus tree from the device, propagate the error message.
374 void pcie_aer_msg(PCIDevice *dev, const PCIEAERMsg *msg)
376 uint8_t type;
378 while (dev) {
379 if (!pci_is_express(dev)) {
380 /* just ignore it */
381 /* TODO: Shouldn't we set PCI_STATUS_SIG_SYSTEM_ERROR?
382 * Consider e.g. a PCI bridge above a PCI Express device. */
383 return;
386 type = pcie_cap_get_type(dev);
387 if ((type == PCI_EXP_TYPE_ROOT_PORT ||
388 type == PCI_EXP_TYPE_UPSTREAM ||
389 type == PCI_EXP_TYPE_DOWNSTREAM) &&
390 !pcie_aer_msg_vbridge(dev, msg)) {
391 return;
393 if (!pcie_aer_msg_alldev(dev, msg)) {
394 return;
396 if (type == PCI_EXP_TYPE_ROOT_PORT) {
397 pcie_aer_msg_root_port(dev, msg);
398 /* Root port can notify system itself,
399 or send the error message to root complex event collector. */
401 * if root port is associated with an event collector,
402 * return the root complex event collector here.
403 * For now root complex event collector isn't supported.
405 return;
407 dev = pci_bridge_get_device(dev->bus);
411 static void pcie_aer_update_log(PCIDevice *dev, const PCIEAERErr *err)
413 uint8_t *aer_cap = dev->config + dev->exp.aer_cap;
414 uint8_t first_bit = ctz32(err->status);
415 uint32_t errcap = pci_get_long(aer_cap + PCI_ERR_CAP);
416 int i;
418 assert(err->status);
419 assert(!(err->status & (err->status - 1)));
421 errcap &= ~(PCI_ERR_CAP_FEP_MASK | PCI_ERR_CAP_TLP);
422 errcap |= PCI_ERR_CAP_FEP(first_bit);
424 if (err->flags & PCIE_AER_ERR_HEADER_VALID) {
425 for (i = 0; i < ARRAY_SIZE(err->header); ++i) {
426 /* 7.10.8 Header Log Register */
427 uint8_t *header_log =
428 aer_cap + PCI_ERR_HEADER_LOG + i * sizeof err->header[0];
429 stl_be_p(header_log, err->header[i]);
431 } else {
432 assert(!(err->flags & PCIE_AER_ERR_TLP_PREFIX_PRESENT));
433 memset(aer_cap + PCI_ERR_HEADER_LOG, 0, PCI_ERR_HEADER_LOG_SIZE);
436 if ((err->flags & PCIE_AER_ERR_TLP_PREFIX_PRESENT) &&
437 (pci_get_long(dev->config + dev->exp.exp_cap + PCI_EXP_DEVCAP2) &
438 PCI_EXP_DEVCAP2_EETLPP)) {
439 for (i = 0; i < ARRAY_SIZE(err->prefix); ++i) {
440 /* 7.10.12 tlp prefix log register */
441 uint8_t *prefix_log =
442 aer_cap + PCI_ERR_TLP_PREFIX_LOG + i * sizeof err->prefix[0];
443 stl_be_p(prefix_log, err->prefix[i]);
445 errcap |= PCI_ERR_CAP_TLP;
446 } else {
447 memset(aer_cap + PCI_ERR_TLP_PREFIX_LOG, 0,
448 PCI_ERR_TLP_PREFIX_LOG_SIZE);
450 pci_set_long(aer_cap + PCI_ERR_CAP, errcap);
453 static void pcie_aer_clear_log(PCIDevice *dev)
455 uint8_t *aer_cap = dev->config + dev->exp.aer_cap;
457 pci_long_test_and_clear_mask(aer_cap + PCI_ERR_CAP,
458 PCI_ERR_CAP_FEP_MASK | PCI_ERR_CAP_TLP);
460 memset(aer_cap + PCI_ERR_HEADER_LOG, 0, PCI_ERR_HEADER_LOG_SIZE);
461 memset(aer_cap + PCI_ERR_TLP_PREFIX_LOG, 0, PCI_ERR_TLP_PREFIX_LOG_SIZE);
464 static void pcie_aer_clear_error(PCIDevice *dev)
466 uint8_t *aer_cap = dev->config + dev->exp.aer_cap;
467 uint32_t errcap = pci_get_long(aer_cap + PCI_ERR_CAP);
468 PCIEAERLog *aer_log = &dev->exp.aer_log;
469 PCIEAERErr err;
471 if (!(errcap & PCI_ERR_CAP_MHRE) || !aer_log->log_num) {
472 pcie_aer_clear_log(dev);
473 return;
477 * If more errors are queued, set corresponding bits in uncorrectable
478 * error status.
479 * We emulate uncorrectable error status register as W1CS.
480 * So set bit in uncorrectable error status here again for multiple
481 * error recording support.
483 * 6.2.4.2 Multiple Error Handling(Advanced Error Reporting Capability)
485 pcie_aer_update_uncor_status(dev);
487 aer_log_del_err(aer_log, &err);
488 pcie_aer_update_log(dev, &err);
491 static int pcie_aer_record_error(PCIDevice *dev,
492 const PCIEAERErr *err)
494 uint8_t *aer_cap = dev->config + dev->exp.aer_cap;
495 uint32_t errcap = pci_get_long(aer_cap + PCI_ERR_CAP);
496 int fep = PCI_ERR_CAP_FEP(errcap);
498 assert(err->status);
499 assert(!(err->status & (err->status - 1)));
501 if (errcap & PCI_ERR_CAP_MHRE &&
502 (pci_get_long(aer_cap + PCI_ERR_UNCOR_STATUS) & (1U << fep))) {
503 /* Not first error. queue error */
504 if (aer_log_add_err(&dev->exp.aer_log, err) < 0) {
505 /* overflow */
506 return -1;
508 return 0;
511 pcie_aer_update_log(dev, err);
512 return 0;
515 typedef struct PCIEAERInject {
516 PCIDevice *dev;
517 uint8_t *aer_cap;
518 const PCIEAERErr *err;
519 uint16_t devctl;
520 uint16_t devsta;
521 uint32_t error_status;
522 bool unsupported_request;
523 bool log_overflow;
524 PCIEAERMsg msg;
525 } PCIEAERInject;
527 static bool pcie_aer_inject_cor_error(PCIEAERInject *inj,
528 uint32_t uncor_status,
529 bool is_advisory_nonfatal)
531 PCIDevice *dev = inj->dev;
533 inj->devsta |= PCI_EXP_DEVSTA_CED;
534 if (inj->unsupported_request) {
535 inj->devsta |= PCI_EXP_DEVSTA_URD;
537 pci_set_word(dev->config + dev->exp.exp_cap + PCI_EXP_DEVSTA, inj->devsta);
539 if (inj->aer_cap) {
540 uint32_t mask;
541 pci_long_test_and_set_mask(inj->aer_cap + PCI_ERR_COR_STATUS,
542 inj->error_status);
543 mask = pci_get_long(inj->aer_cap + PCI_ERR_COR_MASK);
544 if (mask & inj->error_status) {
545 return false;
547 if (is_advisory_nonfatal) {
548 uint32_t uncor_mask =
549 pci_get_long(inj->aer_cap + PCI_ERR_UNCOR_MASK);
550 if (!(uncor_mask & uncor_status)) {
551 inj->log_overflow = !!pcie_aer_record_error(dev, inj->err);
553 pci_long_test_and_set_mask(inj->aer_cap + PCI_ERR_UNCOR_STATUS,
554 uncor_status);
558 if (inj->unsupported_request && !(inj->devctl & PCI_EXP_DEVCTL_URRE)) {
559 return false;
561 if (!(inj->devctl & PCI_EXP_DEVCTL_CERE)) {
562 return false;
565 inj->msg.severity = PCI_ERR_ROOT_CMD_COR_EN;
566 return true;
569 static bool pcie_aer_inject_uncor_error(PCIEAERInject *inj, bool is_fatal)
571 PCIDevice *dev = inj->dev;
572 uint16_t cmd;
574 if (is_fatal) {
575 inj->devsta |= PCI_EXP_DEVSTA_FED;
576 } else {
577 inj->devsta |= PCI_EXP_DEVSTA_NFED;
579 if (inj->unsupported_request) {
580 inj->devsta |= PCI_EXP_DEVSTA_URD;
582 pci_set_long(dev->config + dev->exp.exp_cap + PCI_EXP_DEVSTA, inj->devsta);
584 if (inj->aer_cap) {
585 uint32_t mask = pci_get_long(inj->aer_cap + PCI_ERR_UNCOR_MASK);
586 if (mask & inj->error_status) {
587 pci_long_test_and_set_mask(inj->aer_cap + PCI_ERR_UNCOR_STATUS,
588 inj->error_status);
589 return false;
592 inj->log_overflow = !!pcie_aer_record_error(dev, inj->err);
593 pci_long_test_and_set_mask(inj->aer_cap + PCI_ERR_UNCOR_STATUS,
594 inj->error_status);
597 cmd = pci_get_word(dev->config + PCI_COMMAND);
598 if (inj->unsupported_request &&
599 !(inj->devctl & PCI_EXP_DEVCTL_URRE) && !(cmd & PCI_COMMAND_SERR)) {
600 return false;
602 if (is_fatal) {
603 if (!((cmd & PCI_COMMAND_SERR) ||
604 (inj->devctl & PCI_EXP_DEVCTL_FERE))) {
605 return false;
607 inj->msg.severity = PCI_ERR_ROOT_CMD_FATAL_EN;
608 } else {
609 if (!((cmd & PCI_COMMAND_SERR) ||
610 (inj->devctl & PCI_EXP_DEVCTL_NFERE))) {
611 return false;
613 inj->msg.severity = PCI_ERR_ROOT_CMD_NONFATAL_EN;
615 return true;
619 * non-Function specific error must be recorded in all functions.
620 * It is the responsibility of the caller of this function.
621 * It is also caller's responsibility to determine which function should
622 * report the error.
624 * 6.2.4 Error Logging
625 * 6.2.5 Sequence of Device Error Signaling and Logging Operations
626 * Figure 6-2: Flowchart Showing Sequence of Device Error Signaling and Logging
627 * Operations
629 int pcie_aer_inject_error(PCIDevice *dev, const PCIEAERErr *err)
631 uint8_t *aer_cap = NULL;
632 uint16_t devctl = 0;
633 uint16_t devsta = 0;
634 uint32_t error_status = err->status;
635 PCIEAERInject inj;
637 if (!pci_is_express(dev)) {
638 return -ENOSYS;
641 if (err->flags & PCIE_AER_ERR_IS_CORRECTABLE) {
642 error_status &= PCI_ERR_COR_SUPPORTED;
643 } else {
644 error_status &= PCI_ERR_UNC_SUPPORTED;
647 /* invalid status bit. one and only one bit must be set */
648 if (!error_status || (error_status & (error_status - 1))) {
649 return -EINVAL;
652 if (dev->exp.aer_cap) {
653 uint8_t *exp_cap = dev->config + dev->exp.exp_cap;
654 aer_cap = dev->config + dev->exp.aer_cap;
655 devctl = pci_get_long(exp_cap + PCI_EXP_DEVCTL);
656 devsta = pci_get_long(exp_cap + PCI_EXP_DEVSTA);
659 inj.dev = dev;
660 inj.aer_cap = aer_cap;
661 inj.err = err;
662 inj.devctl = devctl;
663 inj.devsta = devsta;
664 inj.error_status = error_status;
665 inj.unsupported_request = !(err->flags & PCIE_AER_ERR_IS_CORRECTABLE) &&
666 err->status == PCI_ERR_UNC_UNSUP;
667 inj.log_overflow = false;
669 if (err->flags & PCIE_AER_ERR_IS_CORRECTABLE) {
670 if (!pcie_aer_inject_cor_error(&inj, 0, false)) {
671 return 0;
673 } else {
674 bool is_fatal =
675 pcie_aer_uncor_default_severity(error_status) ==
676 PCI_ERR_ROOT_CMD_FATAL_EN;
677 if (aer_cap) {
678 is_fatal =
679 error_status & pci_get_long(aer_cap + PCI_ERR_UNCOR_SEVER);
681 if (!is_fatal && (err->flags & PCIE_AER_ERR_MAYBE_ADVISORY)) {
682 inj.error_status = PCI_ERR_COR_ADV_NONFATAL;
683 if (!pcie_aer_inject_cor_error(&inj, error_status, true)) {
684 return 0;
686 } else {
687 if (!pcie_aer_inject_uncor_error(&inj, is_fatal)) {
688 return 0;
693 /* send up error message */
694 inj.msg.source_id = err->source_id;
695 pcie_aer_msg(dev, &inj.msg);
697 if (inj.log_overflow) {
698 PCIEAERErr header_log_overflow = {
699 .status = PCI_ERR_COR_HL_OVERFLOW,
700 .flags = PCIE_AER_ERR_IS_CORRECTABLE,
702 int ret = pcie_aer_inject_error(dev, &header_log_overflow);
703 assert(!ret);
705 return 0;
708 void pcie_aer_write_config(PCIDevice *dev,
709 uint32_t addr, uint32_t val, int len)
711 uint8_t *aer_cap = dev->config + dev->exp.aer_cap;
712 uint32_t errcap = pci_get_long(aer_cap + PCI_ERR_CAP);
713 uint32_t first_error = 1U << PCI_ERR_CAP_FEP(errcap);
714 uint32_t uncorsta = pci_get_long(aer_cap + PCI_ERR_UNCOR_STATUS);
716 /* uncorrectable error */
717 if (!(uncorsta & first_error)) {
718 /* the bit that corresponds to the first error is cleared */
719 pcie_aer_clear_error(dev);
720 } else if (errcap & PCI_ERR_CAP_MHRE) {
721 /* When PCI_ERR_CAP_MHRE is enabled and the first error isn't cleared
722 * nothing should happen. So we have to revert the modification to
723 * the register.
725 pcie_aer_update_uncor_status(dev);
726 } else {
727 /* capability & control
728 * PCI_ERR_CAP_MHRE might be cleared, so clear of header log.
730 aer_log_clear_all_err(&dev->exp.aer_log);
734 void pcie_aer_root_init(PCIDevice *dev)
736 uint16_t pos = dev->exp.aer_cap;
738 pci_set_long(dev->wmask + pos + PCI_ERR_ROOT_COMMAND,
739 PCI_ERR_ROOT_CMD_EN_MASK);
740 pci_set_long(dev->w1cmask + pos + PCI_ERR_ROOT_STATUS,
741 PCI_ERR_ROOT_STATUS_REPORT_MASK);
742 /* PCI_ERR_ROOT_IRQ is RO but devices change it using a
743 * device-specific method.
745 pci_set_long(dev->cmask + pos + PCI_ERR_ROOT_STATUS,
746 ~PCI_ERR_ROOT_IRQ);
749 void pcie_aer_root_reset(PCIDevice *dev)
751 uint8_t* aer_cap = dev->config + dev->exp.aer_cap;
753 pci_set_long(aer_cap + PCI_ERR_ROOT_COMMAND, 0);
756 * Advanced Error Interrupt Message Number in Root Error Status Register
757 * must be updated by chip dependent code because it's chip dependent
758 * which number is used.
762 void pcie_aer_root_write_config(PCIDevice *dev,
763 uint32_t addr, uint32_t val, int len,
764 uint32_t root_cmd_prev)
766 uint8_t *aer_cap = dev->config + dev->exp.aer_cap;
767 uint32_t root_status = pci_get_long(aer_cap + PCI_ERR_ROOT_STATUS);
768 uint32_t enabled_cmd = pcie_aer_status_to_cmd(root_status);
769 uint32_t root_cmd = pci_get_long(aer_cap + PCI_ERR_ROOT_COMMAND);
770 /* 6.2.4.1.2 Interrupt Generation */
771 if (!msix_enabled(dev) && !msi_enabled(dev)) {
772 pci_set_irq(dev, !!(root_cmd & enabled_cmd));
773 return;
776 if ((root_cmd_prev & enabled_cmd) || !(root_cmd & enabled_cmd)) {
777 /* Send MSI on transition from false to true. */
778 return;
781 pcie_aer_root_notify(dev);
784 static const VMStateDescription vmstate_pcie_aer_err = {
785 .name = "PCIE_AER_ERROR",
786 .version_id = 1,
787 .minimum_version_id = 1,
788 .fields = (VMStateField[]) {
789 VMSTATE_UINT32(status, PCIEAERErr),
790 VMSTATE_UINT16(source_id, PCIEAERErr),
791 VMSTATE_UINT16(flags, PCIEAERErr),
792 VMSTATE_UINT32_ARRAY(header, PCIEAERErr, 4),
793 VMSTATE_UINT32_ARRAY(prefix, PCIEAERErr, 4),
794 VMSTATE_END_OF_LIST()
798 static bool pcie_aer_state_log_num_valid(void *opaque, int version_id)
800 PCIEAERLog *s = opaque;
802 return s->log_num <= s->log_max;
805 const VMStateDescription vmstate_pcie_aer_log = {
806 .name = "PCIE_AER_ERROR_LOG",
807 .version_id = 1,
808 .minimum_version_id = 1,
809 .fields = (VMStateField[]) {
810 VMSTATE_UINT16(log_num, PCIEAERLog),
811 VMSTATE_UINT16_EQUAL(log_max, PCIEAERLog),
812 VMSTATE_VALIDATE("log_num <= log_max", pcie_aer_state_log_num_valid),
813 VMSTATE_STRUCT_VARRAY_POINTER_UINT16(log, PCIEAERLog, log_num,
814 vmstate_pcie_aer_err, PCIEAERErr),
815 VMSTATE_END_OF_LIST()
819 typedef struct PCIEAERErrorName {
820 const char *name;
821 uint32_t val;
822 bool correctable;
823 } PCIEAERErrorName;
826 * AER error name -> value conversion table
827 * This naming scheme is same to linux aer-injection tool.
829 static const struct PCIEAERErrorName pcie_aer_error_list[] = {
831 .name = "DLP",
832 .val = PCI_ERR_UNC_DLP,
833 .correctable = false,
834 }, {
835 .name = "SDN",
836 .val = PCI_ERR_UNC_SDN,
837 .correctable = false,
838 }, {
839 .name = "POISON_TLP",
840 .val = PCI_ERR_UNC_POISON_TLP,
841 .correctable = false,
842 }, {
843 .name = "FCP",
844 .val = PCI_ERR_UNC_FCP,
845 .correctable = false,
846 }, {
847 .name = "COMP_TIME",
848 .val = PCI_ERR_UNC_COMP_TIME,
849 .correctable = false,
850 }, {
851 .name = "COMP_ABORT",
852 .val = PCI_ERR_UNC_COMP_ABORT,
853 .correctable = false,
854 }, {
855 .name = "UNX_COMP",
856 .val = PCI_ERR_UNC_UNX_COMP,
857 .correctable = false,
858 }, {
859 .name = "RX_OVER",
860 .val = PCI_ERR_UNC_RX_OVER,
861 .correctable = false,
862 }, {
863 .name = "MALF_TLP",
864 .val = PCI_ERR_UNC_MALF_TLP,
865 .correctable = false,
866 }, {
867 .name = "ECRC",
868 .val = PCI_ERR_UNC_ECRC,
869 .correctable = false,
870 }, {
871 .name = "UNSUP",
872 .val = PCI_ERR_UNC_UNSUP,
873 .correctable = false,
874 }, {
875 .name = "ACSV",
876 .val = PCI_ERR_UNC_ACSV,
877 .correctable = false,
878 }, {
879 .name = "INTN",
880 .val = PCI_ERR_UNC_INTN,
881 .correctable = false,
882 }, {
883 .name = "MCBTLP",
884 .val = PCI_ERR_UNC_MCBTLP,
885 .correctable = false,
886 }, {
887 .name = "ATOP_EBLOCKED",
888 .val = PCI_ERR_UNC_ATOP_EBLOCKED,
889 .correctable = false,
890 }, {
891 .name = "TLP_PRF_BLOCKED",
892 .val = PCI_ERR_UNC_TLP_PRF_BLOCKED,
893 .correctable = false,
894 }, {
895 .name = "RCVR",
896 .val = PCI_ERR_COR_RCVR,
897 .correctable = true,
898 }, {
899 .name = "BAD_TLP",
900 .val = PCI_ERR_COR_BAD_TLP,
901 .correctable = true,
902 }, {
903 .name = "BAD_DLLP",
904 .val = PCI_ERR_COR_BAD_DLLP,
905 .correctable = true,
906 }, {
907 .name = "REP_ROLL",
908 .val = PCI_ERR_COR_REP_ROLL,
909 .correctable = true,
910 }, {
911 .name = "REP_TIMER",
912 .val = PCI_ERR_COR_REP_TIMER,
913 .correctable = true,
914 }, {
915 .name = "ADV_NONFATAL",
916 .val = PCI_ERR_COR_ADV_NONFATAL,
917 .correctable = true,
918 }, {
919 .name = "INTERNAL",
920 .val = PCI_ERR_COR_INTERNAL,
921 .correctable = true,
922 }, {
923 .name = "HL_OVERFLOW",
924 .val = PCI_ERR_COR_HL_OVERFLOW,
925 .correctable = true,
929 static int pcie_aer_parse_error_string(const char *error_name,
930 uint32_t *status, bool *correctable)
932 int i;
934 for (i = 0; i < ARRAY_SIZE(pcie_aer_error_list); i++) {
935 const PCIEAERErrorName *e = &pcie_aer_error_list[i];
936 if (strcmp(error_name, e->name)) {
937 continue;
940 *status = e->val;
941 *correctable = e->correctable;
942 return 0;
944 return -EINVAL;
947 static int do_pcie_aer_inject_error(Monitor *mon,
948 const QDict *qdict, QObject **ret_data)
950 const char *id = qdict_get_str(qdict, "id");
951 const char *error_name;
952 uint32_t error_status;
953 bool correctable;
954 PCIDevice *dev;
955 PCIEAERErr err;
956 int ret;
958 ret = pci_qdev_find_device(id, &dev);
959 if (ret < 0) {
960 monitor_printf(mon,
961 "id or pci device path is invalid or device not "
962 "found. %s\n", id);
963 return ret;
965 if (!pci_is_express(dev)) {
966 monitor_printf(mon, "the device doesn't support pci express. %s\n",
967 id);
968 return -ENOSYS;
971 error_name = qdict_get_str(qdict, "error_status");
972 if (pcie_aer_parse_error_string(error_name, &error_status, &correctable)) {
973 char *e = NULL;
974 error_status = strtoul(error_name, &e, 0);
975 correctable = qdict_get_try_bool(qdict, "correctable", false);
976 if (!e || *e != '\0') {
977 monitor_printf(mon, "invalid error status value. \"%s\"",
978 error_name);
979 return -EINVAL;
982 err.status = error_status;
983 err.source_id = pci_requester_id(dev);
985 err.flags = 0;
986 if (correctable) {
987 err.flags |= PCIE_AER_ERR_IS_CORRECTABLE;
989 if (qdict_get_try_bool(qdict, "advisory_non_fatal", false)) {
990 err.flags |= PCIE_AER_ERR_MAYBE_ADVISORY;
992 if (qdict_haskey(qdict, "header0")) {
993 err.flags |= PCIE_AER_ERR_HEADER_VALID;
995 if (qdict_haskey(qdict, "prefix0")) {
996 err.flags |= PCIE_AER_ERR_TLP_PREFIX_PRESENT;
999 err.header[0] = qdict_get_try_int(qdict, "header0", 0);
1000 err.header[1] = qdict_get_try_int(qdict, "header1", 0);
1001 err.header[2] = qdict_get_try_int(qdict, "header2", 0);
1002 err.header[3] = qdict_get_try_int(qdict, "header3", 0);
1004 err.prefix[0] = qdict_get_try_int(qdict, "prefix0", 0);
1005 err.prefix[1] = qdict_get_try_int(qdict, "prefix1", 0);
1006 err.prefix[2] = qdict_get_try_int(qdict, "prefix2", 0);
1007 err.prefix[3] = qdict_get_try_int(qdict, "prefix3", 0);
1009 ret = pcie_aer_inject_error(dev, &err);
1010 *ret_data = qobject_from_jsonf("{'id': %s, "
1011 "'root_bus': %s, 'bus': %d, 'devfn': %d, "
1012 "'ret': %d}",
1013 id, pci_root_bus_path(dev),
1014 pci_bus_num(dev->bus), dev->devfn,
1015 ret);
1016 assert(*ret_data);
1018 return 0;
1021 void hmp_pcie_aer_inject_error(Monitor *mon, const QDict *qdict)
1023 QObject *data;
1024 int devfn;
1026 if (do_pcie_aer_inject_error(mon, qdict, &data) < 0) {
1027 return;
1030 assert(qobject_type(data) == QTYPE_QDICT);
1031 qdict = qobject_to_qdict(data);
1033 devfn = (int)qdict_get_int(qdict, "devfn");
1034 monitor_printf(mon, "OK id: %s root bus: %s, bus: %x devfn: %x.%x\n",
1035 qdict_get_str(qdict, "id"),
1036 qdict_get_str(qdict, "root_bus"),
1037 (int) qdict_get_int(qdict, "bus"),
1038 PCI_SLOT(devfn), PCI_FUNC(devfn));