diff options
Diffstat (limited to 'Documentation/edac.txt')
| -rw-r--r-- | Documentation/edac.txt | 151 |
1 files changed, 72 insertions, 79 deletions
diff --git a/Documentation/edac.txt b/Documentation/edac.txt index a5c36842ecef..ced527388001 100644 --- a/Documentation/edac.txt +++ b/Documentation/edac.txt | |||
| @@ -222,74 +222,9 @@ both csrow2 and csrow3 are populated, this indicates a dual ranked | |||
| 222 | set of DIMMs for channels 0 and 1. | 222 | set of DIMMs for channels 0 and 1. |
| 223 | 223 | ||
| 224 | 224 | ||
| 225 | Within each of the 'mc','mcX' and 'csrowX' directories are several | 225 | Within each of the 'mcX' and 'csrowX' directories are several |
| 226 | EDAC control and attribute files. | 226 | EDAC control and attribute files. |
| 227 | 227 | ||
| 228 | |||
| 229 | ============================================================================ | ||
| 230 | DIRECTORY 'mc' | ||
| 231 | |||
| 232 | In directory 'mc' are EDAC system overall control and attribute files: | ||
| 233 | |||
| 234 | |||
| 235 | Panic on UE control file: | ||
| 236 | |||
| 237 | 'edac_mc_panic_on_ue' | ||
| 238 | |||
| 239 | An uncorrectable error will cause a machine panic. This is usually | ||
| 240 | desirable. It is a bad idea to continue when an uncorrectable error | ||
| 241 | occurs - it is indeterminate what was uncorrected and the operating | ||
| 242 | system context might be so mangled that continuing will lead to further | ||
| 243 | corruption. If the kernel has MCE configured, then EDAC will never | ||
| 244 | notice the UE. | ||
| 245 | |||
| 246 | LOAD TIME: module/kernel parameter: panic_on_ue=[0|1] | ||
| 247 | |||
| 248 | RUN TIME: echo "1" >/sys/devices/system/edac/mc/edac_mc_panic_on_ue | ||
| 249 | |||
| 250 | |||
| 251 | Log UE control file: | ||
| 252 | |||
| 253 | 'edac_mc_log_ue' | ||
| 254 | |||
| 255 | Generate kernel messages describing uncorrectable errors. These errors | ||
| 256 | are reported through the system message log system. UE statistics | ||
| 257 | will be accumulated even when UE logging is disabled. | ||
| 258 | |||
| 259 | LOAD TIME: module/kernel parameter: log_ue=[0|1] | ||
| 260 | |||
| 261 | RUN TIME: echo "1" >/sys/devices/system/edac/mc/edac_mc_log_ue | ||
| 262 | |||
| 263 | |||
| 264 | Log CE control file: | ||
| 265 | |||
| 266 | 'edac_mc_log_ce' | ||
| 267 | |||
| 268 | Generate kernel messages describing correctable errors. These | ||
| 269 | errors are reported through the system message log system. | ||
| 270 | CE statistics will be accumulated even when CE logging is disabled. | ||
| 271 | |||
| 272 | LOAD TIME: module/kernel parameter: log_ce=[0|1] | ||
| 273 | |||
| 274 | RUN TIME: echo "1" >/sys/devices/system/edac/mc/edac_mc_log_ce | ||
| 275 | |||
| 276 | |||
| 277 | Polling period control file: | ||
| 278 | |||
| 279 | 'edac_mc_poll_msec' | ||
| 280 | |||
| 281 | The time period, in milliseconds, for polling for error information. | ||
| 282 | Too small a value wastes resources. Too large a value might delay | ||
| 283 | necessary handling of errors and might loose valuable information for | ||
| 284 | locating the error. 1000 milliseconds (once each second) is the current | ||
| 285 | default. Systems which require all the bandwidth they can get, may | ||
| 286 | increase this. | ||
| 287 | |||
| 288 | LOAD TIME: module/kernel parameter: poll_msec=[0|1] | ||
| 289 | |||
| 290 | RUN TIME: echo "1000" >/sys/devices/system/edac/mc/edac_mc_poll_msec | ||
| 291 | |||
| 292 | |||
| 293 | ============================================================================ | 228 | ============================================================================ |
| 294 | 'mcX' DIRECTORIES | 229 | 'mcX' DIRECTORIES |
| 295 | 230 | ||
| @@ -537,7 +472,6 @@ Channel 1 DIMM Label control file: | |||
| 537 | motherboard specific and determination of this information | 472 | motherboard specific and determination of this information |
| 538 | must occur in userland at this time. | 473 | must occur in userland at this time. |
| 539 | 474 | ||
| 540 | |||
| 541 | ============================================================================ | 475 | ============================================================================ |
| 542 | SYSTEM LOGGING | 476 | SYSTEM LOGGING |
| 543 | 477 | ||
| @@ -570,7 +504,6 @@ error type, a notice of "no info" and then an optional, | |||
| 570 | driver-specific error message. | 504 | driver-specific error message. |
| 571 | 505 | ||
| 572 | 506 | ||
| 573 | |||
| 574 | ============================================================================ | 507 | ============================================================================ |
| 575 | PCI Bus Parity Detection | 508 | PCI Bus Parity Detection |
| 576 | 509 | ||
| @@ -604,6 +537,74 @@ Enable/Disable PCI Parity checking control file: | |||
| 604 | echo "0" >/sys/devices/system/edac/pci/check_pci_parity | 537 | echo "0" >/sys/devices/system/edac/pci/check_pci_parity |
| 605 | 538 | ||
| 606 | 539 | ||
| 540 | Parity Count: | ||
| 541 | |||
| 542 | 'pci_parity_count' | ||
| 543 | |||
| 544 | This attribute file will display the number of parity errors that | ||
| 545 | have been detected. | ||
| 546 | |||
| 547 | |||
| 548 | ============================================================================ | ||
| 549 | MODULE PARAMETERS | ||
| 550 | |||
| 551 | Panic on UE control file: | ||
| 552 | |||
| 553 | 'edac_mc_panic_on_ue' | ||
| 554 | |||
| 555 | An uncorrectable error will cause a machine panic. This is usually | ||
| 556 | desirable. It is a bad idea to continue when an uncorrectable error | ||
| 557 | occurs - it is indeterminate what was uncorrected and the operating | ||
| 558 | system context might be so mangled that continuing will lead to further | ||
| 559 | corruption. If the kernel has MCE configured, then EDAC will never | ||
| 560 | notice the UE. | ||
| 561 | |||
| 562 | LOAD TIME: module/kernel parameter: edac_mc_panic_on_ue=[0|1] | ||
| 563 | |||
| 564 | RUN TIME: echo "1" > /sys/module/edac_core/parameters/edac_mc_panic_on_ue | ||
| 565 | |||
| 566 | |||
| 567 | Log UE control file: | ||
| 568 | |||
| 569 | 'edac_mc_log_ue' | ||
| 570 | |||
| 571 | Generate kernel messages describing uncorrectable errors. These errors | ||
| 572 | are reported through the system message log system. UE statistics | ||
| 573 | will be accumulated even when UE logging is disabled. | ||
| 574 | |||
| 575 | LOAD TIME: module/kernel parameter: edac_mc_log_ue=[0|1] | ||
| 576 | |||
| 577 | RUN TIME: echo "1" > /sys/module/edac_core/parameters/edac_mc_log_ue | ||
| 578 | |||
| 579 | |||
| 580 | Log CE control file: | ||
| 581 | |||
| 582 | 'edac_mc_log_ce' | ||
| 583 | |||
| 584 | Generate kernel messages describing correctable errors. These | ||
| 585 | errors are reported through the system message log system. | ||
| 586 | CE statistics will be accumulated even when CE logging is disabled. | ||
| 587 | |||
| 588 | LOAD TIME: module/kernel parameter: edac_mc_log_ce=[0|1] | ||
| 589 | |||
| 590 | RUN TIME: echo "1" > /sys/module/edac_core/parameters/edac_mc_log_ce | ||
| 591 | |||
| 592 | |||
| 593 | Polling period control file: | ||
| 594 | |||
| 595 | 'edac_mc_poll_msec' | ||
| 596 | |||
| 597 | The time period, in milliseconds, for polling for error information. | ||
| 598 | Too small a value wastes resources. Too large a value might delay | ||
| 599 | necessary handling of errors and might lose valuable information for | ||
| 600 | locating the error. 1000 milliseconds (once each second) is the current | ||
| 601 | default. Systems which require all the bandwidth they can get, may | ||
| 602 | increase this. | ||
| 603 | |||
| 604 | LOAD TIME: module/kernel parameter: edac_mc_poll_msec=[polling period in milliseconds, e.g. 1000] | ||
| 605 | |||
| 606 | RUN TIME: echo "1000" > /sys/module/edac_core/parameters/edac_mc_poll_msec | ||
| 607 | |||
| 607 | 608 | ||
| 608 | Panic on PCI PARITY Error: | 609 | Panic on PCI PARITY Error: |
| 609 | 610 | ||
| @@ -614,21 +615,13 @@ Panic on PCI PARITY Error: | |||
| 614 | error has been detected. | 615 | error has been detected. |
| 615 | 616 | ||
| 616 | 617 | ||
| 617 | module/kernel parameter: panic_on_pci_parity=[0|1] | 618 | module/kernel parameter: edac_panic_on_pci_pe=[0|1] |
| 618 | 619 | ||
| 619 | Enable: | 620 | Enable: |
| 620 | echo "1" >/sys/devices/system/edac/pci/panic_on_pci_parity | 621 | echo "1" > /sys/module/edac_core/parameters/edac_panic_on_pci_pe |
| 621 | 622 | ||
| 622 | Disable: | 623 | Disable: |
| 623 | echo "0" >/sys/devices/system/edac/pci/panic_on_pci_parity | 624 | echo "0" > /sys/module/edac_core/parameters/edac_panic_on_pci_pe |
| 624 | |||
| 625 | |||
| 626 | Parity Count: | ||
| 627 | |||
| 628 | 'pci_parity_count' | ||
| 629 | |||
| 630 | This attribute file will display the number of parity errors that | ||
| 631 | have been detected. | ||
| 632 | 625 | ||
| 633 | 626 | ||
| 634 | 627 | ||
