f3ecc7
#
f3ecc7
# config file for mcelog
f3ecc7
# For further options, see the mcelog manpage and documentation
f3ecc7
#
f3ecc7
f3ecc7
# Filter out known broken events by default
f3ecc7
filter = yes
f3ecc7
# Don't log memory errors individually
# (sample setting, commented out; remove the leading '#' to set it)
f3ecc7
#filter-memory-errors = yes
f3ecc7
f3ecc7
# Output in undecoded raw format, which is easier for machines to parse
# (sample setting, commented out; remove the leading '#' to set it)
f3ecc7
#raw = yes
f3ecc7
f3ecc7
[server]
f3ecc7
# An upstream bug prevents this from being disabled
# NOTE(review): "this" presumably refers to the client socket server that
# this section configures -- confirm against the upstream bug report.
f3ecc7
# Only allow root to connect by default
f3ecc7
client-user = root
f3ecc7
# Path to the socket that clients use to connect
f3ecc7
socket-path = /var/run/mcelog-client
f3ecc7
f3ecc7
[dimm]
f3ecc7
# Enable DIMM tracking
f3ecc7
dimm-tracking-enabled = yes
f3ecc7
# Disable DIMM DMI pre-population unless supported on your system
f3ecc7
dmi-prepopulate = no
f3ecc7
f3ecc7
# Execute these triggers when the rate of corrected (ce-*) or uncorrected
f3ecc7
# (uc-*) errors per DIMM exceeds the threshold.
c02d22
# The default of 10/24h was reasonable for server-quality
c02d22
# DDR3 DIMMs as of 2009/10. Newer systems can benefit from
c02d22
# more aggressive page offlining when corrected errors are seen.
c02d22
# See:
c02d22
# https://www.intel.com/content/dam/www/public/us/en/documents/intel-and-samsung-mrt-improving-memory-reliability-at-data-centers.pdf
c02d22
# for details.
# NOTE(review): the paragraph above is about page offlining, which the
# [page] section controls through memory-ce-threshold (10 / 24h in this
# file), whereas the value set to 2 / 24h below is the per-DIMM
# ce-error-threshold. Confirm that this is the intended section.
f3ecc7
uc-error-trigger = dimm-error-trigger
f3ecc7
uc-error-threshold = 1 / 24h
f3ecc7
ce-error-trigger = dimm-error-trigger
c02d22
ce-error-threshold = 2 / 24h
f3ecc7
f3ecc7
[socket]
f3ecc7
# Enable memory error accounting per socket
f3ecc7
socket-tracking-enabled = yes
# Threshold for uncorrected memory errors per socket
# (no mem-uc-error-trigger is configured in this section)
f3ecc7
mem-uc-error-threshold = 100 / 24h
# Trigger to run for corrected memory errors on a socket
f3ecc7
mem-ce-error-trigger = socket-memory-error-trigger
# Threshold for corrected memory errors per socket
f3ecc7
mem-ce-error-threshold = 100 / 24h
# Log corrected-error threshold events for sockets explicitly
f3ecc7
mem-ce-error-log = yes
f3ecc7
f3ecc7
[cache]
f3ecc7
# Attempt to take CPUs that cause cache errors offline
f3ecc7
cache-threshold-trigger = cache-error-trigger
# Presumably also logs cache threshold events explicitly -- confirm
# against the mcelog documentation
f3ecc7
cache-threshold-log = yes
f3ecc7
f3ecc7
[page]
f3ecc7
# Try to soft-offline a 4K page if its corrected-error rate exceeds
# the threshold
f3ecc7
memory-ce-threshold = 10 / 24h
# Trigger to run when the page threshold is exceeded
f3ecc7
memory-ce-trigger = page-error-trigger
# Presumably also logs page threshold events explicitly -- confirm
# against the mcelog documentation
f3ecc7
memory-ce-log = yes
# Offlining action for the page; "soft" matches the soft-offline
# behaviour described at the top of this section
f3ecc7
memory-ce-action = soft
f3ecc7
f3ecc7
[trigger]
f3ecc7
# Maximum number of triggers running at the same time
f3ecc7
children-max = 2
# Directory for trigger scripts (presumably where the *-trigger names
# used in the other sections are looked up -- confirm against the
# mcelog documentation)
f3ecc7
directory = /etc/mcelog/triggers