Saltstack Official Linux Formula

200 lines
6.9KB

  1. {%- from "linux/map.jinja" import system with context %}
  2. {%- set mcelog = system.mcelog %}
  3. #
  4. # Example config file for mcelog
  5. # mcelog is the user space backend that decodes and process machine check events
  6. # (cpu hardware errors) reported by the CPU to the kernel
  7. #
  8. # general format
  9. #optionname = value
  10. # white space is not allowed in value currently, except at the end where it is dropped
  11. #
  12. # In general all command line options that are not commands work here.
  13. # See man mcelog or mcelog --help for a list.
  14. # e.g. to enable the --no-syslog option use
  15. #no-syslog = yes (or no to disable)
  16. # when the option has a argument
  17. #logfile = /tmp/logfile
  18. # below are the options which are not command line options.
  19. # Set CPU type for which mcelog decodes events:
  20. #cpu = type
  21. # For valid values for type please see mcelog --help.
  22. # If this value is set incorrectly the decoded output will be likely incorrect.
  23. # By default when this parameter is not set mcelog uses the CPU it is running on
  24. # on very new kernels the mcelog events reported by the kernel also carry
  25. # the CPU type which is used too when available and not overriden.
  26. # Enable daemon mode:
  27. #daemon = yes
  28. # By default mcelog just processes the currently pending events and exits.
  29. # In daemon mode it will keep running as a daemon in the background and poll
  30. # the kernel for events and then decode them.
  31. # Filter out known broken events by default.
  32. filter = yes
  33. # Don't log memory errors individually.
  34. # They still get accounted if that is enabled.
  35. #filter-memory-errors = yes
  36. # output in undecoded raw format to be easier machine readable
  37. # (default is decoded).
  38. #raw = yes
  39. # Set CPU Mhz to decode uptime from time stamp counter (output
  40. # unreliable, not needed on new kernels which report the event time
  41. # directly. A lot of systems don't have a linear time stamp clock
  42. # and the output is wrong then.
  43. # Normally mcelog tries to figure out if it the TSC is reliable
  44. # and only uses the current frequency then.
  45. # Setting a frequency forces timestamp decoding.
  46. # This setting is obsolete with modern kernels which report the time
  47. # directly.
  48. #cpumhz = 1800.00
  49. # log output options
  50. # Log decoded machine checks in syslog (default stdout or syslog for daemon)
  51. #syslog = yes
  52. # Log decoded machine checks in syslog with error level
  53. #syslog-error = yes
  54. # Never log anything to syslog
  55. #no-syslog = yes
  56. # Append log output to logfile instead of stdout. Only when no syslog logging is active
  57. #logfile = filename
  58. {%- if mcelog.logging is defined %}
  59. {%- if mcelog.logging.syslog is defined %}
  60. syslog = {{ 'yes' if mcelog.logging.syslog else 'no' }}
  61. {%- endif %}
  62. {%- if mcelog.logging.syslog_error is defined %}
  63. syslog-error = {{ 'yes' if mcelog.logging.syslog_error else 'no' }}
  64. {%- endif %}
  65. {%- if mcelog.logging.no_syslog is defined %}
  66. no-syslog = {{ 'yes' if mcelog.logging.no_syslog else 'no' }}
  67. {%- endif %}
  68. {%- if mcelog.logging.logfile is defined %}
  69. logfile = {{ mcelog.logging.logfile }}
  70. {%- endif %}
  71. {%- endif %}
  72. # Use SMBIOS information to decode DIMMs (needs root).
  73. # This function is not recommended to use right now and generally not needed.
  74. # The exception is memdb prepopulation, which is configured separately below.
  75. #dmi = no
  76. # When in daemon mode run as this user after set up.
  77. # Note that the triggers will run as this user too.
  78. # Setting this to non root will mean that triggers cannot take some corrective
  79. # action, like offlining objects.
  80. #run-credentials-user = root
  81. # group to run as daemon with
  82. # default to the group of the run-credentials-user
  83. #run-credentials-group = nobody
  84. [server]
  85. # user allowed to access client socket.
  86. # when set to * match any
  87. # root is always allowed to access.
  88. # default: root only
  89. client-user = root
  90. # group allowed to access mcelog
  91. # When no group is configured any group matches (but still user checking).
  92. # when set to * match any
  93. #client-group = root
  94. # Path to the unix socket for client<->server communication.
  95. # When no socket-path is configured the server will not start
  96. #socket-path = /var/run/mcelog-client
  97. # When mcelog starts it checks if a server is already running. This configures the timeout
  98. # for this check.
  99. #initial-ping-timeout = 2
  100. #
  101. [dimm]
  102. # Is the in memory DIMM error tracking enabled?
  103. # Only works on systems with integrated memory controller and
  104. # which are supported.
  105. # Only takes effect in daemon mode.
  106. dimm-tracking-enabled = yes
  107. # Use DMI information from the BIOS to prepopulate DIMM database.
  108. # Note this might not work with all BIOS and requires mcelog to run as root.
  109. # Alternative is to let mcelog create DIMM objects on demand.
  110. dmi-prepopulate = yes
  111. #
  112. # Execute these triggers when the rate of corrected or uncorrected
  113. # Errors per DIMM exceeds the threshold.
  114. # Note when the hardware does not report DIMMs this might also
  115. # be per channel.
  116. # The default of 10/24h is reasonable for server quality
  117. # DDR3 DIMMs as of 2009/10.
  118. #uc-error-trigger = dimm-error-trigger
  119. uc-error-threshold = 1 / 24h
  120. #ce-error-trigger = dimm-error-trigger
  121. ce-error-threshold = 10 / 24h
  122. [socket]
  123. # Enable memory error accounting per socket.
  124. socket-tracking-enabled = yes
  125. # Threshold and trigger for uncorrected memory errors on a socket.
  126. # mem-uc-error-trigger = socket-memory-error-trigger
  127. mem-uc-error-threshold = 100 / 24h
  128. # Trigger script for corrected memory errors on a socket.
  129. mem-ce-error-trigger = socket-memory-error-trigger
  130. # Threshold on when to trigger a correct error for the socket.
  131. mem-ce-error-threshold = 100 / 24h
  132. # Log socket error threshold explicitely?
  133. mem-ce-error-log = yes
  134. # Trigger script for uncorrected bus error events
  135. bus-uc-threshold-trigger = bus-error-trigger
  136. # Trigger script for uncorrected IOMCA erors
  137. iomca-threshold-trigger = iomca-error-trigger
  138. # Trigger script for other uncategorized errors
  139. unknown-threshold-trigger = unknown-error-trigger
  140. [cache]
  141. # Processing of cache error thresholds reported by Intel CPUs.
  142. cache-threshold-trigger = cache-error-trigger
  143. # Should cache threshold events be logged explicitely?
  144. cache-threshold-log = yes
  145. [page]
  146. # Memory error accouting per 4K memory page.
  147. # Threshold for the correct memory errors trigger script.
  148. memory-ce-threshold = 10 / 24h
  149. # Trigger script for corrected errors.
  150. # memory-ce-trigger = page-error-trigger
  151. # Should page threshold events be logged explicitely?
  152. memory-ce-log = yes
  153. # specify the internal action in mcelog to exceeding a page error threshold
  154. # this is done in addition to executing the trigger script if available
  155. # off no action
  156. # account only account errors
  157. # soft try to soft-offline page without killing any processes
  158. # This requires an uptodate kernel. Might not be successfull.
  159. # hard try to hard-offline page by killing processes
  160. # Requires an uptodate kernel. Might not be successfull.
  161. # soft-then-hard First try to soft offline, then try hard offlining
  162. #memory-ce-action = off|account|soft|hard|soft-then-hard
  163. memory-ce-action = soft
  164. [trigger]
  165. # Maximum number of running triggers
  166. children-max = 2
  167. # execute triggers in this directory
  168. directory = /etc/mcelog