--- projects/cms/source/server/build/etc/system.conf 2001/03/05 04:21:20 1.21 +++ projects/cms/source/server/build/etc/system.conf 2001/03/06 02:35:18 1.23 @@ -5,8 +5,8 @@ # configuration system has this file as its # root of configuration # -# $Author: tdb $ -# $Id: system.conf,v 1.21 2001/03/05 04:21:20 tdb Exp $ +# $Author: ajm $ +# $Id: system.conf,v 1.23 2001/03/06 02:35:18 ajm Exp $ # ############################################################ #### Configuration Files & Groups @@ -94,7 +94,7 @@ ClientInterface.listenPort=4510 ############################################################ # The default filter for a new host -Host.filter=computingFilter; +Host.filter=filter1; # The default update times for a new host Host.UDPUpdateTime=10 @@ -113,9 +113,9 @@ Host.serviceChecks=HTTP;SMTP # the monitors to run Monitor.PluginsPackage=uk.ac.ukc.iscream.client.monitors -Monitor.Plugins=CPU; +Monitor.Plugins=CPU;Heartbeat -# CPU monitor configuration +## CPU monitor configuration # threshold values # # note: if the UPPER threshold is broken, @@ -130,11 +130,48 @@ Monitor.CPU.alertTimeout.WARNING=900 Monitor.CPU.alertTimeout.CAUTION=1800 Monitor.CPU.alertTimeout.CRITICAL=3600 +## Heartbeat monitor configuration +# threshold values +# +# note: if the UPPER threshold is broken, +# the alertTimeout values are halved. +# This is to escalate the alert quicker. +Monitor.Heartbeat.checkPeriod=50 +Monitor.Heartbeat.threshold.LOWER=120 +Monitor.Heartbeat.threshold.UPPER=300 +# timings of the alerts (in seconds) +Monitor.Heartbeat.alertTimeout.NOTICE=60 +Monitor.Heartbeat.alertTimeout.WARNING=900 +Monitor.Heartbeat.alertTimeout.CAUTION=1800 +Monitor.Heartbeat.alertTimeout.CRITICAL=3600 +# this means it will reach a FINAL level, +# and thus the host will be removed from the monitor list, +# if the highest level alert is reached and occurs this +# number of times. +# +# in this setup, that means 5 CRITICAL alerts would occur +# on a Heartbeat before reaching FINAL.
+# If this value is wrong or not present, FINAL is never reached +# +Monitor.Heartbeat.reachFINALcount=5 + ############################################################ #### Alerter Configuration ############################################################ +# The following variables are understood by ALL alerters for messages +# +# %level% - the alert level (eg, WARNING) +# %threshold% - the threshold broken (eg, LOWER) +# %source% - the source of the alert (eg, raptor.ukc.ac.uk) +# %value% - the value reached (eg, 95) +# %thresholdValue% - the value of the threshold broken (eg, 90) +# %attributeName% - the attribute that has caused the alert (eg, CPU User) +# %timeTillNextAlert% - the time the next alert will be sent out +# %timeSinceFirstAlert% - the time elapsed since the first alert for this problem +# %timeOfFirstAlert% - the time the first alert was sent +# # alerters to run Alerter.PluginsPackage=uk.ac.ukc.iscream.client.alerters