| 14 |  |  | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 15 |  | # for computing machines | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 16 |  | group.computing=Host.129.12.4.*; | 
 
 
 
 
 
 
 
 | 17 | + | group.rocks=Host.agate.ukc.ac.uk;Host.arkose.ukc.ac.uk;Host.basalt.ukc.ac.uk;Host.chalk.ukc.ac.uk;\ | 
 
 
 
 
 
 
 
 | 18 | + | Host.chert.ukc.ac.uk;Host.granite.ukc.ac.uk;Host.jade.ukc.ac.uk;Host.jasper.ukc.ac.uk;\ | 
 
 
 
 
 
 
 
 | 19 | + | Host.magnetite.ukc.ac.uk;Host.obsidian.ukc.ac.uk;Host.pumice.ukc.ac.uk;\ | 
 
 
 
 
 
 
 
 | 20 | + | Host.pyrite.ukc.ac.uk;Host.slate.ukc.ac.uk;Host.topaz.ukc.ac.uk; | 
 
 
 
 
 
 
 
 | 21 | + | group.compsoc=Host.compsoc1.ukc.ac.uk | 
 
 
 
 
 
 
 
 | 22 | + |  | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 23 |  | config.computing=computing.conf | 
 
 
 
 
 
 
 
 | 24 | + | config.rocks=rocks.conf | 
 
 
 
 
 
 
 
 | 25 | + | config.compsoc1=rocks.conf | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 26 |  |  | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 27 |  | # for library machines | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 28 |  | group.library=Host.129.12.58.*; | 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 | 45 |  |  | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 46 |  | # The time interval at which the Queues should be monitored | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 47 |  | Queue.MonitorInterval=15 | 
 
 
 
 
 
 
 
 | 48 | + | # The upper limit for a Queue | 
 
 
 
 
 
 
 
 | 49 | + | Queue.SizeLimit=1000 | 
 
 
 
 
 
 
 
 | 50 | + | # The removal algorithm | 
 
 
 
 
 
 
 
 | 51 | + | Queue.RemoveAlgorithm=FIRST | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 52 |  |  | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 53 |  |  | 
 
 
 
 
 
 
 
 
 | 42 | – |  | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 54 |  | ############################################################ | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 55 |  | #### FilterManager configuration | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 56 |  | ############################################################ | 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 | 114 |  |  | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 115 |  | # The service checks to run on a host | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 116 |  | Host.serviceChecksPackage=uk.org.iscream.filter.plugins | 
 
 
 
 
 
 
 
 
 | 106 | – | Host.serviceChecks=HTTP;SMTP;POP3;SSH;FTP;IMAP;Telnet | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 117 |  |  | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 118 |  |  | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 119 |  |  | 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 | 123 |  |  | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 124 |  | # the monitors to run | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 125 |  | Monitor.PluginsPackage=uk.org.iscream.client.monitors | 
 
 
 
 
 
 
 
 
 
 
 | 126 | < | Monitor.Plugins=CPU;Disk;Memory;Swap;Services;Heartbeat;WebFeeder; | 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 | 126 | > | Monitor.Plugins=CPU;Load;Process;Disk;Memory;Swap;Services;Heartbeat;Queue;WebFeeder; | 
 
 
 
 
 | 127 | > | #Monitor.Plugins=CPU;WebFeeder; | 
 
 
 
 
 | 128 | > | #Monitor.Plugins= | 
 
 
 
 
 
 
 
 
 
 
 | 129 |  |  | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 130 |  |  | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 131 |  | ## CPU monitor configuration | 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 | 144 |  | Monitor.CPU.alertTimeout.CRITICAL=3600 | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 145 |  |  | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 146 |  |  | 
 
 
 
 
 
 
 
 | 147 | + | ## Load monitor configuration | 
 
 
 
 
 
 
 
 | 148 | + | # threshold values | 
 
 
 
 
 
 
 
 | 149 | + | # | 
 
 
 
 
 
 
 
 | 150 | + | # note: if the UPPER threshold is broken, | 
 
 
 
 
 
 
 
 | 151 | + | # the alertTimeout values are halved. | 
 
 
 
 
 
 
 
 | 152 | + | # This is to escalate the alert quicker. | 
 
 
 
 
 
 
 
 | 153 | + | Monitor.Load.threshold.LOWER=10.0 | 
 
 
 
 
 
 
 
 | 154 | + | Monitor.Load.threshold.UPPER=20.0 | 
 
 
 
 
 
 
 
 | 155 | + |  | 
 
 
 
 
 
 
 
 | 156 | + | # timings of the alerts (in seconds) | 
 
 
 
 
 
 
 
 | 157 | + | Monitor.Load.alertTimeout.NOTICE=60 | 
 
 
 
 
 
 
 
 | 158 | + | Monitor.Load.alertTimeout.WARNING=900 | 
 
 
 
 
 
 
 
 | 159 | + | Monitor.Load.alertTimeout.CAUTION=1800 | 
 
 
 
 
 
 
 
 | 160 | + | Monitor.Load.alertTimeout.CRITICAL=3600 | 
 
 
 
 
 
 
 
 | 161 | + |  | 
 
 
 
 
 
 
 
 | 162 | + |  | 
 
 
 
 
 
 
 
 | 163 | + | ## Process Count monitor configuration | 
 
 
 
 
 
 
 
 | 164 | + | # threshold values | 
 
 
 
 
 
 
 
 | 165 | + | # | 
 
 
 
 
 
 
 
 | 166 | + | # note: if the UPPER threshold is broken, | 
 
 
 
 
 
 
 
 | 167 | + | # the alertTimeout values are halved. | 
 
 
 
 
 
 
 
 | 168 | + | # This is to escalate the alert quicker. | 
 
 
 
 
 
 
 
 | 169 | + | Monitor.Process.threshold.LOWER=1000 | 
 
 
 
 
 
 
 
 | 170 | + | Monitor.Process.threshold.UPPER=1500 | 
 
 
 
 
 
 
 
 | 171 | + |  | 
 
 
 
 
 
 
 
 | 172 | + | # timings of the alerts (in seconds) | 
 
 
 
 
 
 
 
 | 173 | + | Monitor.Process.alertTimeout.NOTICE=60 | 
 
 
 
 
 
 
 
 | 174 | + | Monitor.Process.alertTimeout.WARNING=900 | 
 
 
 
 
 
 
 
 | 175 | + | Monitor.Process.alertTimeout.CAUTION=1800 | 
 
 
 
 
 
 
 
 | 176 | + | Monitor.Process.alertTimeout.CRITICAL=3600 | 
 
 
 
 
 
 
 
 | 177 | + |  | 
 
 
 
 
 
 
 
 | 178 | + |  | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 179 |  | ## Memory monitor configuration | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 180 |  | # threshold values | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 181 |  | # | 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 | 214 |  | # note: if the UPPER threshold is broken, | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 215 |  | # the alertTimeout values are halved. | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 216 |  | # This is to escalate the alert quicker. | 
 
 
 
 
 
 
 
 
 
 
 | 217 | < | Monitor.Disk.threshold.LOWER=80 | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 218 | < | Monitor.Disk.threshold.UPPER=90 | 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 | 217 | > | Monitor.Disk.threshold.LOWER=90 | 
 
 
 
 
 | 218 | > | Monitor.Disk.threshold.UPPER=95 | 
 
 
 
 
 | 219 | > | Monitor.Disk.thresholdMeasure=PERCENTAGE | 
 
 
 
 
 
 
 
 
 
 
 | 220 |  |  | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 221 |  | # timings of the alerts (in seconds) | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 222 |  | Monitor.Disk.alertTimeout.NOTICE=60 | 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 | 225 |  | Monitor.Disk.alertTimeout.CRITICAL=3600 | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 226 |  |  | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 227 |  |  | 
 
 
 
 
 
 
 
 | 228 | + | ## Queue monitor configuration | 
 
 
 
 
 
 
 
 | 229 | + | # threshold values | 
 
 
 
 
 
 
 
 | 230 | + | # | 
 
 
 
 
 
 
 
 | 231 | + | # note: if the UPPER threshold is broken, | 
 
 
 
 
 
 
 
 | 232 | + | # the alertTimeout values are halved. | 
 
 
 
 
 
 
 
 | 233 | + | # This is to escalate the alert quicker. | 
 
 
 
 
 
 
 
 | 234 | + | Monitor.Queue.threshold.LOWER=90 | 
 
 
 
 
 
 
 
 | 235 | + | Monitor.Queue.threshold.UPPER=95 | 
 
 
 
 
 
 
 
 | 236 | + | Monitor.Queue.thresholdMeasure=PERCENTAGE | 
 
 
 
 
 
 
 
 | 237 | + |  | 
 
 
 
 
 
 
 
 | 238 | + | # timings of the alerts (in seconds) | 
 
 
 
 
 
 
 
 | 239 | + | Monitor.Queue.alertTimeout.NOTICE=60 | 
 
 
 
 
 
 
 
 | 240 | + | Monitor.Queue.alertTimeout.WARNING=900 | 
 
 
 
 
 
 
 
 | 241 | + | Monitor.Queue.alertTimeout.CAUTION=1800 | 
 
 
 
 
 
 
 
 | 242 | + | Monitor.Queue.alertTimeout.CRITICAL=3600 | 
 
 
 
 
 
 
 
 | 243 | + |  | 
 
 
 
 
 
 
 
 | 244 | + |  | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 245 |  | ## Services monitor configuration | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 246 |  | # threshold values | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 247 |  | # | 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 | 313 |  |  | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 314 |  | # alerters to run | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 315 |  | Alerter.PluginsPackage=uk.org.iscream.client.alerters | 
 
 
 
 
 
 
 
 
 
 
 | 316 | < | Alerter.Plugins=EMail;IRC;WebFeeder; | 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 | 316 | > | #Alerter.Plugins=EMail;IRC;WebFeeder; | 
 
 
 
 
 | 317 | > | Alerter.Plugins=IRC;WebFeeder; | 
 
 
 
 
 | 318 | > | #Alerter.Plugins=WebFeeder; | 
 
 
 
 
 | 319 | > | #Alerter.Plugins= | 
 
 
 
 
 
 
 
 
 
 
 | 320 |  |  | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 321 |  | # EMail alerter configuration | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 322 |  | Alerter.EMail.level = WARNING | 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 | 359 |  | WebFeeder.latestActive = true | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 360 |  | WebFeeder.alertActive = true | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 361 |  |  | 
 
 
 
 
 
 
 
 | 362 | + | # Only pass on alerts past this level | 
 
 
 
 
 
 
 
 | 363 | + | WebFeeder.alertLevel = OK | 
 
 
 
 
 
 
 
 | 364 | + |  | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 365 |  | # Check period in seconds (for cleaning stale/old alerts) | 
 
 
 
 
 
 
 
 
 
 
 | 366 | < | WebFeeder.checkPeriod = 1800 | 
 
 
 
 
 
 
 
 
 | 366 | > | WebFeeder.checkPeriod = 120 | 
 
 
 
 
 
 
 
 
 
 
 | 367 |  |  | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 368 |  | # Delete alerts older than this, in seconds. | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 369 |  | # Files are only checked every WebFeeder.checkPeriod seconds. | 
 
 
 
 
 
 
 
 
 
 
 | 370 | < | WebFeeder.alertDeleteOlderThan = 3600 | 
 
 
 
 
 
 
 
 
 | 370 | > | WebFeeder.alertDeleteOlderThan = 300 | 
 
 
 
 
 
 
 
 
 
 
 | 371 |  |  | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 372 |  | # Root Path | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 373 |  | WebFeeder.rootPath = /usr/local/proj/co600_10/webroot |