ViewVC Help
View File | Revision Log | Show Annotations | Revision Graph | Root Listing
root/i-scream/projects/cms/source/server/build/etc/system.conf
Revision: 1.58
Committed: Mon Nov 26 12:56:33 2001 UTC (22 years, 9 months ago) by tdb
Branch: MAIN
Branch point for: SERVER_PIRCBOT
Changes since 1.57: +5 -1 lines
Log Message:
Completing this feature request:
  [ #479631 ] heartbeat monitor - starting list

Adds hosts defined in this configuration value to the heartbeat monitor on
startup.

Monitor.Heartbeat.initialHosts=raptor.ukc.ac.uk;myrtle.ukc.ac.uk

This means the Heartbeat Monitor will generate heartbeat alerts if these
hosts don't send in a heartbeat within the expected time. This is useful in
situations where the i-scream server comes up after the hosts have gone
down, which usually wouldn't have generated an alert - because the server
would never have seen the hosts to know they're gone.

File Contents

# User Rev Content
1 tdb 1.2 # This is the default system configuration file
2     # used by all components of the i-scream system
3     #
4     # ALL configuration that uses the centralised
5     # configuration system has this file as its
6     # root of configuration
7     #
8 tdb 1.36 # $Author: tdb1 $
9 tdb 1.58 # $Id: system.conf,v 1.57 2001/11/07 17:51:41 tdb1 Exp $
10 ajm 1.14 #
11     ############################################################
12     #### Configuration Files & Groups
13     ############################################################
14    
15     # for computing machines
16 tdb 1.15 group.computing=Host.129.12.4.*;
17 tdb 1.41 group.rocks=Host.agate.ukc.ac.uk;Host.arkose.ukc.ac.uk;Host.basalt.ukc.ac.uk;Host.chalk.ukc.ac.uk;\
18     Host.chert.ukc.ac.uk;Host.granite.ukc.ac.uk;Host.jade.ukc.ac.uk;Host.jasper.ukc.ac.uk;\
19     Host.magnetite.ukc.ac.uk;Host.obsidian.ukc.ac.uk;Host.pumice.ukc.ac.uk;\
20     Host.pyrite.ukc.ac.uk;Host.slate.ukc.ac.uk;Host.topaz.ukc.ac.uk;
21 tdb 1.42 group.compsoc=Host.compsoc1.ukc.ac.uk
22 tdb 1.41
23 tdb 1.15 config.computing=computing.conf
24 tdb 1.41 config.rocks=rocks.conf
25 tdb 1.42 config.compsoc1=rocks.conf
26 ajm 1.14
27     # for library machines
28 tdb 1.15 group.library=Host.129.12.58.*;
29 ajm 1.14 config.library=library.conf
30    
31 tdb 1.15 # for SSB machines
32     group.ssb=Host.stue*.ukc.ac.uk;
33     config.ssb=ssb.conf
34    
35 ajm 1.14 # mySQL configuration
36     config.mySQL=mySQL.conf
37    
38 ajm 1.16 ############################################################
39     #### Misc system-wide configuration
40     ############################################################
41    
42     # the interval (in seconds) at which checks should be made for
43     # changes in configuration
44     ConfigurationProxy.updateTime=60
45    
46     # The time interval at which the Queues should be monitored
47     Queue.MonitorInterval=15
48 tdb 1.40 # The upper limit for a Queue
49     Queue.SizeLimit=1000
50     # The removal algorithm
51     Queue.RemoveAlgorithm=FIRST
52 tdb 1.2
53 ajm 1.14
54     ############################################################
55     #### FilterManager configuration
56     ############################################################
57 tdb 1.2
58     # The default port to listen for new host connections
59     FilterManager.listenPort=4567
60    
61 ajm 1.14
62    
63     ############################################################
64     #### Filter configuration
65     ############################################################
66    
67 tdb 1.2 # The default port for Filters to listen on
68     Filter.UDPListenPort=4589
69     Filter.TCPListenPort=4589
70    
71 ajm 1.14 # Plugin Information
72 tdb 1.55 Filter.PluginsPackage=uk.org.iscream.cms.server.filter.plugins
73 ajm 1.14 Filter.Plugins=TypeChecker;EnforceEssentialData
74    
75 tdb 1.2 # The name for the root filter
76     RootFilter.name=root
77 ajm 1.14
78     # The default parent filter (should almost always be the same as RootFilter.name)
79     Filter.parentFilter=root
80    
81    
82    
83     ############################################################
84     #### Root filter interfaces configuration
85     ############################################################
86    
87 tdb 1.2 # Comment out either of these (or delete them) and
88     # that interface won't be started
89     RootFilter.realtimeInterfaceName=realtimeclients
90 tdb 1.6 RootFilter.dbInterfaceName=database
91 tdb 1.2
92 ajm 1.14
93    
94     ############################################################
95     #### Client interface configuration
96     ############################################################
97    
98 tdb 1.2 # The port for the client interface to listen on
99     ClientInterface.listenPort=4510
100 tdb 1.52 # The name for the client interface
101     ClientInterface.name=realtimeclients
102    
103    
104    
105     ############################################################
106     #### Database interface configuration
107     ############################################################
108    
109     # The name for the Database interface
110     DBInterface.name=database
111 tdb 1.2
112 ajm 1.14
113    
114     ############################################################
115     #### Host Configuration
116     ############################################################
117 tdb 1.2
118     # The default filter for a new host
119 tdb 1.36 Host.filter=computingFilter;
120 tdb 1.13
121 tdb 1.2 # The default update times for a new host
122 tdb 1.7 Host.UDPUpdateTime=10
123 tdb 1.2 Host.TCPUpdateTime=60
124 tdb 1.15 Host.AveragerUpdateTime=5
125 tdb 1.2
126 ajm 1.8 # The service checks to run on a host
127 tdb 1.55 Host.serviceChecksPackage=uk.org.iscream.cms.server.filter.plugins
128 tdb 1.2
129 ajm 1.14
130 tdb 1.12
131 ajm 1.14 ############################################################
132     #### Monitor Configuration
133     ############################################################
134    
135 tdb 1.47 ## The monitors to run
136 tdb 1.55 Monitor.PluginsPackage=uk.org.iscream.cms.server.client.monitors
137 tdb 1.51 Monitor.Plugins=CPU;Load;Process;Disk;Memory;Swap;Services;\
138     Heartbeat;Queue;UserCount;WebFeeder;
139 tdb 1.24
140 tdb 1.47 ## Default alert timeouts
141     # these can be overridden on a per-monitor basis
142     # timings of the alerts (in seconds)
143     Monitor.alertTimeout.NOTICE=60
144     Monitor.alertTimeout.WARNING=900
145     Monitor.alertTimeout.CAUTION=1800
146     Monitor.alertTimeout.CRITICAL=3600
147 ajm 1.14
148 tdb 1.47 ## Threshold values
149 ajm 1.16 #
150     # note: if the UPPER threshold is broken,
151     # the alertTimeout values are halved.
152     # This is to escalate the alert quicker.
153 tdb 1.47 #
154    
155     # CPU monitor threshold values
156 ajm 1.16 Monitor.CPU.threshold.LOWER=90
157     Monitor.CPU.threshold.UPPER=99
158    
159 tdb 1.44
160 tdb 1.47 # Load monitor threshold values
161 tdb 1.44 Monitor.Load.threshold.LOWER=10.0
162     Monitor.Load.threshold.UPPER=20.0
163    
164    
165 tdb 1.47 # Process Count threshold values
166 tdb 1.44 Monitor.Process.threshold.LOWER=1000
167     Monitor.Process.threshold.UPPER=1500
168    
169 tdb 1.24
170 tdb 1.47 # Memory monitor threshold values
171 tdb 1.24 Monitor.Memory.threshold.LOWER=80
172     Monitor.Memory.threshold.UPPER=90
173    
174    
175 tdb 1.47 # Swap monitor threshold values
176 tdb 1.24 Monitor.Swap.threshold.LOWER=80
177     Monitor.Swap.threshold.UPPER=90
178 tdb 1.50
179    
180     # UserCount monitor threshold values
181     Monitor.UserCount.threshold.LOWER=100
182     Monitor.UserCount.threshold.UPPER=200
183 tdb 1.24
184 ajm 1.33
185 tdb 1.47 # Disk monitor threshold values
186 tdb 1.42 Monitor.Disk.threshold.LOWER=90
187     Monitor.Disk.threshold.UPPER=95
188 tdb 1.47 # Thresholds given are PERCENTAGE or VALUE
189     # where PERCENTAGE is a percentage of disk in use
190     # and VALUE is an absolute value of space free
191 tdb 1.46 Monitor.Disk.thresholdMeasure=PERCENTAGE
192 ajm 1.33
193 tdb 1.46
194 tdb 1.56 # Queue monitor threshold values
195 tdb 1.49 Monitor.Queue.threshold.LOWER=50
196     Monitor.Queue.threshold.UPPER=80
197 tdb 1.47 # Thresholds given are PERCENTAGE or VALUE
198     # where PERCENTAGE is a percentage of the queue in use
199     # and VALUE is an absolute value (presumably the number of items queued)
200 tdb 1.46 Monitor.Queue.thresholdMeasure=PERCENTAGE
201    
202 ajm 1.34
203 tdb 1.47 # Services monitor threshold values
204 ajm 1.34 #
205     # THE SERVICES MONITOR USES A HACK
206     # WHEREBY IT USES THE SERVICE STATUS
207     # AS THE THRESHOLD LEVEL. THIS SHOULD
208     # BE LOOKED AT!
209     #
210 tdb 1.47 # how many times we should be at the highest level before
211     # we go to a FINAL alert
212 tdb 1.38 Monitor.Services.reachFINALcount=5
213    
214 ajm 1.14
215 tdb 1.47 # Heartbeat threshold values
216 tdb 1.25 # these are values in seconds from when the heartbeat
217     # was *expected* to arrive (i.e. last + heartbeat period)
218 tdb 1.48 Monitor.Heartbeat.threshold.LOWER=180
219 tdb 1.38 Monitor.Heartbeat.threshold.UPPER=300
220 tdb 1.47 # this is how often we will run a "check" of heartbeats
221 tdb 1.48 Monitor.Heartbeat.checkPeriod=50
222 tdb 1.47 # how many times we should be at the highest level before
223     # we go to a FINAL alert
224     Monitor.Heartbeat.reachFINALcount=5
225 tdb 1.58 # list of hosts we expect to have at startup
226     # this ensures we notice hosts that aren't running, not
227     # just those that have gone down recently.
228     Monitor.Heartbeat.initialHosts=raptor.ukc.ac.uk;myrtle.ukc.ac.uk;kestrel.ukc.ac.uk
229 tdb 1.47
230 ajm 1.14
231 ajm 1.23
232 ajm 1.14 ############################################################
233     #### Alerter Configuration
234     ############################################################
235 ajm 1.23 # The following variables are understood by ALL alerters for messages
236     #
237     # %level% - the alert level (eg, WARNING)
238     # %threshold% - the threshold broken (eg, LOWER)
239     # %source% - the source of the alert (eg, raptor.ukc.ac.uk)
240     # %value% - the value reached (eg, 95)
241     # %thresholdValue% - the value of the threshold broken (eg, 90)
242     # %attributeName% - the attribute that has caused the alert (eg, CPU User)
243     # %timeTillNextAlert% - the time the next alert will be sent out
244     # %timeSinceFirstAlert% - the time elapsed since the first alert for this problem
245     # %timeOfFirstAlert% - the time the first alert was sent
246     #
247 ajm 1.14
248     # alerters to run
249 tdb 1.55 Alerter.PluginsPackage=uk.org.iscream.cms.server.client.alerters
250 tdb 1.54 Alerter.Plugins=EMail;IRC;WebFeeder;Logging;
251 tdb 1.47
252 ajm 1.14
253     # EMail alerter configuration
254 tdb 1.38 Alerter.EMail.level = WARNING
255     Alerter.EMail.destList = dev@i-scream.org.uk
256 ajm 1.14 Alerter.EMail.sender = dev@i-scream.org.uk
257     Alerter.EMail.smtpServer = mercury.ukc.ac.uk
258 ajm 1.16 Alerter.EMail.subject = i-scream alert: %level% alert on %source% for %attributeName%
259 tdb 1.38 Alerter.EMail.message = The i-scream distributed central monitoring system has\nraised a %level% alert for the host %source%.\n\nThe value for %attributeName% of %value% has exceeded the\n%threshold% threshold value of %thresholdValue%.\n\nThis alert was originally raised at %timeOfFirstAlert%,\nwhich was %timeSinceFirstAlert% ago.\n\nThe next alert (should one occur) will be sent in %timeTillNextAlert%.
260    
261 ajm 1.14
262     # IRC alerter configuration
263 ajm 1.16 Alerter.IRC.level = OK
264 ajm 1.14 Alerter.IRC.IRCServer = killigrew.ukc.ac.uk
265     Alerter.IRC.IRCPort = 6667
266 tdb 1.19 Alerter.IRC.nickList = iscreamBot;_iscreamBot;i-screamBot
267 tdb 1.17 Alerter.IRC.user = i-scream
268     Alerter.IRC.comment = i-scream alerting bot
269 ajm 1.14 Alerter.IRC.channel = #i-scream
270 ajm 1.16 Alerter.IRC.message = %level%: %attributeName% on %source% has passed %threshold%(%thresholdValue%) threshold with %value% - time till next alert (should one occur), %timeTillNextAlert%
271 tdb 1.17 Alerter.IRC.reconnectDelay = 30
272     Alerter.IRC.startupNotice = i-scream alerting bot activated
273     Alerter.IRC.stopCommand = stop alerts
274     Alerter.IRC.startCommand = start alerts
275     Alerter.IRC.lastAlertCommand = last alert
276     Alerter.IRC.joinCommand = join
277 tdb 1.18 Alerter.IRC.nickChangeCommand = nick
278     Alerter.IRC.statCommand = statistics
279     Alerter.IRC.uptimeCommand = uptime
280     Alerter.IRC.timeSinceLastAlertCommand = time since last alert
281 tdb 1.19 Alerter.IRC.versionCommand = version
282 tdb 1.17 Alerter.IRC.helpCommand = help
283     Alerter.IRC.rejectMessage = sorry, I don't understand your request
284 tdb 1.54
285    
286     # Logging alerter configuration
287     Alerter.Logging.level = WARNING
288 tdb 1.57 Alerter.Logging.message = %level%: %attributeName% on %source% has passed %threshold%(%thresholdValue%) threshold with %value%
289 tdb 1.29
290 tdb 1.47
291    
292 tdb 1.29 ############################################################
293     #### WebFeeder Configuration
294     ############################################################
295    
296 tdb 1.32 # Define these (one or both) to turn on the WebFeeders,
297     # comment them out to turn them off
298     WebFeeder.latestActive = true
299     WebFeeder.alertActive = true
300 tdb 1.43
301     # Only pass on alerts past this level
302 tdb 1.53 Alerter.WebFeeder.level = OK
303 tdb 1.37
304     # Check period in seconds (for cleaning stale/old alerts)
305 tdb 1.42 WebFeeder.checkPeriod = 120
306 tdb 1.37
307     # Delete alerts older than this, in seconds.
308     # Files are only checked every WebFeeder.checkPeriod seconds.
309 tdb 1.42 WebFeeder.alertDeleteOlderThan = 300
310 tdb 1.32
311 tdb 1.29 # Root Path
312     WebFeeder.rootPath = /usr/local/proj/co600_10/webroot
313    
314     # Latest Data
315     WebFeeder.latestSubDir = latest
316 tdb 1.31 WebFeeder.latestFileName = latest_data
317 tdb 1.32
318     # Alert Data
319     WebFeeder.alertSubDir = alert
320     WebFeeder.alertFileName = alert_data
321 ajm 1.16
322 tdb 1.47
323 tdb 1.17 ############################################################