ViewVC Help
View File | Revision Log | Show Annotations | Revision Graph | Root Listing
root/i-scream/projects/cms/source/server/build/etc/system.conf
Revision: 1.58
Committed: Mon Nov 26 12:56:33 2001 UTC (22 years, 5 months ago) by tdb
Branch: MAIN
Branch point for: SERVER_PIRCBOT
Changes since 1.57: +5 -1 lines
Log Message:
Completing this feature request:
  [ #479631 ] heartbeat monitor - starting list

Adds hosts defined in this configuration value to the heartbeat monitor on
startup.

Monitor.Heartbeat.initialHosts=raptor.ukc.ac.uk;myrtle.ukc.ac.uk

This means the Heartbeat Monitor will generate heartbeat alerts if these
hosts don't send in a heartbeat within the expected time. This is useful in
situations where the i-scream server comes up after the hosts have gone
down, which usually wouldn't have generated an alert - because the server
would never have seen the hosts to know they're gone.

File Contents

# Content
1 # This is the default system configuration file
2 # used by all components of the i-scream system
3 #
4 # ALL configuration that uses the centralised
5 # configuration system has this file as its
6 # root of configuration
7 #
8 # $Author: tdb1 $
9 # $Id: system.conf,v 1.57 2001/11/07 17:51:41 tdb1 Exp $
10 #
11 ############################################################
12 #### Configuration Files & Groups
13 ############################################################
14
15 # for computing machines
16 group.computing=Host.129.12.4.*;
17 group.rocks=Host.agate.ukc.ac.uk;Host.arkose.ukc.ac.uk;Host.basalt.ukc.ac.uk;Host.chalk.ukc.ac.uk;\
18 Host.chert.ukc.ac.uk;Host.granite.ukc.ac.uk;Host.jade.ukc.ac.uk;Host.jasper.ukc.ac.uk;\
19 Host.magnetite.ukc.ac.uk;Host.obsidian.ukc.ac.uk;Host.pumice.ukc.ac.uk;\
20 Host.pyrite.ukc.ac.uk;Host.slate.ukc.ac.uk;Host.topaz.ukc.ac.uk;
21 group.compsoc=Host.compsoc1.ukc.ac.uk
22
23 config.computing=computing.conf
24 config.rocks=rocks.conf
25 config.compsoc1=rocks.conf
26
27 # for library machines
28 group.library=Host.129.12.58.*;
29 config.library=library.conf
30
31 # for SSB machines
32 group.ssb=Host.stue*.ukc.ac.uk;
33 config.ssb=ssb.conf
34
35 # mySQL configuration
36 config.mySQL=mySQL.conf
37
38 ############################################################
39 #### Misc system-wide configuration
40 ############################################################
41
42 # the interval (in seconds) at which checks should be made for
43 # changes in configuration
44 ConfigurationProxy.updateTime=60
45
46 # The time interval at which the Queues should be monitored
47 Queue.MonitorInterval=15
48 # The upper limit for a Queue
49 Queue.SizeLimit=1000
50 # The removal algorithm
51 Queue.RemoveAlgorithm=FIRST
52
53
54 ############################################################
55 #### FilterManager configuration
56 ############################################################
57
58 # The default port to listen for new host connections
59 FilterManager.listenPort=4567
60
61
62
63 ############################################################
64 #### Filter configuration
65 ############################################################
66
67 # The default port for Filters to listen on
68 Filter.UDPListenPort=4589
69 Filter.TCPListenPort=4589
70
71 # Plugin Information
72 Filter.PluginsPackage=uk.org.iscream.cms.server.filter.plugins
73 Filter.Plugins=TypeChecker;EnforceEssentialData
74
75 # The name for the root filter
76 RootFilter.name=root
77
78 # The default parent filter (should almost always be the same as RootFilter.name)
79 Filter.parentFilter=root
80
81
82
83 ############################################################
84 #### Root filter interfaces configuration
85 ############################################################
86
87 # Comment out either of these (or delete them) and
88 # that interface won't be started
89 RootFilter.realtimeInterfaceName=realtimeclients
90 RootFilter.dbInterfaceName=database
91
92
93
94 ############################################################
95 #### Client interface configuration
96 ############################################################
97
98 # The port for the client interface to listen on
99 ClientInterface.listenPort=4510
100 # The name for the client interface
101 ClientInterface.name=realtimeclients
102
103
104
105 ############################################################
106 #### Database interface configuration
107 ############################################################
108
109 # The name for the Database interface
110 DBInterface.name=database
111
112
113
114 ############################################################
115 #### Host Configuration
116 ############################################################
117
118 # The default filter for a new host
119 Host.filter=computingFilter;
120
121 # The default update times for a new host
122 Host.UDPUpdateTime=10
123 Host.TCPUpdateTime=60
124 Host.AveragerUpdateTime=5
125
126 # The package containing the service checks to run on a host
127 Host.serviceChecksPackage=uk.org.iscream.cms.server.filter.plugins
128
129
130
131 ############################################################
132 #### Monitor Configuration
133 ############################################################
134
135 ## The monitors to run
136 Monitor.PluginsPackage=uk.org.iscream.cms.server.client.monitors
137 Monitor.Plugins=CPU;Load;Process;Disk;Memory;Swap;Services;\
138 Heartbeat;Queue;UserCount;WebFeeder;
139
140 ## Default alert timeouts
141 # these can be overridden on a per-monitor basis
142 # timings of the alerts (in seconds)
143 Monitor.alertTimeout.NOTICE=60
144 Monitor.alertTimeout.WARNING=900
145 Monitor.alertTimeout.CAUTION=1800
146 Monitor.alertTimeout.CRITICAL=3600
147
148 ## Threshold values
149 #
150 # note: if the UPPER threshold is broken,
151 # the alertTimeout values are halved.
152 # This is to escalate the alert quicker.
153 #
154
155 # CPU monitor threshold values
156 Monitor.CPU.threshold.LOWER=90
157 Monitor.CPU.threshold.UPPER=99
158
159
160 # Load monitor threshold values
161 Monitor.Load.threshold.LOWER=10.0
162 Monitor.Load.threshold.UPPER=20.0
163
164
165 # Process Count threshold values
166 Monitor.Process.threshold.LOWER=1000
167 Monitor.Process.threshold.UPPER=1500
168
169
170 # Memory monitor threshold values
171 Monitor.Memory.threshold.LOWER=80
172 Monitor.Memory.threshold.UPPER=90
173
174
175 # Swap monitor threshold values
176 Monitor.Swap.threshold.LOWER=80
177 Monitor.Swap.threshold.UPPER=90
178
179
180 # UserCount monitor threshold values
181 Monitor.UserCount.threshold.LOWER=100
182 Monitor.UserCount.threshold.UPPER=200
183
184
185 # Disk monitor threshold values
186 Monitor.Disk.threshold.LOWER=90
187 Monitor.Disk.threshold.UPPER=95
188 # Thresholds given are PERCENTAGE or VALUE
189 # where PERCENTAGE is a percentage of disk in use
190 # and VALUE is an absolute value of space free
191 Monitor.Disk.thresholdMeasure=PERCENTAGE
192
193
194 # Queue monitor threshold values
195 Monitor.Queue.threshold.LOWER=50
196 Monitor.Queue.threshold.UPPER=80
197 # Thresholds given are PERCENTAGE or VALUE
198 # where PERCENTAGE is presumably a percentage of the queue's capacity in use
199 # and VALUE an absolute queue size (wording was copied from the Disk monitor; confirm)
200 Monitor.Queue.thresholdMeasure=PERCENTAGE
201
202
203 # Services monitor threshold values
204 #
205 # THE SERVICES MONITOR USES A HACK
206 # WHEREBY IT USES THE SERVICE STATUS
207 # AS THE THRESHOLD LEVEL. THIS SHOULD
208 # BE LOOKED AT!
209 #
210 # how many times we should be at the highest level before
211 # we go to a FINAL alert
212 Monitor.Services.reachFINALcount=5
213
214
215 # Heartbeat threshold values
216 # these are values in seconds from when the heartbeat
217 # was *expected* to arrive (ie. last + heartbeat period)
218 Monitor.Heartbeat.threshold.LOWER=180
219 Monitor.Heartbeat.threshold.UPPER=300
220 # this is how often we will run a "check" of heartbeats
221 Monitor.Heartbeat.checkPeriod=50
222 # how many times we should be at the highest level before
223 # we go to a FINAL alert
224 Monitor.Heartbeat.reachFINALcount=5
225 # list of hosts we expect to have at startup
226 # this ensures we notice hosts that aren't running, not
227 # just those that have gone down recently.
228 Monitor.Heartbeat.initialHosts=raptor.ukc.ac.uk;myrtle.ukc.ac.uk;kestrel.ukc.ac.uk
229
230
231
232 ############################################################
233 #### Alerter Configuration
234 ############################################################
235 # The following variables are understood by ALL alerters for messages
236 #
237 # %level% - the alert level (eg, WARNING)
238 # %threshold% - the threshold broken (eg, LOWER)
239 # %source% - the source of the alert (eg, raptor.ukc.ac.uk)
240 # %value% - the value reached (eg, 95)
241 # %thresholdValue% - the value of the threshold broken (eg, 90)
242 # %attributeName% - the attribute that has caused the alert (eg, CPU User)
243 # %timeTillNextAlert% - the time until the next alert will be sent out
244 # %timeSinceFirstAlert% - the time elapsed since the first alert for this problem
245 # %timeOfFirstAlert% - the time the first alert was sent
246 #
247
248 # alerters to run
249 Alerter.PluginsPackage=uk.org.iscream.cms.server.client.alerters
250 Alerter.Plugins=EMail;IRC;WebFeeder;Logging;
251
252
253 # EMail alerter configuration
254 Alerter.EMail.level = WARNING
255 Alerter.EMail.destList = dev@i-scream.org.uk
256 Alerter.EMail.sender = dev@i-scream.org.uk
257 Alerter.EMail.smtpServer = mercury.ukc.ac.uk
258 Alerter.EMail.subject = i-scream alert: %level% alert on %source% for %attributeName%
259 Alerter.EMail.message = The i-scream distributed central monitoring system has\nraised a %level% alert for the host %source%.\n\nThe value for %attributeName% of %value% has exceeded the\n%threshold% threshold value of %thresholdValue%.\n\nThis alert was originally raised at %timeOfFirstAlert%,\nwhich was %timeSinceFirstAlert% ago.\n\nThe next alert (should one occur) will be sent in %timeTillNextAlert%.
260
261
262 # IRC alerter configuration
263 Alerter.IRC.level = OK
264 Alerter.IRC.IRCServer = killigrew.ukc.ac.uk
265 Alerter.IRC.IRCPort = 6667
266 Alerter.IRC.nickList = iscreamBot;_iscreamBot;i-screamBot
267 Alerter.IRC.user = i-scream
268 Alerter.IRC.comment = i-scream alerting bot
269 Alerter.IRC.channel = #i-scream
270 Alerter.IRC.message = %level%: %attributeName% on %source% has passed %threshold%(%thresholdValue%) threshold with %value% - time till next alert (should one occur), %timeTillNextAlert%
271 Alerter.IRC.reconnectDelay = 30
272 Alerter.IRC.startupNotice = i-scream alerting bot activated
273 Alerter.IRC.stopCommand = stop alerts
274 Alerter.IRC.startCommand = start alerts
275 Alerter.IRC.lastAlertCommand = last alert
276 Alerter.IRC.joinCommand = join
277 Alerter.IRC.nickChangeCommand = nick
278 Alerter.IRC.statCommand = statistics
279 Alerter.IRC.uptimeCommand = uptime
280 Alerter.IRC.timeSinceLastAlertCommand = time since last alert
281 Alerter.IRC.versionCommand = version
282 Alerter.IRC.helpCommand = help
283 Alerter.IRC.rejectMessage = sorry, I don't understand your request
284
285
286 # Logging alerter configuration
287 Alerter.Logging.level = WARNING
288 Alerter.Logging.message = %level%: %attributeName% on %source% has passed %threshold%(%thresholdValue%) threshold with %value%
289
290
291
292 ############################################################
293 #### WebFeeder Configuration
294 ############################################################
295
296 # Define these (one or both) to turn on the WebFeeders,
297 # comment them out to turn them off
298 WebFeeder.latestActive = true
299 WebFeeder.alertActive = true
300
301 # Only pass on alerts past this level
302 Alerter.WebFeeder.level = OK
303
304 # Check period in seconds (for cleaning stale/old alerts)
305 WebFeeder.checkPeriod = 120
306
307 # Delete alerts older than this, in seconds.
308 # Files are only checked every WebFeeder.checkPeriod seconds.
309 WebFeeder.alertDeleteOlderThan = 300
310
311 # Root Path
312 WebFeeder.rootPath = /usr/local/proj/co600_10/webroot
313
314 # Latest Data
315 WebFeeder.latestSubDir = latest
316 WebFeeder.latestFileName = latest_data
317
318 # Alert Data
319 WebFeeder.alertSubDir = alert
320 WebFeeder.alertFileName = alert_data
321
322
323 ############################################################