ViewVC Help
View File | Revision Log | Show Annotations | Revision Graph | Root Listing
root/i-scream/projects/cms/source/server/build/etc/system.conf
Revision: 1.47
Committed: Thu Mar 22 02:18:05 2001 UTC (23 years, 6 months ago) by tdb
Branch: MAIN
Changes since 1.46: +40 -127 lines
Log Message:
Tidied up the Monitor's section. Alert timeouts are stored as defaults, which
can be overridden. This saves repeating the same values.
Also neatened the layout and comments. More detailed explanation could be given
in the user documentation.

File Contents

# Content
1 # This is the default system configuration file
2 # used by all components of the i-scream system
3 #
4 # ALL configuration that uses the centralised
5 # configuration system has this file as its
6 # root of configuration
7 #
8 # $Author: tdb1 $
9 # $Id: system.conf,v 1.46 2001/03/22 02:06:07 tdb1 Exp $
10 #
11 ############################################################
12 #### Configuration Files & Groups
13 ############################################################
14
15 # for computing machines
16 group.computing=Host.129.12.4.*;
17 group.rocks=Host.agate.ukc.ac.uk;Host.arkose.ukc.ac.uk;Host.basalt.ukc.ac.uk;Host.chalk.ukc.ac.uk;\
18 Host.chert.ukc.ac.uk;Host.granite.ukc.ac.uk;Host.jade.ukc.ac.uk;Host.jasper.ukc.ac.uk;\
19 Host.magnetite.ukc.ac.uk;Host.obsidian.ukc.ac.uk;Host.pumice.ukc.ac.uk;\
20 Host.pyrite.ukc.ac.uk;Host.slate.ukc.ac.uk;Host.topaz.ukc.ac.uk;
21 group.compsoc=Host.compsoc1.ukc.ac.uk
22
23 config.computing=computing.conf
24 config.rocks=rocks.conf
25 config.compsoc1=rocks.conf
26
27 # for library machines
28 group.library=Host.129.12.58.*;
29 config.library=library.conf
30
31 # for SSB machines
32 group.ssb=Host.stue*.ukc.ac.uk;
33 config.ssb=ssb.conf
34
35 # mySQL configuration
36 config.mySQL=mySQL.conf
37
38 ############################################################
39 #### Misc system-wide configuration
40 ############################################################
41
42 # the interval (in seconds) at which checks should be
43 # made for changes in configuration
44 ConfigurationProxy.updateTime=60
45
46 # The time interval at which the Queues should be monitored
47 Queue.MonitorInterval=15
48 # The upper limit for a Queue
49 Queue.SizeLimit=1000
50 # The removal algorithm
51 Queue.RemoveAlgorithm=FIRST
52
53
54 ############################################################
55 #### FilterManager configuration
56 ############################################################
57
58 # The default port to listen for new host connections
59 FilterManager.listenPort=4567
60
61
62
63 ############################################################
64 #### Filter configuration
65 ############################################################
66
67 # The default port for Filters to listen on
68 Filter.UDPListenPort=4589
69 Filter.TCPListenPort=4589
70
71 # Plugin Information
72 Filter.PluginsPackage=uk.org.iscream.filter.plugins
73 Filter.Plugins=TypeChecker;EnforceEssentialData
74
75 # The name for the root filter
76 RootFilter.name=root
77
78 # The default parent filter (should almost always be the same as RootFilter.name)
79 Filter.parentFilter=root
80
81
82
83 ############################################################
84 #### Root filter interfaces configuration
85 ############################################################
86
87 # Comment either of these (or delete them) and
88 # that interface won't be started
89 RootFilter.realtimeInterfaceName=realtimeclients
90 RootFilter.dbInterfaceName=database
91
92
93
94 ############################################################
95 #### Client interface configuration
96 ############################################################
97
98 # The port for the client interface to listen on
99 ClientInterface.listenPort=4510
100
101
102
103 ############################################################
104 #### Host Configuration
105 ############################################################
106
107 # The default filter for a new host
108 Host.filter=computingFilter;
109
110 # The default update times for a new host
111 Host.UDPUpdateTime=10
112 Host.TCPUpdateTime=60
113 Host.AveragerUpdateTime=5
114
115 # The package containing the service checks to run on a host
116 Host.serviceChecksPackage=uk.org.iscream.filter.plugins
117
118
119
120 ############################################################
121 #### Monitor Configuration
122 ############################################################
123
124 ## The monitors to run
125 Monitor.PluginsPackage=uk.org.iscream.client.monitors
126 Monitor.Plugins=CPU;Load;Process;Disk;Memory;Swap;Services;Heartbeat;Queue;WebFeeder;
127
128 ## Default alert timeouts
129 # these can be overridden on a per-monitor basis
130 # timings of the alerts (in seconds)
131 Monitor.alertTimeout.NOTICE=60
132 Monitor.alertTimeout.WARNING=900
133 Monitor.alertTimeout.CAUTION=1800
134 Monitor.alertTimeout.CRITICAL=3600
135
136 ## Threshold values
137 #
138 # note: if the UPPER threshold is broken,
139 # the alertTimeout values are halved.
140 # This is to escalate the alert quicker.
141 #
142
143 # CPU monitor threshold values
144 Monitor.CPU.threshold.LOWER=90
145 Monitor.CPU.threshold.UPPER=99
146
147
148 # Load monitor threshold values
149 Monitor.Load.threshold.LOWER=10.0
150 Monitor.Load.threshold.UPPER=20.0
151
152
153 # Process Count threshold values
154 Monitor.Process.threshold.LOWER=1000
155 Monitor.Process.threshold.UPPER=1500
156
157
158 # Memory monitor threshold values
159 Monitor.Memory.threshold.LOWER=80
160 Monitor.Memory.threshold.UPPER=90
161
162
163 # Swap monitor threshold values
164 Monitor.Swap.threshold.LOWER=80
165 Monitor.Swap.threshold.UPPER=90
166
167
168 # Disk monitor threshold values
169 Monitor.Disk.threshold.LOWER=90
170 Monitor.Disk.threshold.UPPER=95
171 # Thresholds given are PERCENTAGE or VALUE
172 # where PERCENTAGE is a percentage of disk in use
173 # and VALUE is an absolute value of space free
174 Monitor.Disk.thresholdMeasure=PERCENTAGE
175
176
177 # Queue monitor threshold values
178 Monitor.Queue.threshold.LOWER=90
179 Monitor.Queue.threshold.UPPER=95
180 # Thresholds given are PERCENTAGE or VALUE
181 # where PERCENTAGE is a percentage of disk in use
182 # and VALUE is an absolute value of space free
183 Monitor.Queue.thresholdMeasure=PERCENTAGE
184
185
186 # Services monitor threshold values
187 #
188 # THE SERVICES MONITOR USES A HACK
189 # WHEREBY IT USES THE SERVICE STATUS
190 # AS THE THRESHOLD LEVEL. THIS SHOULD
191 # BE LOOKED AT!
192 #
193 # how many times we should be at the highest level before
194 # we go to a FINAL alert
195 Monitor.Services.reachFINALcount=5
196
197
198 # Heartbeat threshold values
199 # these are values in seconds from when the heartbeat
200 # was *expected* to arrive (ie. last + heartbeat period)
201 Monitor.Heartbeat.threshold.LOWER=120
202 Monitor.Heartbeat.threshold.UPPER=300
203 # this is how often we will run a "check" of heartbeats
204 Monitor.Heartbeat.checkPeriod=30
205 # how many times we should be at the highest level before
206 # we go to a FINAL alert
207 Monitor.Heartbeat.reachFINALcount=5
208
209
210
211 ############################################################
212 #### Alerter Configuration
213 ############################################################
214 # The following variables are understood by ALL alerters for messages
215 #
216 # %level% - the alert level (eg, WARNING)
217 # %threshold% - the threshold broken (eg, LOWER)
218 # %source% - the source of the alert (eg, raptor.ukc.ac.uk)
219 # %value% - the value reached (eg, 95)
220 # %thresholdValue% - the value of the threshold broken (eg, 90)
221 # %attributeName% - the attribute that has caused the alert (eg, CPU User)
222 # %timeTillNextAlert% - the time until the next alert will be sent out
223 # %timeSinceFirstAlert% - the time elapsed since the first alert for this problem
224 # %timeOfFirstAlert% - the time the first alert was sent
225 #
226
227 # alerters to run
228 Alerter.PluginsPackage=uk.org.iscream.client.alerters
229 Alerter.Plugins=EMail;IRC;WebFeeder;
230
231
232 # EMail alerter configuration
233 Alerter.EMail.level = WARNING
234 Alerter.EMail.destList = dev@i-scream.org.uk
235 Alerter.EMail.sender = dev@i-scream.org.uk
236 Alerter.EMail.smtpServer = mercury.ukc.ac.uk
237 Alerter.EMail.subject = i-scream alert: %level% alert on %source% for %attributeName%
238 Alerter.EMail.message = The i-scream distributed central monitoring system has\nraised a %level% alert for the host %source%.\n\nThe value for %attributeName% of %value% has exceeded the\n%threshold% threshold value of %thresholdValue%.\n\nThis alert was originally raised at %timeOfFirstAlert%,\nwhich was %timeSinceFirstAlert% ago.\n\nThe next alert (should one occur) will be sent in %timeTillNextAlert%.
239
240
241 # IRC alerter configuration
242 Alerter.IRC.level = OK
243 Alerter.IRC.IRCServer = killigrew.ukc.ac.uk
244 Alerter.IRC.IRCPort = 6667
245 Alerter.IRC.nickList = iscreamBot;_iscreamBot;i-screamBot
246 Alerter.IRC.user = i-scream
247 Alerter.IRC.comment = i-scream alerting bot
248 Alerter.IRC.channel = #i-scream
249 Alerter.IRC.message = %level%: %attributeName% on %source% has passed %threshold%(%thresholdValue%) threshold with %value% - time till next alert (should one occur), %timeTillNextAlert%
250 Alerter.IRC.reconnectDelay = 30
251 Alerter.IRC.startupNotice = i-scream alerting bot activated
252 Alerter.IRC.stopCommand = stop alerts
253 Alerter.IRC.startCommand = start alerts
254 Alerter.IRC.lastAlertCommand = last alert
255 Alerter.IRC.joinCommand = join
256 Alerter.IRC.nickChangeCommand = nick
257 Alerter.IRC.statCommand = statistics
258 Alerter.IRC.uptimeCommand = uptime
259 Alerter.IRC.timeSinceLastAlertCommand = time since last alert
260 Alerter.IRC.versionCommand = version
261 Alerter.IRC.helpCommand = help
262 Alerter.IRC.rejectMessage = sorry, I don't understand your request
263
264
265
266 ############################################################
267 #### WebFeeder Configuration
268 ############################################################
269
270 # Define these (one or both) to turn on the WebFeeders,
271 # comment them out to turn them off
272 WebFeeder.latestActive = true
273 WebFeeder.alertActive = true
274
275 # Only pass on alerts past this level
276 WebFeeder.alertLevel = OK
277
278 # Check period in seconds (for cleaning stale/old alerts)
279 WebFeeder.checkPeriod = 120
280
281 # Delete alerts older than this, in seconds.
282 # Files are only checked every WebFeeder.checkPeriod seconds.
283 WebFeeder.alertDeleteOlderThan = 300
284
285 # Root Path
286 WebFeeder.rootPath = /usr/local/proj/co600_10/webroot
287
288 # Latest Data
289 WebFeeder.latestSubDir = latest
290 WebFeeder.latestFileName = latest_data
291
292 # Alert Data
293 WebFeeder.alertSubDir = alert
294 WebFeeder.alertFileName = alert_data
295
296
297 ############################################################