ViewVC Help
View File | Revision Log | Show Annotations | Revision Graph | Root Listing
root/i-scream/projects/cms/source/server/build/etc/system.conf
Revision: 1.25
Committed: Wed Mar 7 01:23:31 2001 UTC (23 years, 8 months ago) by tdb
Branch: MAIN
Changes since 1.24: +4 -2 lines
Log Message:
Added a comment to clarify the situation with heartbeat thresholds.

File Contents

# User Rev Content
1 tdb 1.2 # This is the default system configuration file
2     # used by all components of the i-scream system
3     #
4     # ALL configuration that uses the centralised
5     # configuration system has this file as its
6     # root of configuration
7     #
8 tdb 1.25 # $Author: tdb1 $
9     # $Id: system.conf,v 1.24 2001/03/06 23:52:57 tdb1 Exp $
10 ajm 1.14 #
11     ############################################################
12     #### Configuration Files & Groups
13     ############################################################
14    
15     # for computing machines
16 tdb 1.15 group.computing=Host.129.12.4.*;
17     config.computing=computing.conf
18 ajm 1.14
19     # for library machines
20 tdb 1.15 group.library=Host.129.12.58.*;
21 ajm 1.14 config.library=library.conf
22    
23 tdb 1.15 # for SSB machines
24     group.ssb=Host.stue*.ukc.ac.uk;
25     config.ssb=ssb.conf
26    
27 ajm 1.14 # mySQL configuration
28     config.mySQL=mySQL.conf
29    
30 ajm 1.16 ############################################################
31     #### Misc system-wide configuration
32     ############################################################
33    
34     # the interval (in seconds) at which checks should be
35     # made for changes in configuration
36     ConfigurationProxy.updateTime=60
37    
38     # The time interval at which the Queues should be monitored
39     Queue.MonitorInterval=15
40    
41 tdb 1.2
42 ajm 1.14
43     ############################################################
44     #### FilterManager configuration
45     ############################################################
46 tdb 1.2
47     # The default port to listen for new host connections
48     FilterManager.listenPort=4567
49    
50 ajm 1.14
51    
52     ############################################################
53     #### Filter configuration
54     ############################################################
55    
56 tdb 1.2 # The default port for Filters to listen on
57     Filter.UDPListenPort=4589
58     Filter.TCPListenPort=4589
59    
60 ajm 1.14 # Plugin Information
61     Filter.PluginsPackage=uk.ac.ukc.iscream.filter.plugins
62     Filter.Plugins=TypeChecker;EnforceEssentialData
63    
64 tdb 1.2 # The name for the root filter
65     RootFilter.name=root
66 ajm 1.14
67     # The default parent filter (should almost always be the same as RootFilter.name)
68     Filter.parentFilter=root
69    
70    
71    
72     ############################################################
73     #### Root filter interfaces configuration
74     ############################################################
75    
76 tdb 1.2 # Comment either of these (or delete them) and
77     # that interface won't be started
78     RootFilter.realtimeInterfaceName=realtimeclients
79 tdb 1.6 RootFilter.dbInterfaceName=database
80 tdb 1.2
81 ajm 1.14
82    
83     ############################################################
84     #### Client interface configuration
85     ############################################################
86    
87 tdb 1.2 # The port for the client interface to listen on
88     ClientInterface.listenPort=4510
89    
90 ajm 1.14
91    
92     ############################################################
93     #### Host Configuration
94     ############################################################
95 tdb 1.2
96     # The default filter for a new host
97 ajm 1.23 Host.filter=filter1;
98 tdb 1.13
99 tdb 1.2 # The default update times for a new host
100 tdb 1.7 Host.UDPUpdateTime=10
101 tdb 1.2 Host.TCPUpdateTime=60
102 tdb 1.15 Host.AveragerUpdateTime=5
103 tdb 1.2
104 ajm 1.8 # The service checks to run on a host
105     Host.serviceChecksPackage=uk.ac.ukc.iscream.filter.plugins
106 tdb 1.11 Host.serviceChecks=HTTP;SMTP
107 tdb 1.2
108 ajm 1.14
109 tdb 1.12
110 ajm 1.14 ############################################################
111     #### Monitor Configuration
112     ############################################################
113    
114     # the monitors to run
115     Monitor.PluginsPackage=uk.ac.ukc.iscream.client.monitors
116 tdb 1.24 Monitor.Plugins=CPU;Memory;Swap;Heartbeat;
117    
118 ajm 1.14
119 tdb 1.22 ## CPU monitor configuration
120 ajm 1.16 # threshold values
121     #
122     # note: if the UPPER threshold is broken,
123     # the alertTimeout values are halved.
124     # This is to escalate the alert quicker.
125     Monitor.CPU.threshold.LOWER=90
126     Monitor.CPU.threshold.UPPER=99
127    
128     # timings of the alerts (in seconds)
129     Monitor.CPU.alertTimeout.NOTICE=60
130     Monitor.CPU.alertTimeout.WARNING=900
131     Monitor.CPU.alertTimeout.CAUTION=1800
132     Monitor.CPU.alertTimeout.CRITICAL=3600
133 tdb 1.24
134    
135     ## Memory monitor configuration
136     # threshold values
137     #
138     # note: if the UPPER threshold is broken,
139     # the alertTimeout values are halved.
140     # This is to escalate the alert quicker.
141     Monitor.Memory.threshold.LOWER=80
142     Monitor.Memory.threshold.UPPER=90
143    
144     # timings of the alerts (in seconds)
145     Monitor.Memory.alertTimeout.NOTICE=60
146     Monitor.Memory.alertTimeout.WARNING=900
147     Monitor.Memory.alertTimeout.CAUTION=1800
148     Monitor.Memory.alertTimeout.CRITICAL=3600
149    
150    
151     ## Swap monitor configuration
152     # threshold values
153     #
154     # note: if the UPPER threshold is broken,
155     # the alertTimeout values are halved.
156     # This is to escalate the alert quicker.
157     Monitor.Swap.threshold.LOWER=80
158     Monitor.Swap.threshold.UPPER=90
159    
160     # timings of the alerts (in seconds)
161     Monitor.Swap.alertTimeout.NOTICE=60
162     Monitor.Swap.alertTimeout.WARNING=900
163     Monitor.Swap.alertTimeout.CAUTION=1800
164     Monitor.Swap.alertTimeout.CRITICAL=3600
165    
166 ajm 1.14
167 tdb 1.22 ## Heartbeat monitor configuration
168     # threshold values
169     #
170     # note: if the UPPER threshold is broken,
171     # the alertTimeout values are halved.
172     # This is to escalate the alert quicker.
173     Monitor.Heartbeat.checkPeriod=50
174 tdb 1.25 # these are values in seconds from when the heartbeat
175     # was *expected* to arrive (i.e. last + heartbeat period)
176 tdb 1.22 Monitor.Heartbeat.threshold.LOWER=120
177     Monitor.Heartbeat.threshold.UPPER=300
178 ajm 1.14
179 tdb 1.22 # timings of the alerts (in seconds)
180     Monitor.Heartbeat.alertTimeout.NOTICE=60
181     Monitor.Heartbeat.alertTimeout.WARNING=900
182     Monitor.Heartbeat.alertTimeout.CAUTION=1800
183     Monitor.Heartbeat.alertTimeout.CRITICAL=3600
184 ajm 1.14
185 ajm 1.23 # this means it will reach a FINAL level,
186     # and thus the host will be removed from the monitor list,
187     # if the highest level alert is reached and occurs this
188     # number of times.
189     #
190     # in this setup, that means 5 CRITICAL alerts would occur
191     # on a Heartbeat before reaching FINAL.
192     # If this value is wrong or not present, FINAL is never reached
193     #
194     Monitor.Heartbeat.reachFINALcount=5
195    
196 ajm 1.14 ############################################################
197     #### Alerter Configuration
198     ############################################################
199 ajm 1.23 # The following variables are understood by ALL alerters for messages
200     #
201     # %level% - the alert level (eg, WARNING)
202     # %threshold% - the threshold broken (eg, LOWER)
203     # %source% - the source of the alert (eg, raptor.ukc.ac.uk)
204     # %value% - the value reached (eg, 95)
205     # %thresholdValue% - the value of the threshold broken (eg, 90)
206     # %attributeName% - the attribute that has caused the alert (eg, CPU User)
207     # %timeTillNextAlert% - the time the next alert will be sent out
208     # %timeSinceFirstAlert% - the time elapsed since the first alert for this problem
209     # %timeOfFirstAlert% - the time the first alert was sent
210     #
211 ajm 1.14
212     # alerters to run
213     Alerter.PluginsPackage=uk.ac.ukc.iscream.client.alerters
214     Alerter.Plugins=EMail;IRC;
215    
216     # EMail alerter configuration
217 ajm 1.16 Alerter.EMail.level = CAUTION
218 tdb 1.20 Alerter.EMail.defaultDestList = dev@i-scream.org.uk
219 ajm 1.14 Alerter.EMail.sender = dev@i-scream.org.uk
220     Alerter.EMail.smtpServer = mercury.ukc.ac.uk
221 ajm 1.16 Alerter.EMail.subject = i-scream alert: %level% alert on %source% for %attributeName%
222     Alerter.EMail.message = The i-scream distributed central monitoring system has\nraised a %level% alert for the host %source%.\n\nThe value for %attributeName% of %value% has exceeded the\n%threshold% threshold value of %thresholdValue%.\n\nThe next alert (should one occur) will be sent in %timeTillNextAlert%.
223 ajm 1.14
224     # IRC alerter configuration
225 ajm 1.16 Alerter.IRC.level = OK
226 ajm 1.14 Alerter.IRC.IRCServer = killigrew.ukc.ac.uk
227     Alerter.IRC.IRCPort = 6667
228 tdb 1.19 Alerter.IRC.nickList = iscreamBot;_iscreamBot;i-screamBot
229 tdb 1.17 Alerter.IRC.user = i-scream
230     Alerter.IRC.comment = i-scream alerting bot
231 ajm 1.14 Alerter.IRC.channel = #i-scream
232 ajm 1.16 Alerter.IRC.message = %level%: %attributeName% on %source% has passed %threshold%(%thresholdValue%) threshold with %value% - time till next alert (should one occur), %timeTillNextAlert%
233 tdb 1.17 Alerter.IRC.reconnectDelay = 30
234     Alerter.IRC.startupNotice = i-scream alerting bot activated
235     Alerter.IRC.stopCommand = stop alerts
236     Alerter.IRC.startCommand = start alerts
237     Alerter.IRC.lastAlertCommand = last alert
238     Alerter.IRC.joinCommand = join
239 tdb 1.18 Alerter.IRC.nickChangeCommand = nick
240     Alerter.IRC.statCommand = statistics
241     Alerter.IRC.uptimeCommand = uptime
242     Alerter.IRC.timeSinceLastAlertCommand = time since last alert
243 tdb 1.19 Alerter.IRC.versionCommand = version
244 tdb 1.17 Alerter.IRC.helpCommand = help
245     Alerter.IRC.rejectMessage = sorry, I don't understand your request
246 ajm 1.16
247 tdb 1.17 ############################################################
248 ajm 1.16