| 18 |  | Host.chert.ukc.ac.uk;Host.granite.ukc.ac.uk;Host.jade.ukc.ac.uk;Host.jasper.ukc.ac.uk;\ | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 19 |  | Host.magnetite.ukc.ac.uk;Host.obsidian.ukc.ac.uk;Host.pumice.ukc.ac.uk;\ | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 20 |  | Host.pyrite.ukc.ac.uk;Host.slate.ukc.ac.uk;Host.topaz.ukc.ac.uk; | 
 
 
 
 
 
 
 
 | 21 | + | group.compsoc=Host.compsoc1.ukc.ac.uk | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 22 |  |  | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 23 |  | config.computing=computing.conf | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 24 |  | config.rocks=rocks.conf | 
 
 
 
 
 
 
 
 | 25 | + | config.compsoc1=rocks.conf | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 26 |  |  | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 27 |  | # for library machines | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 28 |  | group.library=Host.129.12.58.*; | 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 | 58 |  | # The default port to listen for new host connections | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 59 |  | FilterManager.listenPort=4567 | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 60 |  |  | 
 
 
 
 
 
 
 
 | 61 | + | # Access control list | 
 
 
 
 
 
 
 
 | 62 | + | FilterManager.ACL=DEFAULT:DENY;*.ukc.ac.uk:ALLOW;129.12.*:ALLOW | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 63 |  |  | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 64 |  |  | 
 
 
 
 
 
 
 
 | 65 | + |  | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 66 |  | ############################################################ | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 67 |  | #### Filter configuration | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 68 |  | ############################################################ | 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 | 72 |  | Filter.TCPListenPort=4589 | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 73 |  |  | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 74 |  | # Plugin Information | 
 
 
 
 
 
 
 
 
 
 
 | 75 | < | Filter.PluginsPackage=uk.org.iscream.filter.plugins | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 76 | < | Filter.Plugins=TypeChecker;EnforceEssentialData | 
 
 
 
 
 
 
 
 
 | 75 | > | Filter.PluginsPackage=uk.org.iscream.cms.server.filter.plugins | 
 
 
 
 
 | 76 | > | Filter.Plugins=TypeChecker;EnforceEssentialData;SourceChecker;KeyChecker | 
 
 
 
 
 
 
 
 
 
 
 | 77 |  |  | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 78 |  | # The name for the root filter | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 79 |  | RootFilter.name=root | 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 | 81 |  | # The default parent filter (should almost always be the same as Filter.rootFilter) | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 82 |  | Filter.parentFilter=root | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 83 |  |  | 
 
 
 
 
 
 
 
 | 84 | + | # The input methods to activate | 
 
 
 
 
 
 
 
 | 85 | + | # (comment or set to 0 to disable) | 
 
 
 
 
 
 
 
 | 86 | + | Filter.ActivateTCPReader=1 | 
 
 
 
 
 
 
 
 | 87 | + | Filter.ActivateUDPReader=1 | 
 
 
 
 
 
 
 
 | 88 | + | Filter.ActivateCORBAReader=1 | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 89 |  |  | 
 
 
 
 
 
 
 
 | 90 | + | # Access control list for the TCP and UDP inputs | 
 
 
 
 
 
 
 
 | 91 | + | Filter.TCPACL=DEFAULT:DENY;*.ukc.ac.uk:ALLOW;129.12.*:ALLOW | 
 
 
 
 
 
 
 
 | 92 | + | Filter.UDPACL=DEFAULT:DENY;*.ukc.ac.uk:ALLOW;129.12.*:ALLOW | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 93 |  |  | 
 
 
 
 
 
 
 
 | 94 | + | # Access control list for the SourceChecker plugin | 
 
 
 
 
 
 
 
 | 95 | + | #   - packets not permitted by this ACL will be filtered | 
 
 
 
 
 
 
 
 | 96 | + | Filter.SourceCheckerPluginACL=DEFAULT:DENY;*.ukc.ac.uk:ALLOW;129.12.*:ALLOW | 
 
 
 
 
 
 
 
 | 97 | + |  | 
 
 
 
 
 
 
 
 | 98 | + | # Enforce host authentication? | 
 
 
 
 
 
 
 
 | 99 | + | # (comment or set to 0 to disable) | 
 
 
 
 
 
 
 
 | 100 | + | Filter.EnforceHostAuth=1 | 
 
 
 
 
 
 
 
 | 101 | + |  | 
 
 
 
 
 
 
 
 | 102 | + |  | 
 
 
 
 
 
 
 
 | 103 | + |  | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 104 |  | ############################################################ | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 105 |  | #### Root filter interfaces configuration | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 106 |  | ############################################################ | 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 | 118 |  |  | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 119 |  | # The port for the client interface to listen on | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 120 |  | ClientInterface.listenPort=4510 | 
 
 
 
 
 
 
 
 | 121 | + | # The name for the client interface | 
 
 
 
 
 
 
 
 | 122 | + | ClientInterface.name=realtimeclients | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 123 |  |  | 
 
 
 
 
 
 
 
 | 124 | + | # Access Control List for TCP Clients | 
 
 
 
 
 
 
 
 | 125 | + | ClientInterface.TCPControlChannelACL=DEFAULT:DENY;*.ukc.ac.uk:ALLOW;129.12.*:ALLOW | 
 
 
 
 
 
 
 
 | 126 | + | ClientInterface.TCPDataChannelACL=DEFAULT:DENY;*.ukc.ac.uk:ALLOW;129.12.*:ALLOW | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 127 |  |  | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 128 |  |  | 
 
 
 
 
 
 
 
 | 129 | + |  | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 130 |  | ############################################################ | 
 
 
 
 
 
 
 
 | 131 | + | #### Database interface configuration | 
 
 
 
 
 
 
 
 | 132 | + | ############################################################ | 
 
 
 
 
 
 
 
 | 133 | + |  | 
 
 
 
 
 
 
 
 | 134 | + | # The name for the Database interface | 
 
 
 
 
 
 
 
 | 135 | + | DBInterface.name=database | 
 
 
 
 
 
 
 
 | 136 | + |  | 
 
 
 
 
 
 
 
 | 137 | + |  | 
 
 
 
 
 
 
 
 | 138 | + |  | 
 
 
 
 
 
 
 
 | 139 | + | ############################################################ | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 140 |  | #### Host Configuration | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 141 |  | ############################################################ | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 142 |  |  | 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 | 146 |  | # The default update times for a new host | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 147 |  | Host.UDPUpdateTime=10 | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 148 |  | Host.TCPUpdateTime=60 | 
 
 
 
 
 
 
 
 
 | 111 | – | Host.AveragerUpdateTime=5 | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 149 |  |  | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 150 |  | # The services checks to run on a host | 
 
 
 
 
 
 
 
 
 
 
 | 151 | < | Host.serviceChecksPackage=uk.org.iscream.filter.plugins | 
 
 
 
 
 
 
 
 
 | 151 | > | Host.serviceChecksPackage=uk.org.iscream.cms.server.filter.plugins | 
 
 
 
 
 
 
 
 
 
 
 | 152 |  |  | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 153 |  |  | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 154 |  |  | 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 | 156 |  | #### Monitor Configuration | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 157 |  | ############################################################ | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 158 |  |  | 
 
 
 
 
 
 
 
 
 
 
 | 159 | < | # the monitors to run | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 160 | < | Monitor.PluginsPackage=uk.org.iscream.client.monitors | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 161 | < | Monitor.Plugins=CPU;Disk;Memory;Swap;Services;Heartbeat;WebFeeder; | 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 | 159 | > | ## The monitors to run | 
 
 
 
 
 | 160 | > | Monitor.PluginsPackage=uk.org.iscream.cms.server.client.monitors | 
 
 
 
 
 | 161 | > | Monitor.Plugins=CPU;Load;Process;Disk;Memory;Swap;Services;\ | 
 
 
 
 
 | 162 | > | Heartbeat;Queue;UserCount;WebFeeder; | 
 
 
 
 
 
 
 
 
 
 
 | 163 |  |  | 
 
 
 
 
 
 
 
 | 164 | + | ## Default alert timeouts | 
 
 
 
 
 
 
 
 | 165 | + | # these can be overridden on a per-monitor basis | 
 
 
 
 
 
 
 
 | 166 | + | # timings of the alerts (in seconds) | 
 
 
 
 
 
 
 
 | 167 | + | Monitor.alertTimeout.NOTICE=60 | 
 
 
 
 
 
 
 
 | 168 | + | Monitor.alertTimeout.WARNING=900 | 
 
 
 
 
 
 
 
 | 169 | + | Monitor.alertTimeout.CAUTION=1800 | 
 
 
 
 
 
 
 
 | 170 | + | Monitor.alertTimeout.CRITICAL=3600 | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 171 |  |  | 
 
 
 
 
 
 
 
 
 
 
 | 172 | < | ## CPU monitor configuration | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 128 | < | # threshold values | 
 
 
 
 
 
 
 
 
 | 172 | > | ## Threshold values | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 173 |  | # | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 174 |  | # note: if the UPPER threshold is broken, | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 175 |  | # the alertTimeout values are halved. | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 176 |  | # This is to escalate the alert quicker. | 
 
 
 
 
 
 
 
 | 177 | + | # | 
 
 
 
 
 
 
 
 | 178 | + |  | 
 
 
 
 
 
 
 
 | 179 | + | # CPU monitor threshold values | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 180 |  | Monitor.CPU.threshold.LOWER=90 | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 181 |  | Monitor.CPU.threshold.UPPER=99 | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 182 |  |  | 
 
 
 
 
 
 
 
 
 | 136 | – | # timings of the alerts (in seconds) | 
 
 
 
 
 
 
 
 
 | 137 | – | Monitor.CPU.alertTimeout.NOTICE=60 | 
 
 
 
 
 
 
 
 
 | 138 | – | Monitor.CPU.alertTimeout.WARNING=900 | 
 
 
 
 
 
 
 
 
 | 139 | – | Monitor.CPU.alertTimeout.CAUTION=1800 | 
 
 
 
 
 
 
 
 
 | 140 | – | Monitor.CPU.alertTimeout.CRITICAL=3600 | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 183 |  |  | 
 
 
 
 
 
 
 
 | 184 | + | # Load monitor threshold values | 
 
 
 
 
 
 
 
 | 185 | + | Monitor.Load.threshold.LOWER=10.0 | 
 
 
 
 
 
 
 
 | 186 | + | Monitor.Load.threshold.UPPER=20.0 | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 187 |  |  | 
 
 
 
 
 
 
 
 
 
 
 | 188 | < | ## Memory monitor configuration | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 189 | < | # threshold values | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 190 | < | # | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 191 | < | # note: if the UPPER threshold is broken, | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 192 | < | # the alertTimeout values are halved. | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 193 | < | # This is to escalate the alert quicker. | 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 | 188 | > |  | 
 
 
 
 
 | 189 | > | # Process Count threshold values | 
 
 
 
 
 | 190 | > | Monitor.Process.threshold.LOWER=1000 | 
 
 
 
 
 | 191 | > | Monitor.Process.threshold.UPPER=1500 | 
 
 
 
 
 | 192 | > |  | 
 
 
 
 
 | 193 | > |  | 
 
 
 
 
 | 194 | > | # Memory monitor threshold values | 
 
 
 
 
 
 
 
 
 
 
 | 195 |  | Monitor.Memory.threshold.LOWER=80 | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 196 |  | Monitor.Memory.threshold.UPPER=90 | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 197 |  |  | 
 
 
 
 
 
 
 
 
 | 152 | – | # timings of the alerts (in seconds) | 
 
 
 
 
 
 
 
 
 | 153 | – | Monitor.Memory.alertTimeout.NOTICE=60 | 
 
 
 
 
 
 
 
 
 | 154 | – | Monitor.Memory.alertTimeout.WARNING=900 | 
 
 
 
 
 
 
 
 
 | 155 | – | Monitor.Memory.alertTimeout.CAUTION=1800 | 
 
 
 
 
 
 
 
 
 | 156 | – | Monitor.Memory.alertTimeout.CRITICAL=3600 | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 198 |  |  | 
 
 
 
 
 
 
 
 
 
 
 | 199 | < |  | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 159 | < | ## Swap monitor configuration | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 160 | < | # threshold values | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 161 | < | # | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 162 | < | # note: if the UPPER threshold is broken, | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 163 | < | # the alertTimeout values are halved. | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 164 | < | # This is to escalate the alert quicker. | 
 
 
 
 
 
 
 
 
 | 199 | > | # Swap monitor threshold values | 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 | 200 |  | Monitor.Swap.threshold.LOWER=80 | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 201 |  | Monitor.Swap.threshold.UPPER=90 | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 202 |  |  | 
 
 
 
 
 
 
 
 
 | 168 | – | # timings of the alerts (in seconds) | 
 
 
 
 
 
 
 
 
 | 169 | – | Monitor.Swap.alertTimeout.NOTICE=60 | 
 
 
 
 
 
 
 
 
 | 170 | – | Monitor.Swap.alertTimeout.WARNING=900 | 
 
 
 
 
 
 
 
 
 | 171 | – | Monitor.Swap.alertTimeout.CAUTION=1800 | 
 
 
 
 
 
 
 
 
 | 172 | – | Monitor.Swap.alertTimeout.CRITICAL=3600 | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 203 |  |  | 
 
 
 
 
 
 
 
 | 204 | + | # UserCount monitor threshold values | 
 
 
 
 
 
 
 
 | 205 | + | Monitor.UserCount.threshold.LOWER=100 | 
 
 
 
 
 
 
 
 | 206 | + | Monitor.UserCount.threshold.UPPER=200 | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 207 |  |  | 
 
 
 
 
 
 
 
 
 | 175 | – | ## Disk monitor configuration | 
 
 
 
 
 
 
 
 
 | 176 | – | # threshold values | 
 
 
 
 
 
 
 
 
 | 177 | – | # | 
 
 
 
 
 
 
 
 
 | 178 | – | # note: if the UPPER threshold is broken, | 
 
 
 
 
 
 
 
 
 | 179 | – | # the alertTimeout values are halved. | 
 
 
 
 
 
 
 
 
 | 180 | – | # This is to escalate the alert quicker. | 
 
 
 
 
 
 
 
 
 | 181 | – | Monitor.Disk.threshold.LOWER=80 | 
 
 
 
 
 
 
 
 
 | 182 | – | Monitor.Disk.threshold.UPPER=90 | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 208 |  |  | 
 
 
 
 
 
 
 
 
 
 
 | 209 | < | # timings of the alerts (in seconds) | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 210 | < | Monitor.Disk.alertTimeout.NOTICE=60 | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 211 | < | Monitor.Disk.alertTimeout.WARNING=900 | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 212 | < | Monitor.Disk.alertTimeout.CAUTION=1800 | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 213 | < | Monitor.Disk.alertTimeout.CRITICAL=3600 | 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 | 209 | > | # Disk monitor threshold values | 
 
 
 
 
 | 210 | > | Monitor.Disk.threshold.LOWER=90 | 
 
 
 
 
 | 211 | > | Monitor.Disk.threshold.UPPER=95 | 
 
 
 
 
 | 212 | > | # Thresholds given are PERCENTAGE or VALUE | 
 
 
 
 
 | 213 | > | # where PERCENTAGE is a percentage of disk in use | 
 
 
 
 
 | 214 | > | # and VALUE is an absolute value of space free | 
 
 
 
 
 | 215 | > | Monitor.Disk.thresholdMeasure=PERCENTAGE | 
 
 
 
 
 
 
 
 
 
 
 | 216 |  |  | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 217 |  |  | 
 
 
 
 
 
 
 
 
 
 
 | 218 | < | ## Services monitor configuration | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 219 | < | # threshold values | 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 | 218 | > | # Queue monitor threshold values | 
 
 
 
 
 | 219 | > | Monitor.Queue.threshold.LOWER=50 | 
 
 
 
 
 | 220 | > | Monitor.Queue.threshold.UPPER=80 | 
 
 
 
 
 | 221 | > | # Thresholds given are PERCENTAGE or VALUE | 
 
 
 
 
 | 222 | > | # where PERCENTAGE is a percentage of the queue in use | 
 
 
 
 
 | 223 | > | # and VALUE is an absolute value of space free | 
 
 
 
 
 | 224 | > | Monitor.Queue.thresholdMeasure=PERCENTAGE | 
 
 
 
 
 | 225 | > |  | 
 
 
 
 
 | 226 | > |  | 
 
 
 
 
 | 227 | > | # Services monitor threshold values | 
 
 
 
 
 
 
 
 
 
 
 | 228 |  | # | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 229 |  | # THE SERVICES MONITOR USES A HACK | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 230 |  | # WHEREBY IT USES THE SERVICE STATUS | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 231 |  | # AS THE THRESHOLD LEVEL.  THIS SHOULD | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 232 |  | # BE LOOKED AT! | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 233 |  | # | 
 
 
 
 
 
 
 
 
 
 
 | 234 | < | # note: if the UPPER threshold is broken, | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 235 | < | # the alertTimeout values are halved. | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 201 | < | # This is to escalate the alert quicker. | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 202 | < | #Monitor.Services.threshold.LOWER=120 | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 203 | < | #Monitor.Services.threshold.LOWER=300 | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 204 | < |  | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 205 | < | # timings of the alerts (in seconds) | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 206 | < | Monitor.Services.alertTimeout.NOTICE=60 | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 207 | < | Monitor.Services.alertTimeout.WARNING=900 | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 208 | < | Monitor.Services.alertTimeout.CAUTION=1800 | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 209 | < | Monitor.Services.alertTimeout.CRITICAL=3600 | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 210 | < |  | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 211 | < | # Make sure we shut up eventually | 
 
 
 
 
 
 
 
 
 | 234 | > | # how many times we should be at the highest level before | 
 
 
 
 
 | 235 | > | # we go to a FINAL alert | 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 | 236 |  | Monitor.Services.reachFINALcount=5 | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 237 |  |  | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 238 |  |  | 
 
 
 
 
 
 
 
 
 
 
 | 239 | < | ## Heartbeat monitor configuration | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 216 | < | # threshold values | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 217 | < | # | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 218 | < | # note: if the UPPER threshold is broken, | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 219 | < | # the alertTimeout values are halved. | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 220 | < | # This is to escalate the alert quicker. | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 221 | < | Monitor.Heartbeat.checkPeriod=50 | 
 
 
 
 
 
 
 
 
 | 239 | > | # Heartbeat threshold values | 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 | 240 |  | # these are values in seconds from when the heartbeat | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 241 |  | # was *expected* to arrive (ie. last + heartbeat period) | 
 
 
 
 
 
 
 
 
 
 
 | 242 | < | Monitor.Heartbeat.threshold.LOWER=120 | 
 
 
 
 
 
 
 
 
 | 242 | > | Monitor.Heartbeat.threshold.LOWER=180 | 
 
 
 
 
 
 
 
 
 
 
 | 243 |  | Monitor.Heartbeat.threshold.UPPER=300 | 
 
 
 
 
 
 
 
 | 244 | + | # this is how often we will run a "check" of heartbeats | 
 
 
 
 
 
 
 
 | 245 | + | Monitor.Heartbeat.checkPeriod=50 | 
 
 
 
 
 
 
 
 | 246 | + | # how many times we should be at the highest level before | 
 
 
 
 
 
 
 
 | 247 | + | # we go to a FINAL alert | 
 
 
 
 
 
 
 
 | 248 | + | Monitor.Heartbeat.reachFINALcount=5 | 
 
 
 
 
 
 
 
 | 249 | + | # list of hosts we expect to have at startup | 
 
 
 
 
 
 
 
 | 250 | + | # this ensures we notice hosts that aren't running, not | 
 
 
 
 
 
 
 
 | 251 | + | # just those that have gone down recently. | 
 
 
 
 
 
 
 
 | 252 | + | Monitor.Heartbeat.initialHosts=raptor.ukc.ac.uk;myrtle.ukc.ac.uk;kestrel.ukc.ac.uk | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 253 |  |  | 
 
 
 
 
 
 
 
 
 | 227 | – | # timings of the alerts (in seconds) | 
 
 
 
 
 
 
 
 
 | 228 | – | Monitor.Heartbeat.alertTimeout.NOTICE=60 | 
 
 
 
 
 
 
 
 
 | 229 | – | Monitor.Heartbeat.alertTimeout.WARNING=900 | 
 
 
 
 
 
 
 
 
 | 230 | – | Monitor.Heartbeat.alertTimeout.CAUTION=1800 | 
 
 
 
 
 
 
 
 
 | 231 | – | Monitor.Heartbeat.alertTimeout.CRITICAL=3600 | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 254 |  |  | 
 
 
 
 
 
 
 
 
 | 233 | – | # this means it will reach a FINAL level, | 
 
 
 
 
 
 
 
 
 | 234 | – | # and thus the host will be removed from the monitor list, | 
 
 
 
 
 
 
 
 
 | 235 | – | # if the highest level alert is reached and occours this | 
 
 
 
 
 
 
 
 
 | 236 | – | # number of times. | 
 
 
 
 
 
 
 
 
 | 237 | – | # | 
 
 
 
 
 
 
 
 
 | 238 | – | # int this setup, that means 5 CRITICAL alerts would occour | 
 
 
 
 
 
 
 
 
 | 239 | – | # on a Heartbeat before reaching FINAL. | 
 
 
 
 
 
 
 
 
 | 240 | – | # If this value is wrong or not present, FINAL is never reached | 
 
 
 
 
 
 
 
 
 | 241 | – | # | 
 
 
 
 
 
 
 
 
 | 242 | – | Monitor.Heartbeat.reachFINALcount=5 | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 255 |  |  | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 256 |  | ############################################################ | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 257 |  | #### Alerter Configuration | 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 | 270 |  | # | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 271 |  |  | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 272 |  | # alerters to run | 
 
 
 
 
 
 
 
 
 
 
 | 273 | < | Alerter.PluginsPackage=uk.org.iscream.client.alerters | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 274 | < | Alerter.Plugins=EMail;IRC;WebFeeder; | 
 
 
 
 
 
 
 
 
 | 273 | > | Alerter.PluginsPackage=uk.org.iscream.cms.server.client.alerters | 
 
 
 
 
 | 274 | > | Alerter.Plugins=EMail;IRC;WebFeeder;Logging; | 
 
 
 
 
 
 
 
 
 
 
 | 275 |  |  | 
 
 
 
 
 
 
 
 | 276 | + |  | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 277 |  | # EMail alerter configuration | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 278 |  | Alerter.EMail.level = WARNING | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 279 |  | Alerter.EMail.destList = dev@i-scream.org.uk | 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 | 289 |  | Alerter.IRC.IRCPort = 6667 | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 290 |  | Alerter.IRC.nickList = iscreamBot;_iscreamBot;i-screamBot | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 291 |  | Alerter.IRC.user = i-scream | 
 
 
 
 
 
 
 
 
 
 
 | 292 | < | Alerter.IRC.comment = i-scream alerting bot | 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 | 292 | > | Alerter.IRC.comment = i-scream alerting bot (based on PircBot) | 
 
 
 
 
 | 293 | > | Alerter.IRC.finger = i-scream alerting bot (based on PircBot) | 
 
 
 
 
 
 
 
 
 
 
 | 294 |  | Alerter.IRC.channel = #i-scream | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 295 |  | Alerter.IRC.message = %level%: %attributeName% on %source% has passed %threshold%(%thresholdValue%) threshold with %value% - time till next alert (should one occur), %timeTillNextAlert% | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 296 |  | Alerter.IRC.reconnectDelay = 30 | 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 | 307 |  | Alerter.IRC.helpCommand = help | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 308 |  | Alerter.IRC.rejectMessage = sorry, I don't understand your request | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 309 |  |  | 
 
 
 
 
 
 
 
 | 310 | + |  | 
 
 
 
 
 
 
 
 | 311 | + | # Logging alerter configuration | 
 
 
 
 
 
 
 
 | 312 | + | Alerter.Logging.level = WARNING | 
 
 
 
 
 
 
 
 | 313 | + | Alerter.Logging.message = %level%: %attributeName% on %source% has passed %threshold%(%thresholdValue%) threshold with %value% | 
 
 
 
 
 
 
 
 | 314 | + |  | 
 
 
 
 
 
 
 
 | 315 | + |  | 
 
 
 
 
 
 
 
 | 316 | + |  | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 317 |  | ############################################################ | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 318 |  | #### WebFeeder Configuration | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 319 |  | ############################################################ | 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 | 323 |  | WebFeeder.latestActive = true | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 324 |  | WebFeeder.alertActive = true | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 325 |  |  | 
 
 
 
 
 
 
 
 | 326 | + | # Only pass on alerts past this level | 
 
 
 
 
 
 
 
 | 327 | + | Alerter.WebFeeder.level = OK | 
 
 
 
 
 
 
 
 | 328 | + |  | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 329 |  | # Check period in seconds (for cleaning stale/old alerts) | 
 
 
 
 
 
 
 
 
 
 
 | 330 | < | WebFeeder.checkPeriod = 900 | 
 
 
 
 
 
 
 
 
 | 330 | > | WebFeeder.checkPeriod = 120 | 
 
 
 
 
 
 
 
 
 
 
 | 331 |  |  | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 332 |  | # Delete alerts older than this, in seconds. | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 333 |  | # Files are only checked every WebFeeder.checkPeriod seconds. | 
 
 
 
 
 
 
 
 
 
 
 | 334 | < | WebFeeder.alertDeleteOlderThan = 1800 | 
 
 
 
 
 
 
 
 
 | 334 | > | WebFeeder.alertDeleteOlderThan = 300 | 
 
 
 
 
 
 
 
 
 
 
 | 335 |  |  | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 336 |  | # Root Path | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 337 |  | WebFeeder.rootPath = /usr/local/proj/co600_10/webroot | 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 | 344 |  | WebFeeder.alertSubDir = alert | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 345 |  | WebFeeder.alertFileName = alert_data | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 346 |  |  | 
 
 
 
 
 
 
 
 
 | 323 | – | ############################################################ | 
 
 
 
 
 
 
 
 
 
 
 
 
 | 347 |  |  | 
 
 
 
 
 
 
 
 | 348 | + | ############################################################ |