ViewVC Help
View File | Revision Log | Show Annotations | Revision Graph | Root Listing
root/i-scream/projects/cms/source/host/ihost-perl/ihost.pl
(Generate patch)

Comparing projects/cms/source/host/ihost-perl/ihost.pl (file contents):
Revision 1.11 by pjm2, Thu Feb 1 09:10:52 2001 UTC vs.
Revision 1.50 by tdb, Tue May 21 16:47:11 2002 UTC

# Line 1 | Line 1
1   #!/usr/bin/perl -w
2  
3 + #
4 + # i-scream central monitoring system
5 + # http://www.i-scream.org.uk
6 + # Copyright (C) 2000-2002 i-scream
7 + #
8 + # This program is free software; you can redistribute it and/or
9 + # modify it under the terms of the GNU General Public License
10 + # as published by the Free Software Foundation; either version 2
11 + # of the License, or (at your option) any later version.
12 + #
13 + # This program is distributed in the hope that it will be useful,
14 + # but WITHOUT ANY WARRANTY; without even the implied warranty of
15 + # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
16 + # GNU General Public License for more details.
17 + #
18 + # You should have received a copy of the GNU General Public License
19 + # along with this program; if not, write to the Free Software
20 + # Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA  02111-1307, USA.
21 + #
22 +
23   # -----------------------------------------------------------
24   # Perl i-scream Host.
25 + # http://www.i-scream.org.uk
26   #
27   # An all-in-one script to act as an i-scream host on
28 < # a typical Unix/Linux box.  You may adapt the data-gathering
8 < # methods as you see fit.
9 < #  - pjm2@ukc.ac.uk
28 > # a typical Unix/Linux box.
29   #
30   # $Author$
31   # $Id$
# Line 31 | Line 50 | use vars qw (
50               $tcp_port
51               $filter_addr
52               $file_list
53 +             $fqdn
54 +             $pidfile
55 +             $retry_wait
56 +             $ostype
57 +             $key
58 +             @data
59              );
60  
61   if (@ARGV != 2) {
# Line 41 | Line 66 | $filter_manager_addr = $ARGV[0];
66   $filter_manager_port = $ARGV[1];
67  
68   $seq_no = 1;
69 + $retry_wait = 60;
70  
71 + # work out our platform, if we can.
72 + $ostype = `uname -s`;
73 + chomp $ostype;
74 + $ostype = "unknown" if not defined $ostype;
75 +
76 + # write our PID to a file
77 + # use home dir by default
78 + #$pidfile = $ENV{"HOME"};
79 + # or drop it in /var/tmp if we can't find HOME
80 + $pidfile = "/var/tmp" if not defined $pidfile;
81 + $pidfile .= "/.ihost.pid";
82 + &write_pid();
83 +
84   &tcp_configure();
85 + &send_tcp_heartbeat();
86   &send_udp_packet();
87  
88   $last_udp_time = time;
# Line 66 | Line 106 | while (1) {
106      else {
107          $delay = $next_tcp;
108      }
109 <    `sleep $delay`;
109 >    sleep $delay;
110   }
111  
112 + # we'll probably never get here...
113 + `rm -f $pidfile`;
114   exit(0);
115  
116 +
117 + #-----------------------------------------------------------------------
118 + # wait_then_retry
119 + # Waits for the period of time specified in $retry_wait, then attempts
120 + # to reconfigure with the server.
121 + #-----------------------------------------------------------------------
122 + sub wait_then_retry() {
123 +    print "Will retry configuration with filter manager in $retry_wait seconds.\n";
124 +    sleep $retry_wait;
125 + }
126 +
127 +
128 + #-----------------------------------------------------------------------
129 + # tcp_configure
130 + # Establishes a TCP connection to the specified i-scream filter manager.
131 + # The host then requests details from the server, such as the intervals
132 + # at which to send UDP packets.
133 + #-----------------------------------------------------------------------
134   sub tcp_configure() {
135      
136 <    my($sock) = new IO::Socket::INET(
137 <                                     PeerAddr => $filter_manager_addr,
138 <                                     PeerPort => $filter_manager_port,
139 <                                     Proto => 'tcp'
140 <                                    );
141 <    if (!defined $sock) {
142 <        print "IHOST ERROR: Could not connect to $filter_manager_addr:$filter_manager_port.\n";
143 <        print "Please check that there is an i-scream server at this address.\n";
144 <        print "Program ended.\n";
145 <        exit(1);
146 <    }
136 >    while (1) {
137 >        my($sock) = new IO::Socket::INET(
138 >                                         PeerAddr => $filter_manager_addr,
139 >                                         PeerPort => $filter_manager_port,
140 >                                         Proto => 'tcp'
141 >                                        ) or die "Cannot connect!";
142 >        if (!defined $sock) {
143 >            print "IHOST ERROR: Could not connect to $filter_manager_addr:$filter_manager_port.\n";
144 >            print "Please check that there is an i-scream server at this address.\n";
145 >            wait_then_retry();
146 >            next;
147 >        }
148  
149 <    # Now run through the configuration process.
150 <    my($response);
149 >        # Now run through the configuration process...
150 >        my($response);
151      
152 <    print $sock "STARTCONFIG\n";
153 <    $response = <$sock>;
154 <    if (!chop $response eq "OK") {
155 <        print "The i-scream server rejected the STARTCONFIG command.  Terminated.";
156 <        exit(1);
157 <    }
152 >        print $sock "STARTCONFIG\n";
153 >        $response = <$sock>;
154 >        if ($response && !($response eq "OK\n")) {
155 >            print "The i-scream server rejected the STARTCONFIG command.\n";
156 >            close($sock);
157 >            wait_then_retry();
158 >            next;
159 >        }
160  
161 <    print "Config started okay.\n";
161 >        print "Config started okay.\n";
162      
163 <    print $sock "LASTMODIFIED\n";
164 <    $response = <$sock>;
165 <    chop $response;
166 <    $last_modified = $response;
163 >        print $sock "LASTMODIFIED\n";
164 >        $response = <$sock>;
165 >        if (!$response || $response eq "ERROR\n") {
166 >            print "The i-scream server did not provide the LASTMODIFIED value.\n";
167 >            close($sock);
168 >            wait_then_retry();
169 >            next;
170 >        }
171 >        chomp $response;
172 >        $last_modified = $response;
173      
174 <    print "Config last modified: ". (scalar localtime $last_modified/1000) . "\n";
174 >        print "Config last modified: ". (scalar localtime $last_modified/1000) . "\n";
175  
176 <    print $sock "FILELIST\n";
177 <    $response = <$sock>;
178 <    chop $response;
179 <    $file_list = $response;
176 >        print $sock "FILELIST\n";
177 >        $response = <$sock>;
178 >        if (!$response || $response eq "ERROR\n") {
179 >            print "The i-scream server did not provide a configuration file list.\n";
180 >            close($sock);
181 >            wait_then_retry();
182 >            next;
183 >        }
184 >        chomp $response;
185 >        $file_list = $response;
186  
187 <    print "File list obtained: $file_list\n";
187 >        print "File list obtained: $file_list\n";
188  
189 <    print $sock "UDPUpdateTime\n";
190 <    $response = <$sock>;
191 <    chop $response;
192 <    $udp_update_time = $response;
189 >        print $sock "FQDN\n";
190 >        $response = <$sock>;
191 >        if (!$response || $response eq "ERROR\n") {
192 >            print "The i-scream server did not tell us our FQDN.\n";
193 >            close($sock);
194 >            wait_then_retry();
195 >            next;
196 >        }
197 >        chomp $response;
198 >        $fqdn = $response;
199  
200 <    print $sock "TCPUpdateTime\n";
201 <    $response = <$sock>;
202 <    chop $response;
203 <    $tcp_update_time = $response;
200 >        print "FQDN returned: $fqdn\n";
201 >
202 >        print $sock "UDPUpdateTime\n";
203 >        $response = <$sock>;
204 >        if (!$response || $response eq "ERROR\n") {
205 >            print "The i-scream server did not give us a UDPUpdateTime.\n";
206 >            close($sock);
207 >            wait_then_retry();
208 >            next;
209 >        }
210 >        chomp $response;
211 >        $udp_update_time = $response;
212 >
213 >        print $sock "TCPUpdateTime\n";
214 >        $response = <$sock>;
215 >        if (!$response || $response eq "ERROR\n") {
216 >            print "The i-scream server did not give us a TCPUpdateTime.\n";
217 >            close($sock);
218 >            wait_then_retry();
219 >            next;
220 >        }
221 >        chomp $response;
222 >        $tcp_update_time = $response;
223      
224 <    print "UDP packet period: $udp_update_time seconds.\nTCP heartbeat period: $tcp_update_time seconds.\n";
224 >        print "UDP packet period: $udp_update_time seconds.\nTCP heartbeat period: $tcp_update_time seconds.\n";
225  
226 <    print $sock "ENDCONFIG\n";
227 <    $response = <$sock>;
228 <    chomp $response;
229 <    if (!$response eq "OK") {
230 <        print "ENDCONFIG command to server failed.  Terminated.\n";
231 <        exit(1);
232 <    }
226 >        print $sock "ENDCONFIG\n";
227 >        $response = <$sock>;
228 >        if ($response && !($response eq "OK\n")) {
229 >            print "ENDCONFIG command to server failed.  Terminated.\n";
230 >            close($sock);
231 >            wait_then_retry();
232 >            next;
233 >        }
234  
235 <    print "Config ended.\n";
235 >        print "Config ended.\n";
236      
237 <    print $sock "FILTER\n";
238 <    $response = <$sock>;
239 <    chop $response;
240 <    $response =~ /(.*);(.*);(.*)/;
241 <    ($filter_addr, $udp_port, $tcp_port) = ($1, $2, $3);
237 >        print $sock "FILTER\n";
238 >        $response = <$sock>;
239 >        if (!$response) {
240 >            print "Failed: Could not get a filter address from the filter manager.\n";
241 >            close($sock);
242 >            wait_then_retry();
243 >            next;
244 >        }
245 >        chomp $response;
246 >        if ($response eq "ERROR") {
247 >            print "There are no active configured filters for your host.\n";
248 >            close($sock);
249 >            wait_then_retry();
250 >            next;
251 >        }
252 >        $response =~ /^(.*);(.*);(.*)/;
253 >        ($filter_addr, $udp_port, $tcp_port) = ($1, $2, $3);
254 >        unless (defined($filter_addr) && defined($udp_port) && defined($tcp_port)) {
255 >            print "Failed: Filter address response from server did not make sense: $response\n";
256 >            close($sock);
257 >            wait_then_retry();
258 >            next;
259 >        }
260      
261 <    print "Got filter data ($filter_addr, $udp_port, $tcp_port)\n";
261 >        print "Got filter data ($filter_addr, $udp_port, $tcp_port)\n";
262  
263 <    print $sock "END\n";
264 <    $response = <$sock>;
265 <    chop $response;
266 <    if ($response eq "OK") {
267 <        print "Host successfully configured via TCP.\n"
268 <    }
269 <    else {
270 <        print "The server failed the host configuration on the END command.";
271 <        exit(1);
272 <    }
263 >        print $sock "END\n";
264 >        $response = <$sock>;
265 >        if ($response && ($response eq "OK\n")) {
266 >            print "Host successfully configured via TCP.\n"
267 >        }
268 >        else {
269 >            print "The server failed the host configuration on the END command.\n";
270 >            close($sock);
271 >            wait_then_retry();
272 >            next;
273 >        }
274      
275 <    close($sock);
275 >        close($sock);
276  
277 <    print "Configuration finished sucessfully!\n";
277 >        print "Configuration finished sucessfully!\n";
278 >        last;
279 >    }
280 >    return;
281   }
282  
283 +
284 + #-----------------------------------------------------------------------
285 + # send_udp_packet
286 + # Sends a UDP packet to an i-scream filter.
287 + # The packet contains XML markup describing some of the machine's state.
288 + # Receipt of UDP packets is not guaranteed.
289 + #-----------------------------------------------------------------------
290   sub send_udp_packet() {
291  
292 <    my(@statgrab) = `./statgrab.pl`;
293 <    my(%packet);
294 <    for (my($i) = 0; $i < $#statgrab; $i++) {
295 <        $statgrab[$i] =~ /^([^\s]*) (.*)$/;
296 <        $packet{$1} = $2;
292 >    my($plugins_dir) = "plugins";
293 >    
294 >    opendir PLUGINS, $plugins_dir;
295 >    my(@plugins) = readdir PLUGINS;
296 >    foreach my $plugin (@plugins) {
297 >        push @data, `$plugins_dir/$plugin $ostype` if -x "$plugins_dir/$plugin" && -f "$plugins_dir/$plugin";
298      }
299      
300 +    # get some extra data
301      my($date) = time;
302 +    my($ip);
303 +    $ip = inet_ntoa(scalar(gethostbyname(hostname())) || 'localhost') or $ip = 'localhost';
304      
305 <    my($disk_info) = "<disk>";
306 <    my($i) = 0;
307 <    while (defined $packet{"packet.disk.p$i.attributes.mount"}) {
308 <        $disk_info .= "<p$i>";
309 <        $disk_info .= qq/<name>$packet{"packet.disk.p$i.attributes.name"}<\/name>/;
310 <        $disk_info .= qq/<kbytes>$packet{"packet.disk.p$i.attributes.kbytes"}<\/kbytes>/;
311 <        $disk_info .= qq/<used>$packet{"packet.disk.p$i.attributes.used"}<\/used>/;
178 <        $disk_info .= qq/<avail>$packet{"packet.disk.p$i.attributes.avail"}<\/avail>/;
179 <        $disk_info .= qq/<mount>$packet{"packet.disk.p$i.attributes.mount"}<\/mount>/;
180 <        $disk_info .= "</p$i>";
181 <        ++$i;
182 <    }
183 <    $disk_info .= "</disk>";
184 <
185 <    my($hostname) = hostname();
186 <    $hostname =~ s/\..*$//g;
187 <    `cat /etc/resolv.conf` =~ /domain\s+([^\s]+)/;
188 <    my($domainname) = $1;
189 <    my($machine_name) = "$hostname.$domainname";
190 <    my($ip) = inet_ntoa(scalar(gethostbyname($hostname)) || 'localhost');
191 <
192 <    # Build the XML packet this way, as we can clearly
193 <    # see the structure and contents... I like this ;-)
194 <    my($xml) = <<EOF;
305 >    # add some extra data to the array
306 >    push(@data, "packet.attributes.seq_no $seq_no");
307 >    push(@data, "packet.attributes.machine_name $fqdn");
308 >    push(@data, "packet.attributes.date $date");
309 >    push(@data, "packet.attributes.type data");
310 >    push(@data, "packet.attributes.ip $ip");
311 >    push(@data, "packet.attributes.key $key");
312      
313 < <packet seq_no="$seq_no" machine_name="$machine_name" date="$date" type="data" ip="$ip">
314 <    <load>
198 <        <load1>$packet{"packet.load.load1"}</load1>
199 <        <load5>$packet{"packet.load.load5"}</load5>
200 <        <load15>$packet{"packet.load.load15"}</load15>
201 <    </load>
202 <    <os>
203 <        <name>$packet{"packet.os.name"}</name>
204 <        <release>$packet{"packet.os.release"}</release>
205 <        <platform>$packet{"packet.os.platform"}</platform>
206 <        <sysname>$packet{"packet.os.sysname"}</sysname>
207 <        <version>$packet{"packet.os.version"}</version>
208 <        <uptime>$packet{"packet.os.uptime"}</uptime>
209 <    </os>
210 <    <users>
211 <        <count>$packet{"packet.users.count"}</count>
212 <        <list>$packet{"packet.users.list"}</list>
213 <    </users>
214 <    <processes>
215 <        <total>$packet{"packet.processes.total"}</total>
216 <        <sleeping>$packet{"packet.processes.sleeping"}</sleeping>
217 <        <zombie>$packet{"packet.processes.zombie"}</zombie>
218 <        <stopped>$packet{"packet.processes.stopped"}</stopped>
219 <        <cpu>$packet{"packet.processes.cpu"}</cpu>
220 <    </processes>
221 <    <cpu>
222 <        <idle>$packet{"packet.cpu.idle"}</idle>
223 <        <user>$packet{"packet.cpu.user"}</user>
224 <        <kernel>$packet{"packet.cpu.kernel"}</kernel>
225 <        <iowait>$packet{"packet.cpu.iowait"}</iowait>
226 <        <swap>$packet{"packet.cpu.swap"}</swap>
227 <    </cpu>
228 <    <memory>
229 <        <total>$packet{"packet.memory.real"}</total>
230 <        <free>$packet{"packet.memory.free"}</free>
231 <    </memory>
232 <    <swap>
233 <        <total>$packet{"packet.memory.swap_total"}</total>
234 <        <free>$packet{"packet.memory.swap_free"}</free>
235 <    </swap>
236 <    $disk_info
237 < </packet>
313 >    # sort the data
314 >    @data = sort(grep(!/^$/, grep(/^packet\./, @data)));
315  
316 < EOF
316 >    # turn the array into some nice XML
317 >    my($xml) = &make_xml("", "");
318  
241 -    $xml =~ s/\n\s*//g;
242 -
319      my($sock) = new IO::Socket::INET (
320                                        PeerPort => $udp_port,
321                                        PeerAddr => $filter_addr,
322                                        Proto => 'udp'
323 <                                     ) or die "Socket: $!\n";
324 <
323 >                                     ) or die "Could not send UDP: $!\n";
324 >    
325      print $sock $xml or die "Could not send UDP packet: $!\n";
326      close($sock);
327      $seq_no++;
328      print "-";
329 +    
330 +    return;
331   }
332  
333 +
334 + #-----------------------------------------------------------------------
335 + # send_tcp_heartbeat
336 + # Establishes a TCP connection to an i-scream filter.
337 + # The heartbeat is used as a guaranteed "I'm alive" delivery mechanism.
338 + # If we need to reconfigure, then we complete the heartbeat before
339 + # doing so.
340 + #-----------------------------------------------------------------------
341   sub send_tcp_heartbeat() {
342  
343 +    my ($doReconfigure) = 0;
344 +
345      my($sock) = new IO::Socket::INET(
346                                       PeerAddr => $filter_addr,
347                                       PeerPort => $tcp_port,
348                                       Proto => 'tcp'
349 <                                    );
349 >                                    ) or return;
350      if (!defined $sock) {
351          print "IHOST WARNING: Failed to deliver a heartbeat to the i-scream filter.\n";
352 +        &tcp_configure();
353          return;
354      }
355  
# Line 269 | Line 358 | sub send_tcp_heartbeat() {
358  
359      print $sock "HEARTBEAT\n";
360      $response = <$sock>;
361 <    chop $response;
273 <    if (!$response eq "OK") {
361 >    if (!$response eq "OK\n") {
362          close($sock);
363          print "Server gave wrong response to HEARTBEAT: $response\n";
364 +        &tcp_configure();
365          return;
366      }
367      
368      print $sock "CONFIG\n";
369      $response = <$sock>;
370 <    chop $response;
282 <    if (!$response eq "OK") {
370 >    if (!$response eq "OK\n") {
371          close($sock);
372          print "Server gave wrong response to CONFIG: $response\n";
373 +        &tcp_configure();
374          return;
375      }
376  
377      print $sock "$file_list\n";
378      $response = <$sock>;
379 <    chop $response;
291 <    if (!$response eq "OK") {
379 >    if (!$response eq "OK\n") {
380          close($sock);
381          print "Server gave wrong response to file list: $response\n";
382 +        &tcp_configure();
383          return;
384      }
385      
386      print $sock "$last_modified\n";
387      $response = <$sock>;
388 <    chop $response;
300 <    if ($response eq "ERROR") {
388 >    if ($response eq "ERROR\n") {
389          close($sock);
390 <        &tcp_configure();
391 <        return;
390 >        print "Server configuration changed.  Reconfiguring with filter manager.\n";
391 >        $doReconfigure = 1;
392      }
393 <    if (!$response eq "OK") {
393 >    if (!$response eq "OK\n") {
394          close($sock);
395          print "Server gave wrong response to HEARTBEAT: $response\n";
396 +        &tcp_configure();
397          return;
398      }
399      
400 +    print $sock "KEY\n";
401 +    $key = <$sock>;
402 +    
403      print $sock "ENDHEARTBEAT\n";
404      $response = <$sock>;
405 <    chop $response;
314 <    if (!$response eq "OK") {
405 >    if (!$response eq "OK\n") {
406          close($sock);
407          print "Server gave wrong response to ENDHEARTBEAT: $response\n";
408 +        &tcp_configure();
409          return;
410      }
411      
412      close($sock);
413      print "^";
414 +    
415 +    &tcp_configure() if $doReconfigure;
416 +    
417 +    return;
418 + }
419 +
420 +
421 + #-----------------------------------------------------------------------
422 + # write_pid
423 + # Writes the PID (process ID) of this instance to $pidfile.
424 + # This is then used by a seperate script to check (and restart) ihost.
425 + #-----------------------------------------------------------------------
426 + sub write_pid() {
427 +    open PID, ">$pidfile";
428 +    print PID $$;
429 +    close PID;
430 +    
431 +    return;
432 + }
433 +
434 + #-----------------------------------------------------------------------
435 + # make_xml
436 + # Turns an array of plugins data into an XML string.
437 + #-----------------------------------------------------------------------
438 + sub make_xml() {
439 +    my($curlevel, $curline) = @_;
440 +    my($xmltemp) = ""; my($curtag) = ""; my($attributes) = "";
441 +    while(1) {
442 +        $curline = shift(@data) if $curline eq "";
443 +        return $xmltemp if not defined $curline;
444 +        chomp $curline;
445 +        # dealing with nest (or attributes)
446 +        if($curline =~ /^$curlevel([^\.\s]+\.)/) {
447 +            $curtag=$1;
448 +            if($curline =~ /^$curlevel$curtag([^\.\s]+)\s+(.*)$/) {
449 +                $xmltemp .= &make_xml("$curlevel$curtag", $curline);
450 +            }
451 +            elsif($curline =~ /^$curlevel$curtag(attributes)\.([^\.\s]+)\s+(.*)$/) {
452 +                $attributes .= " $2=\"$3\"";
453 +            }
454 +            else {
455 +                $xmltemp .= &make_xml("$curlevel$curtag", $curline);
456 +            }
457 +            my($nextline) = $data[0]; chomp $nextline if defined $nextline;
458 +            $curtag =~ s/(.*)\./$1/;
459 +            if((defined $nextline) && ($nextline =~ /^$curlevel$curtag\./)) {
460 +                $curline = "";
461 +            }
462 +            else {
463 +                $xmltemp = "<$curtag$attributes>$xmltemp</$curtag>" unless $curtag eq "";
464 +                return $xmltemp;
465 +            }
466 +        }
467 +        # dealing with value
468 +        elsif($curline =~ /^$curlevel([^\.\s]+)\s+(.*)$/) {
469 +            $curtag=$1;
470 +            $xmltemp=$2;          
471 +            my($nextline) = $data[0]; chomp $nextline if defined $nextline;
472 +            if(defined $nextline && ($nextline =~ /^$curlevel$curtag\./ || $nextline =~ /^$curlevel$curtag\s+/)) {
473 +                $curline = "";
474 +            }
475 +            else {
476 +                $xmltemp = "<$curtag$attributes>$xmltemp</$curtag>" unless $curtag eq "";
477 +                return $xmltemp;
478 +            }
479 +        }
480 +        # dealing with a null value
481 +        elsif($curline =~ /^$curlevel([^\.\s]+)$/) {
482 +            # simply adding a space makes the above elsif deal with it :)
483 +            # just level with an empty tag in the XML
484 +            $curline .= " ";
485 +        }
486 +        # failing all that, skip the line
487 +        else {
488 +            $curline = "";
489 +        }
490 +    }
491   }

Diff Legend

- Removed lines
+ Added lines
< Changed lines
> Changed lines