ViewVC Help
View File | Revision Log | Show Annotations | Revision Graph | Root Listing
root/i-scream/projects/cms/source/host/ihost-perl/ihost.pl
(Generate patch)

Comparing projects/cms/source/host/ihost-perl/ihost.pl (file contents):
Revision 1.19 by tdb, Wed Feb 28 10:52:16 2001 UTC vs.
Revision 1.36 by tdb, Wed Nov 14 16:41:30 2001 UTC

# Line 5 | Line 5
5   # http://www.i-scream.org.uk
6   #
7   # An all-in-one script to act as an i-scream host on
8 < # a typical Unix/Linux box.  You may adapt the data-gathering
9 < # methods as you see fit.
10 < #  - pjm2@ukc.ac.uk
8 > # a typical Unix/Linux box.
9   #
10   # $Author$
11   # $Id$
# Line 33 | Line 31 | use vars qw (
31               $filter_addr
32               $file_list
33               $fqdn
34 +             $pidfile
35 +             $retry_wait
36 +             @statgrab
37              );
38  
39   if (@ARGV != 2) {
# Line 43 | Line 44 | $filter_manager_addr = $ARGV[0];
44   $filter_manager_port = $ARGV[1];
45  
46   $seq_no = 1;
47 + $retry_wait = 60;
48  
49 + # write our PID to a file
50 + $pidfile = "/var/tmp/ihost.pid";
51 + &write_pid();
52 +
53   &tcp_configure();
54   &send_udp_packet();
55  
# Line 68 | Line 74 | while (1) {
74      else {
75          $delay = $next_tcp;
76      }
77 <    `sleep $delay`;
77 >    sleep $delay;
78   }
79  
80 + # we'll probably never get here...
81 + `rm -f $pidfile`;
82   exit(0);
83  
84  
85   #-----------------------------------------------------------------------
86 + # wait_then_retry
87 + # Waits for the period of time specified in $retry_wait, then attempts
88 + # to reconfigure with the server.
89 + #-----------------------------------------------------------------------
90 + sub wait_then_retry() {
91 +    print "Will retry configuration with filter manager in $retry_wait seconds.\n";
92 +    sleep $retry_wait;
93 + }
94 +
95 +
96 + #-----------------------------------------------------------------------
97   # tcp_configure
98   # Establishes a TCP connection to the specified i-scream filter manager.
99   # The host then requests details from the server, such as the intervals
# Line 82 | Line 101 | exit(0);
101   #-----------------------------------------------------------------------
102   sub tcp_configure() {
103      
104 <    my($sock) = new IO::Socket::INET(
105 <                                     PeerAddr => $filter_manager_addr,
106 <                                     PeerPort => $filter_manager_port,
107 <                                     Proto => 'tcp'
108 <                                    );
109 <    if (!defined $sock) {
110 <        print "IHOST ERROR: Could not connect to $filter_manager_addr:$filter_manager_port.\n";
111 <        print "Please check that there is an i-scream server at this address.\n";
112 <        print "Program ended.\n";
113 <        exit(1);
114 <    }
104 >    while (1) {
105 >        my($sock) = new IO::Socket::INET(
106 >                                         PeerAddr => $filter_manager_addr,
107 >                                         PeerPort => $filter_manager_port,
108 >                                         Proto => 'tcp'
109 >                                        ) or die "Cannot connect!";
110 >        if (!defined $sock) {
111 >            print "IHOST ERROR: Could not connect to $filter_manager_addr:$filter_manager_port.\n";
112 >            print "Please check that there is an i-scream server at this address.\n";
113 >            wait_then_retry();
114 >            next;
115 >        }
116  
117 <    # Now run through the configuration process...
118 <    my($response);
117 >        # Now run through the configuration process...
118 >        my($response);
119      
120 <    print $sock "STARTCONFIG\n";
121 <    $response = <$sock>;
122 <    if (!chop $response eq "OK") {
123 <        print "The i-scream server rejected the STARTCONFIG command.  Terminated.";
124 <        exit(1);
125 <    }
120 >        print $sock "STARTCONFIG\n";
121 >        $response = <$sock>;
122 >        if ($response && !($response eq "OK\n")) {
123 >            print "The i-scream server rejected the STARTCONFIG command.\n";
124 >            close($sock);
125 >            wait_then_retry();
126 >            next;
127 >        }
128  
129 <    print "Config started okay.\n";
129 >        print "Config started okay.\n";
130      
131 <    print $sock "LASTMODIFIED\n";
132 <    $response = <$sock>;
133 <    chop $response;
134 <    $last_modified = $response;
131 >        print $sock "LASTMODIFIED\n";
132 >        $response = <$sock>;
133 >        if (!$response) {
134 >            print "The i-scream server did not return anything for the LASTMODIFIED command.\n";
135 >            close($sock);
136 >            wait_then_retry();
137 >            next;
138 >        }
139 >        chop $response;
140 >        $last_modified = $response;
141      
142 <    print "Config last modified: ". (scalar localtime $last_modified/1000) . "\n";
142 >        print "Config last modified: ". (scalar localtime $last_modified/1000) . "\n";
143  
144 <    print $sock "FILELIST\n";
145 <    $response = <$sock>;
146 <    chop $response;
147 <    $file_list = $response;
144 >        print $sock "FILELIST\n";
145 >        $response = <$sock>;
146 >        if (!$response) {
147 >            print "The i-scream server did not provide a configuration file list.\n";
148 >            close($sock);
149 >            wait_then_retry();
150 >            next;
151 >        }
152 >        chop $response;
153 >        $file_list = $response;
154  
155 <    print "File list obtained: $file_list\n";
155 >        print "File list obtained: $file_list\n";
156  
157 <    print $sock "FQDN\n";
158 <    $response = <$sock>;
159 <    chop $response;
160 <    $fqdn = $response;
157 >        print $sock "FQDN\n";
158 >        $response = <$sock>;
159 >        if (!$response) {
160 >            print "The i-scream server did not tell us our FQDN.\n";
161 >            close($sock);
162 >            wait_then_retry();
163 >            next;
164 >        }
165 >        chop $response;
166 >        $fqdn = $response;
167  
168 <    print "FQDN returned: $fqdn\n";
168 >        print "FQDN returned: $fqdn\n";
169  
170 <    print $sock "UDPUpdateTime\n";
171 <    $response = <$sock>;
172 <    chop $response;
173 <    $udp_update_time = $response;
170 >        print $sock "UDPUpdateTime\n";
171 >        $response = <$sock>;
172 >        if (!$response) {
173 >            print "The i-scream server did not give us a UDPUpdateTime.\n";
174 >            close($sock);
175 >            wait_then_retry();
176 >            next;
177 >        }
178 >        chop $response;
179 >        $udp_update_time = $response;
180  
181 <    print $sock "TCPUpdateTime\n";
182 <    $response = <$sock>;
183 <    chop $response;
184 <    $tcp_update_time = $response;
181 >        print $sock "TCPUpdateTime\n";
182 >        $response = <$sock>;
183 >        if (!$response) {
184 >            print "The i-scream server did not give us a TCPUpdateTime.\n";
185 >            close($sock);
186 >            wait_then_retry();
187 >            next;
188 >        }
189 >        chop $response;
190 >        $tcp_update_time = $response;
191      
192 <    print "UDP packet period: $udp_update_time seconds.\nTCP heartbeat period: $tcp_update_time seconds.\n";
192 >        print "UDP packet period: $udp_update_time seconds.\nTCP heartbeat period: $tcp_update_time seconds.\n";
193  
194 <    print $sock "ENDCONFIG\n";
195 <    $response = <$sock>;
196 <    chomp $response;
197 <    if (!$response eq "OK") {
198 <        print "ENDCONFIG command to server failed.  Terminated.\n";
199 <        exit(1);
200 <    }
194 >        print $sock "ENDCONFIG\n";
195 >        $response = <$sock>;
196 >        if ($response && !($response eq "OK\n")) {
197 >            print "ENDCONFIG command to server failed.  Terminated.\n";
198 >            close($sock);
199 >            wait_then_retry();
200 >            next;
201 >        }
202  
203 <    print "Config ended.\n";
203 >        print "Config ended.\n";
204      
205 <    print $sock "FILTER\n";
206 <    $response = <$sock>;
207 <    chop $response;
208 <    $response =~ /(.*);(.*);(.*)/;
209 <    ($filter_addr, $udp_port, $tcp_port) = ($1, $2, $3);
205 >        print $sock "FILTER\n";
206 >        $response = <$sock>;
207 >        if (!$response) {
208 >            print "Failed: Could not get a filter address from the filter manager.\n";
209 >            close($sock);
210 >            wait_then_retry();
211 >            next;
212 >        }
213 >        chop $response;
214 >        $response =~ /^(.*);(.*);(.*)/;
215 >        if ($response eq "ERROR") {
216 >            print "There are no active configured filters for your host.\n";
217 >            close($sock);
218 >            wait_then_retry();
219 >            next;
220 >        }
221 >        ($filter_addr, $udp_port, $tcp_port) = ($1, $2, $3);
222 >        unless (defined($filter_addr) && defined($udp_port) && defined($tcp_port)) {
223 >            print "Failed: Filter address response from server did not make sense: $response\n";
224 >            close($sock);
225 >            wait_then_retry();
226 >            next;
227 >        }
228      
229 <    print "Got filter data ($filter_addr, $udp_port, $tcp_port)\n";
229 >        print "Got filter data ($filter_addr, $udp_port, $tcp_port)\n";
230  
231 <    print $sock "END\n";
232 <    $response = <$sock>;
233 <    chop $response;
234 <    if ($response eq "OK") {
235 <        print "Host successfully configured via TCP.\n"
236 <    }
237 <    else {
238 <        print "The server failed the host configuration on the END command.";
239 <        exit(1);
240 <    }
231 >        print $sock "END\n";
232 >        $response = <$sock>;
233 >        if ($response && ($response eq "OK\n")) {
234 >            print "Host successfully configured via TCP.\n"
235 >        }
236 >        else {
237 >            print "The server failed the host configuration on the END command.\n";
238 >            close($sock);
239 >            wait_then_retry();
240 >            next;
241 >        }
242      
243 <    close($sock);
243 >        close($sock);
244  
245 <    print "Configuration finished sucessfully!\n";
246 <    
245 >        print "Configuration finished sucessfully!\n";
246 >        last;
247 >    }
248      return;
249   }
250  
251  
179
180
252   #-----------------------------------------------------------------------
253   # send_udp_packet
254   # Sends a UDP packet to an i-scream filter.
# Line 186 | Line 257 | sub tcp_configure() {
257   #-----------------------------------------------------------------------
258   sub send_udp_packet() {
259  
260 <    my(@statgrab) = `./statgrab.pl`;
190 <    my(%packet);
191 <    for (my($i) = 0; $i <= $#statgrab; $i++) {
192 <        $statgrab[$i] =~ /^([^\s]*) (.*)$/;
193 <        $packet{$1} = $2;
194 <    }
260 >    @statgrab = `./statgrab.pl`;
261      
262 +    # get some extra data
263      my($date) = time;
264 +    my($ip);
265 +    $ip = inet_ntoa(scalar(gethostbyname(hostname())) || 'localhost') or $ip = 'localhost';
266      
267 <    my($disk_info) = "<disk>";
268 <    my($i) = 0;
269 <    while (defined $packet{"packet.disk.p$i.attributes.mount"}) {
270 <        $disk_info .= "<p$i";
271 <        $disk_info .= " name=\"" . $packet{"packet.disk.p$i.attributes.name"} . "\"";
272 <        $disk_info .= " kbytes=\"" . $packet{"packet.disk.p$i.attributes.kbytes"} . "\"";
204 <        $disk_info .= " used=\"" . $packet{"packet.disk.p$i.attributes.used"} . "\"";
205 <        $disk_info .= " avail=\"" . $packet{"packet.disk.p$i.attributes.avail"} . "\"";
206 <        $disk_info .= " mount=\"" . $packet{"packet.disk.p$i.attributes.mount"} . "\"";
207 <        $disk_info .= "></p$i>";
208 <        ++$i;
209 <    }
210 <    $disk_info .= "</disk>";
211 <
212 <    my($ip) = inet_ntoa(scalar(gethostbyname(hostname())) || 'localhost');
213 <
214 <    # Build the XML packet this way, as we can clearly
215 <    # see the structure and contents... I like this ;-)
216 <    # [Note that the server rejects UDP packets that are
217 <    # larger than 8196 bytes]
218 <    my($xml) = <<EOF;
267 >    # add some extra data to the array
268 >    push(@statgrab, "packet.attributes.seq_no=$seq_no");
269 >    push(@statgrab, "packet.attributes.machine_name=$fqdn");
270 >    push(@statgrab, "packet.attributes.date=$date");
271 >    push(@statgrab, "packet.attributes.type=data");
272 >    push(@statgrab, "packet.attributes.ip=$ip");
273      
274 < <packet seq_no="$seq_no" machine_name="$fqdn" date="$date" type="data" ip="$ip">
275 <    <load>
222 <        <load1>$packet{"packet.load.load1"}</load1>
223 <        <load5>$packet{"packet.load.load5"}</load5>
224 <        <load15>$packet{"packet.load.load15"}</load15>
225 <    </load>
226 <    <os>
227 <        <name>$packet{"packet.os.name"}</name>
228 <        <release>$packet{"packet.os.release"}</release>
229 <        <platform>$packet{"packet.os.platform"}</platform>
230 <        <sysname>$packet{"packet.os.sysname"}</sysname>
231 <        <version>$packet{"packet.os.version"}</version>
232 <        <uptime>$packet{"packet.os.uptime"}</uptime>
233 <    </os>
234 <    <users>
235 <        <count>$packet{"packet.users.count"}</count>
236 <        <list>$packet{"packet.users.list"}</list>
237 <    </users>
238 <    <processes>
239 <        <total>$packet{"packet.processes.total"}</total>
240 <        <sleeping>$packet{"packet.processes.sleeping"}</sleeping>
241 <        <zombie>$packet{"packet.processes.zombie"}</zombie>
242 <        <stopped>$packet{"packet.processes.stopped"}</stopped>
243 <        <cpu>$packet{"packet.processes.cpu"}</cpu>
244 <    </processes>
245 <    <cpu>
246 <        <idle>$packet{"packet.cpu.idle"}</idle>
247 <        <user>$packet{"packet.cpu.user"}</user>
248 <        <kernel>$packet{"packet.cpu.kernel"}</kernel>
249 <        <iowait>$packet{"packet.cpu.iowait"}</iowait>
250 <        <swap>$packet{"packet.cpu.swap"}</swap>
251 <    </cpu>
252 <    <memory>
253 <        <total>$packet{"packet.memory.total"}</total>
254 <        <free>$packet{"packet.memory.free"}</free>
255 <    </memory>
256 <    <swap>
257 <        <total>$packet{"packet.swap.total"}</total>
258 <        <free>$packet{"packet.swap.free"}</free>
259 <    </swap>
260 <    $disk_info
261 < </packet>
262 <
263 < EOF
264 <
265 <    # Make the packet smaller by stripping out newlines and leading spaces.
266 <    $xml =~ s/\n\s*//g;
267 <
268 < print $xml;
274 >    # turn the array into some nice XML
275 >    my($xml) = &make_xml("", "");
276      
277      my($sock) = new IO::Socket::INET (
278                                        PeerPort => $udp_port,
279                                        PeerAddr => $filter_addr,
280                                        Proto => 'udp'
281 <                                     ) or die "Socket: $!\n";
282 <
281 >                                     ) or die "Could not send UDP: $!\n";
282 >    
283      print $sock $xml or die "Could not send UDP packet: $!\n";
284      close($sock);
285      $seq_no++;
# Line 282 | Line 289 | print $xml;
289   }
290  
291  
285
286
292   #-----------------------------------------------------------------------
293   # send_tcp_heartbeat
294   # Establishes a TCP connection to an i-scream filter.
295   # The heartbeat is used as a guaranteed "I'm alive" delivery mechanism.
296 + # If we need to reconfigure, then we complete the heartbeat before
297 + # doing so.
298   #-----------------------------------------------------------------------
299   sub send_tcp_heartbeat() {
300  
301 +    my ($doReconfigure) = 0;
302 +
303      my($sock) = new IO::Socket::INET(
304                                       PeerAddr => $filter_addr,
305                                       PeerPort => $tcp_port,
306                                       Proto => 'tcp'
307 <                                    );
307 >                                    ) or return;
308      if (!defined $sock) {
309          print "IHOST WARNING: Failed to deliver a heartbeat to the i-scream filter.\n";
310 +        &tcp_configure();
311          return;
312      }
313  
# Line 306 | Line 316 | sub send_tcp_heartbeat() {
316  
317      print $sock "HEARTBEAT\n";
318      $response = <$sock>;
319 <    chop $response;
310 <    if (!$response eq "OK") {
319 >    if (!$response eq "OK\n") {
320          close($sock);
321          print "Server gave wrong response to HEARTBEAT: $response\n";
322 +        &tcp_configure();
323          return;
324      }
325      
326      print $sock "CONFIG\n";
327      $response = <$sock>;
328 <    chop $response;
319 <    if (!$response eq "OK") {
328 >    if (!$response eq "OK\n") {
329          close($sock);
330          print "Server gave wrong response to CONFIG: $response\n";
331 +        &tcp_configure();
332          return;
333      }
334  
335      print $sock "$file_list\n";
336      $response = <$sock>;
337 <    chop $response;
328 <    if (!$response eq "OK") {
337 >    if (!$response eq "OK\n") {
338          close($sock);
339          print "Server gave wrong response to file list: $response\n";
340 +        &tcp_configure();
341          return;
342      }
343      
344      print $sock "$last_modified\n";
345      $response = <$sock>;
346 <    chop $response;
337 <    if ($response eq "ERROR") {
346 >    if ($response eq "ERROR\n") {
347          close($sock);
348 <        &tcp_configure();
349 <        return;
348 >        print "Server configuration changed.  Reconfiguring with filter manager.\n";
349 >        $doReconfigure = 1;
350      }
351 <    if (!$response eq "OK") {
351 >    if (!$response eq "OK\n") {
352          close($sock);
353          print "Server gave wrong response to HEARTBEAT: $response\n";
354 +        &tcp_configure();
355          return;
356      }
357      
358      print $sock "ENDHEARTBEAT\n";
359      $response = <$sock>;
360 <    chop $response;
351 <    if (!$response eq "OK") {
360 >    if (!$response eq "OK\n") {
361          close($sock);
362          print "Server gave wrong response to ENDHEARTBEAT: $response\n";
363 +        &tcp_configure();
364          return;
365      }
366      
367      close($sock);
368      print "^";
369      
370 +    &tcp_configure() if $doReconfigure;
371 +    
372      return;
373 + }
374 +
375 +
376 + #-----------------------------------------------------------------------
377 + # write_pid
378 + # Writes the PID (process ID) of this instance to $pidfile.
379 + # This is then used by a seperate script to check (and restart) ihost.
380 + #-----------------------------------------------------------------------
381 + sub write_pid() {
382 +    open PID, ">$pidfile";
383 +    print PID $$;
384 +    close PID;
385 +    
386 +    return;
387 + }
388 +
389 + #-----------------------------------------------------------------------
390 + # make_xml
391 + # Turns an array of statgrab data into an XML string.
392 + #-----------------------------------------------------------------------
393 + sub make_xml() {
394 +    my($curlevel, $curline) = @_;
395 +    my($xmltemp) = ""; my($curtag) = ""; my($attributes) = "";
396 +    while(true) {
397 +        $curline = shift(@statgrab) if $curline eq ""; chomp $curline;
398 +        if($curline =~ /^$curlevel([^\.\s]+\.)/) {
399 +            $curtag=$1;
400 +        }
401 +        if($curline =~ /^$curlevel$curtag([^\.\s]+)\s+(.*)$/) {
402 +            $xmltemp .= "<$1$attributes>$2</$1>";
403 +        }
404 +        elsif($curline =~ /^$curlevel$curtag(attributes)\.([^\.=]+)=(.*)$/) {
405 +            $attributes .= " $2=\"$3\"";
406 +        }
407 +        else {
408 +            $xmltemp .= &make_xml("$curlevel$curtag", $curline);
409 +        }
410 +        my($nextline) = $statgrab[0]; chomp $nextline if defined $nextline;
411 +        $curtag =~ s/(.*)\./$1/;                
412 +        if(defined $nextline && $nextline =~ /^$curlevel$curtag\./) {
413 +            $curline = "";
414 +        }
415 +        else {
416 +            $xmltemp = "<$curtag$attributes>$xmltemp</$curtag>" unless $curtag eq "";
417 +            return $xmltemp;
418 +        }
419 +    }
420   }

Diff Legend

Removed lines
+ Added lines
< Changed lines
> Changed lines