Annotation of loncom/loncron, revision 1.35
1.1 albertel 1: #!/usr/bin/perl
2:
3: # The LearningOnline Network
4: # Housekeeping program, started by cron
5: #
6: # (TCP networking package
7: # 6/1/99,6/2,6/10,6/11,6/12,6/14,6/26,6/28,6/29,6/30,
8: # 7/1,7/2,7/9,7/10,7/12 Gerd Kortemeyer)
9: #
1.3 www 10: # 7/14,7/15,7/19,7/21,7/22,11/18,
11: # 2/8 Gerd Kortemeyer
1.20 harris41 12: # 12/6/2000,12/8 Scott Harrison
1.11 www 13: # 12/23 Gerd Kortemeyer
1.22 harris41 14: # YEAR=2001
15: # 1/10/2001, 2/12/, 2/26, 3/15, 04/11, 04/21,8/27 Scott Harrison
1.25 www 16: # 09/04,09/06,11/26 Gerd Kortemeyer
1.26 harris41 17: # YEAR=2002
18: # 5/11/2002 Scott Harrison
1.24 www 19:
20: $|=1;
1.1 albertel 21:
1.26 harris41 22: use lib '/home/httpd/lib/perl/';
23: use LONCAPA::Configuration;
24:
1.1 albertel 25: use IO::File;
26: use IO::Socket;
27:
# -------------------------------------------------- Non-critical communication
# Send one command line over the UNIX-domain socket named after $server in
# $perlvar{'lonSockDir'} and return the first line of the answer without its
# line ending.
#
#   $cmd    - command text; a newline is appended before sending
#   $server - name of the socket file inside lonSockDir
#
# Returns the string "con_lost" when the socket cannot be opened (connect
# timeout 10 seconds) or when the answer is missing or false (empty or "0").
sub reply {
    my ($cmd,$server)=@_;
    my $peerfile="$perlvar{'lonSockDir'}/$server";
    my $client=IO::Socket::UNIX->new(Peer    => $peerfile,
                                     Type    => SOCK_STREAM,
                                     Timeout => 10)
        or return "con_lost";
    print $client "$cmd\n";
    my $answer=<$client>;
    close($client);
    # The peer may hang up without answering; readline then yields undef,
    # which must not be handed to chomp.
    return "con_lost" unless defined($answer);
    chomp($answer);
    return "con_lost" unless $answer;
    return $answer;
}
42:
# --------------------------------------------------------- Output error status
# Write the current values of the package counters $notices, $warnings and
# $errors as a three-row HTML table to the handle passed as first argument,
# followed by a link back to the "top" anchor.
sub errout {
    my ($out)=@_;
    my @rows=(
        ['Notices',  $notices],
        ['Warnings', $warnings],
        ['Errors',   $errors],
    );
    print $out qq{<p><table border=2 bgcolor="#CCCCCC">\n};
    foreach my $row (@rows) {
        print $out "<tr><td>$row->[0]</td><td>$row->[1]</td></tr>\n";
    }
    print $out qq{</table><p><a href="#top">Top</a><p>\n};
}
55:
56: # ================================================================ Main Program
57:
# --------------------------------- Read loncapa_apache.conf and loncapa.conf
# Copy the settings returned by read_conf() into the package hash %perlvar.
%perlvar=do {
    my $conf=LONCAPA::Configuration::read_conf('loncapa.conf');
    %{$conf};
};
# Both entries are sensitive and not needed here; dropping them also keeps
# them out of the PerlVars table of the status page.
delete @perlvar{'lonReceipt','lonSqlAccess'};
1.13 harris41 64:
# --------------------------------------- Make sure that LON-CAPA is configured
# Only one setting (lonHostID) is tested; this is just a safeguard.  While
# that setting still holds the installation placeholder, mail the system
# address and leave with exit status 1.
if ('{[[[[lonHostID]]]]}' eq $perlvar{'lonHostID'}) {
    print("Unconfigured machine.\n");
    my $emailto=$perlvar{'lonSysEMail'};
    my $hostname=`/bin/hostname`;
    $hostname='' unless defined($hostname);
    # chomp removes only a line ending; chop would eat the last character
    # of the name whenever the output came without one.
    chomp($hostname);
    $hostname=~s/[^\w\.]//g; # make sure is safe to pass through shell
    my $subj="LON: Unconfigured machine $hostname";
    system("echo 'Unconfigured machine $hostname.' | ".
           "mailto $emailto -s '$subj' > /dev/null");
    exit 1;
}
78:
# ----------------------------- Make sure this process is running from user=www
# Compare the real user id of this process with the uid of account 'www';
# on mismatch mail both configured addresses and leave with exit status 1.
my $wwwid=getpwnam('www');
# getpwnam yields undef when the account does not exist.  Undef compares
# numerically as 0, which would let the check pass for root, so a missing
# account is treated as a mismatch.
if (!defined($wwwid) || $wwwid!=$<) {
    print("User ID mismatch. This program must be run as user 'www'\n");
    my $emailto="$perlvar{'lonAdmEMail'},$perlvar{'lonSysEMail'}";
    my $subj="LON: $perlvar{'lonHostID'} User ID mismatch";
    system("echo 'User ID mismatch. loncron must be run as user www.' | ".
           "mailto $emailto -s '$subj' > /dev/null");
    exit 1;
}
89:
# ------------------------------------------------------------- Read hosts file
# Fill %hostname, %hostdom, %hostip and %hostrole (keyed by host id),
# %domaindescription (keyed by domain) and %libserv (library servers other
# than this host) from the colon-separated lines of hosts.tab.
{
    my $hoststab="$perlvar{'lonTabDir'}/hosts.tab";
    my $config=IO::File->new($hoststab);

    if ($config) {
        while (my $configline=<$config>) {
            # Strip the line ending first; otherwise it stays attached to
            # the last field (the ip, or the domain description).
            chomp($configline);
            my ($id,$domain,$role,$name,$ip,$domdescr)=
                split(/:/,$configline);
            # Lines lacking any of the five mandatory fields are skipped.
            next unless ($id && $domain && $role && $name && $ip);
            $hostname{$id}=$name;
            $hostdom{$id}=$domain;
            $hostip{$id}=$ip;
            $hostrole{$id}=$role;
            if ($domdescr) { $domaindescription{$domain}=$domdescr; }
            if (($role eq 'library') && ($id ne $perlvar{'lonHostID'})) {
                $libserv{$id}=$name;
            }
        }
        $config->close();
    } else {
        # Keep going with empty host tables, but say why they are empty.
        warn("loncron: cannot read $hoststab: $!\n");
    }
}
112:
# ------------------------------------------------------ Read spare server file
# Every non-empty line of spare.tab other than this host's own id becomes a
# key of %spareid.
{
    my $sparetab=IO::File->new("$perlvar{'lonTabDir'}/spare.tab");

    while (my $entry=<$sparetab>) {
        chomp($entry);
        next unless $entry;
        next if ($entry eq $perlvar{'lonHostID'});
        $spareid{$entry}=1;
    }
}
124:
# ---------------------------------------------------------------- Start report
# Directory the status page is written to, the three severity counters the
# rest of the run increments, and the start time as epoch seconds and text.

$statusdir='/home/httpd/html/lon-status';

($errors,$warnings,$notices)=(0,0,0);

$now=time;
$date=localtime($now);
135:
# The block opened here stays open until the end of the report; $fh is the
# handle every later section writes to.
{
my $fh=IO::File->new(">$statusdir/newstatus.html")
    # Without a handle the first print below would abort with an obscure
    # message; stop here and name the file instead.
    or die("loncron: cannot write $statusdir/newstatus.html: $!\n");

# Page head, table of contents and the opening of the PerlVars table.
print $fh (<<ENDHEADERS);
<html>
<head>
<title>LON Status Report $perlvar{'lonHostID'}</title>
</head>
<body bgcolor="#AAAAAA">
<a name="top">
<h1>LON Status Report $perlvar{'lonHostID'}</h1>
<h2>$date ($now)</h2>
<ol>
<li><a href="#configuration">Configuration</a>
<li><a href="#machine">Machine Information</a>
<li><a href="#tmp">Temporary Files</a>
<li><a href="#tokens">Session Tokens</a>
<li><a href="#httpd">httpd</a>
<li><a href="#lonsql">lonsql</a>
<li><a href="#lond">lond</a>
<li><a href="#lonc">lonc</a>
<li><a href="#lonhttpd">lonhttpd</a>
<li><a href="#lonnet">lonnet</a>
<li><a href="#connections">Connections</a>
<li><a href="#delayed">Delayed Messages</a>
<li><a href="#errcount">Error Count</a>
</ol>
<hr>
<a name="configuration">
<h2>Configuration</h2>
<h3>PerlVars</h3>
<table border=2>
ENDHEADERS

# One row per configuration variable, sorted by name.
foreach my $varname (sort(keys(%perlvar))) {
    print $fh "<tr><td>$varname</td><td>$perlvar{$varname}</td></tr>\n";
}
# One row per host read from hosts.tab.
print $fh "</table><h3>Hosts</h3><table border=2>";
foreach my $id (sort(keys(%hostname))) {
    print $fh
        "<tr><td>$id</td><td>$hostdom{$id}</td><td>$hostrole{$id}</td>";
    print $fh "<td>$hostname{$id}</td><td>$hostip{$id}</td></tr>\n";
}
# Spare hosts as an ordered list.
print $fh "</table><h3>Spare Hosts</h3><ol>";
foreach my $id (sort(keys(%spareid))) {
    print $fh "<li>$id\n";
}

print $fh "</ol>\n";
185:
# --------------------------------------------------------------------- Machine
# Copies /proc/loadavg and the output of df and ps into the report and bumps
# the counters from the second loadavg field, the fifth df column and the
# number of ps output lines.

print $fh '<hr><a name="machine"><h2>Machine Information</h2>',
          "<h3>loadavg</h3>";

{
    my $loadfh=IO::File->new("/proc/loadavg");
    $loadavg=$loadfh ? <$loadfh> : undef;
    $loadfh->close() if ($loadfh);
}

print $fh "<tt>$loadavg</tt>";

{
    my $load=(split(/\s+/,$loadavg))[1];
    if    ($load>4.0) { $errors++; }
    elsif ($load>2.0) { $warnings++; }
    elsif ($load>1.0) { $notices++; }
}

print $fh "<h3>df</h3>", "<pre>";

if (open(my $df,"df|")) {
    while (my $row=<$df>) {
        print $fh $row;
        # Fifth column with everything but word characters removed.
        my $usage=(split(/\s+/,$row))[4];
        $usage=~s/\W//g;
        if    ($usage>90) { $warnings++; $notices++; }
        elsif ($usage>80) { $warnings++; }
        elsif ($usage>60) { $notices++; }
        # Above 95 two more warnings are added on top.
        $warnings+=2 if ($usage>95);
    }
    close($df);
}
print $fh "</pre>";

print $fh "<h3>ps</h3>", "<pre>";
$psproc=0;

if (open(my $ps,"ps -aux|")) {
    while (my $row=<$ps>) {
        print $fh $row;
        $psproc++;
    }
    close($ps);
}
print $fh "</pre>";

# One notice above 200 lines, a second one above 250.
foreach my $limit (200,250) {
    $notices++ if ($psproc>$limit);
}

errout($fh);
1.11 www 245:
# --------------------------------------------------------------- clean out tmp
# Delete files in $perlvar{'lonDaemons'}/tmp whose modification time is more
# than lonExpire seconds back.  Files whose first line starts with
# "CHECKOUTTOKEN&" are kept until they are older than 365*lonExpire and are
# counted as old checkout tokens meanwhile.
print $fh '<hr><a name="tmp"><h2>Temporary Files</h2>';
$cleaned=0;
$old=0;
foreach my $tmpfile (glob("$perlvar{'lonDaemons'}/tmp/*")) {
    my $mtime=(stat($tmpfile))[9];
    # The file may have vanished between glob and stat.
    next unless defined($mtime);
    my $since=time()-$mtime;
    next unless ($since>$perlvar{'lonExpire'});

    my $firstline='';
    # Three-argument open: the name comes from a directory listing and must
    # never be interpreted as an open mode or a pipe.
    if (open(my $probe,'<',$tmpfile)) {
        $firstline=<$probe>;
        close($probe);
    }
    $firstline='' unless defined($firstline);

    if ($firstline!~/^CHECKOUTTOKEN\&/ ||
        $since>365*$perlvar{'lonExpire'}) {
        $cleaned++;
        unlink($tmpfile);
    } else {
        $old++;
    }
}
print $fh "Cleaned up ".$cleaned." files (".$old." old checkout tokens).";
1.11 www 276:
# ------------------------------------------------------------ clean out lonIDs
# Files in lonIDsDir not modified within the last lonExpire seconds are
# listed in the report and removed; the remaining ones count as open sessions.
print $fh '<hr><a name="tokens"><h2>Session Tokens</h2>';
($cleaned,$active)=(0,0);
foreach my $token (glob("$perlvar{'lonIDsDir'}/*")) {
    my $mtime=(stat($token))[9];
    if (time()-$mtime>$perlvar{'lonExpire'}) {
        $cleaned++;
        print $fh "Unlinking $token<br>";
        unlink($token);
        next;
    }
    $active++;
}
print $fh "<p>Cleaned up ".$cleaned." stale session token(s).",
          "<h3>$active open session(s)</h3>";
299:
# ----------------------------------------------------------------------- httpd
# Copy the last 25 lines of the httpd access and error logs into the report;
# every error-log line containing "[error]" adds one notice.

print $fh '<hr><a name="httpd"><h2>httpd</h2><h3>Access Log</h3><pre>';

{
    # Log lines carry request data chosen by remote clients, so markup
    # characters are escaped before the text goes into the HTML page.
    my $escape=sub {
        my ($text)=@_;
        $text=~s/&/&amp;/g;
        $text=~s/</&lt;/g;
        $text=~s/>/&gt;/g;
        return $text;
    };

    if (open(my $access,'-|',"tail -n25 /etc/httpd/logs/access_log")) {
        while (my $entry=<$access>) {
            print $fh $escape->($entry);
        }
        close($access);
    }

    print $fh "</pre><h3>Error Log</h3><pre>";

    if (open(my $errlog,'-|',"tail -n25 /etc/httpd/logs/error_log")) {
        while (my $entry=<$errlog>) {
            print $fh $escape->($entry);
            # Matching is done on the raw line, not the escaped copy.
            if ($entry=~/\[error\]/) { $notices++; }
        }
        close($errlog);
    }
}
print $fh "</pre>";
errout($fh);
1.5 harris41 318:
319:
# ------------------------------------------------ lonsql, lond, lonc, lonhttpd
# All four daemons are supervised the same way: show the log tail, probe the
# pid recorded in logs/<name>.pid, restart the daemon when the probe fails,
# rotate the log and print the counters.  The per-daemon differences are the
# options handed to _supervise_daemon below.

# Return the first line of $pidfile with all whitespace removed, or '' when
# the file cannot be read or is empty.
sub _read_pid {
    my ($pidfile)=@_;
    my $pid='';
    if (my $pidfh=IO::File->new($pidfile)) {
        my $firstline=<$pidfh>;
        $pidfh->close();
        if (defined($firstline)) {
            $firstline=~s/\s+//g;
            $pid=$firstline;
        }
    }
    return $pid;
}

# True when $pid is a positive integer and signal 0 can be delivered to it.
# Anything else is rejected up front: an empty or garbled value would be
# taken as pid 0, which addresses the caller's own process group, so the
# probe would "succeed" and a following USR1 would hit this script itself.
sub _pid_alive {
    my ($pid)=@_;
    return 0 unless ($pid=~/^[1-9]\d*$/);
    return kill(0 => $pid) ? 1 : 0;
}

# Copy the last $count lines of $logfile into the report on $fh and score
# them.  Before a restart attempt INFO and WARNING lines add a notice and
# CRITICAL lines a warning; after one ($after_restart true) WARNING and
# CRITICAL lines each add a notice.
sub _report_log_tail {
    my ($fh,$logfile,$count,$after_restart)=@_;
    open(my $tail,'-|',"tail -n$count $logfile") or return;
    while (my $entry=<$tail>) {
        print $fh $entry;
        if ($after_restart) {
            $notices++ if ($entry=~/WARNING/);
            $notices++ if ($entry=~/CRITICAL/);
        } else {
            $notices++  if ($entry=~/INFO/);
            $notices++  if ($entry=~/WARNING/);
            $warnings++ if ($entry=~/CRITICAL/);
        }
    }
    close($tail);
    return;
}

# Shift $logfile to .1, .1 to .2 and .2 to .3 once it exceeds 40000 bytes.
sub _rotate_log {
    my ($fh,$logfile)=@_;
    my $size=(stat($logfile))[7];
    if (defined($size) && $size>40000) {
        print $fh "Rotating logs ...<p>";
        rename("$logfile.2","$logfile.3");
        rename("$logfile.1","$logfile.2");
        rename($logfile,"$logfile.1");
    }
    return;
}

# Write the report section for daemon $name to $fh and restart the daemon
# when it is not running.  Options:
#   tail    - number of log lines shown at the top of the section
#   penalty - errors added when the recorded pid does not respond
#   usr1    - true to send USR1 to a responding daemon
sub _supervise_daemon {
    my ($fh,$name,%opt)=@_;
    my $logdir="$perlvar{'lonDaemons'}/logs";
    my $logfile="$logdir/$name.log";
    my $pidfile="$logdir/$name.pid";
    my $startcmd="$perlvar{'lonDaemons'}/$name 2>>$logdir/${name}_errors";

    print $fh '<hr><a name="'.$name.'"><h2>'.$name.'</h2><h3>Log</h3><pre>';
    print "$name\n";
    if (-e $logfile) {
        _report_log_tail($fh,$logfile,$opt{'tail'},0);
    }
    print $fh "</pre>";

    # A missing pid file means the daemon has to be started.
    my $restart=1;
    if (-e $pidfile) {
        my $pid=_read_pid($pidfile);
        if (_pid_alive($pid)) {
            if ($opt{'usr1'}) {
                print $fh
                    "<h3>$name at pid $pid responding, sending USR1</h3>";
                kill('USR1',$pid);
            } else {
                print $fh "<h3>$name at pid $pid responding</h3>";
            }
            $restart=0;
        } else {
            $errors+=$opt{'penalty'};
            print $fh "<h3>$name at pid $pid not responding</h3>";
            # Solution: kill parent and children processes, remove .pid
            # and restart
            print $fh
          "<h3>Decided to clean up stale .pid file and restart $name</h3>";
        }
    }

    if ($restart) {
        $errors++;
        # The report shows the raw return values of killall and unlink.
        print $fh '<br><font color="red">Killall '.$name.': '.
            system("killall $name").' - ';
        sleep 2;
        print $fh unlink($pidfile).' - '.system("killall -9 $name").
            '</font><br>';
        print $fh "<h3>$name not running, trying to start</h3>";
        system($startcmd);
        sleep 2;
        if (-e $pidfile) {
            print $fh "Seems like it started ...<p>";
            my $pid=_read_pid($pidfile);
            sleep 2;
            if (_pid_alive($pid)) {
                print $fh "<h3>$name at pid $pid responding</h3>";
            } else {
                $errors+=2;
                print $fh "<h3>$name at pid $pid not responding</h3>";
                print $fh "Give it one more try ...<p>";
                system($startcmd);
                sleep 2;
            }
        } else {
            print $fh "Seems like that did not work!<p>";
            $errors++;
        }
        if (-e $logfile) {
            print $fh "<p><pre>";
            _report_log_tail($fh,$logfile,100,1);
            print $fh "</pre>";
        }
    }

    _rotate_log($fh,$logfile);
    errout($fh);
    return;
}

# lonsql is only checked when this machine's lonRole is "library".
if ($perlvar{'lonRole'} eq "library") {
    _supervise_daemon($fh,'lonsql',  tail => 100, penalty => 2, usr1 => 0);
}
_supervise_daemon($fh,'lond',     tail => 25, penalty => 1, usr1 => 1);
_supervise_daemon($fh,'lonc',     tail => 25, penalty => 1, usr1 => 1);
_supervise_daemon($fh,'lonhttpd', tail => 25, penalty => 1, usr1 => 0);
# ---------------------------------------------------------------------- lonnet
# Show the last 50 lines of lonnet.log and the last 10 of lonnet.perm.log,
# then rotate lonnet.log once it has grown beyond 40000 bytes.
{
    my $logdir="$perlvar{'lonDaemons'}/logs";
    my $templog="$logdir/lonnet.log";
    my $permlog="$logdir/lonnet.perm.log";

    print $fh '<hr><a name="lonnet"><h2>lonnet</h2><h3>Temp Log</h3><pre>';
    print "lonnet\n";
    if (-e $templog) {
        if (open(my $tail,"tail -n50 $templog|")) {
            while (my $entry=<$tail>) { print $fh $entry; }
            close($tail);
        }
    }
    print $fh "</pre><h3>Perm Log</h3><pre>";

    if (-e $permlog) {
        if (open(my $tail,"tail -n10 $permlog|")) {
            while (my $entry=<$tail>) { print $fh $entry; }
            close($tail);
        }
    } else {
        print $fh "No perm log\n";
    }

    $fname=$templog;
    my @info=stat($fname);
    # Element 7 of the stat list is the size in bytes.
    if (@info && $info[7]>40000) {
        print $fh "Rotating logs ...<p>";
        rename("$fname.2","$fname.3");
        rename("$fname.1","$fname.2");
        rename("$fname","$fname.1");
    }

    print $fh "</pre>";
}
errout($fh);
# ----------------------------------------------------------------- Connections
# Send "pong" to every host from hosts.tab.  An answer of the form
# "<host>:<own lonHostID>" is shown as ok; any other answer is shown as
# received and adds a warning, and "con_lost" adds a second one.

print $fh '<hr><a name="connections"><h2>Connections</h2>';

print $fh "<table border=2>";
foreach my $peer (sort(keys(%hostname))) {
    my $pong=reply("pong",$peer);
    my $cell;
    if ($pong eq "$peer:$perlvar{'lonHostID'}") {
        $cell="<b>ok</b>";
    } else {
        $cell=$pong;
        $warnings+=($pong eq 'con_lost') ? 2 : 1;
    }
    print $fh "<tr><td>$peer</td><td>$cell</td></tr>\n";
}
print $fh "</table>";

errout($fh);
# ------------------------------------------------------------ Delayed messages
# Scan lonnet.perm.log, whose lines are split on ':' into time, status,
# server and command.  Status 'F' is reported as a failure and adds a
# warning, 'D' raises and 'S' lowers the count of unsent messages; every
# unsent message then adds five warnings.  The listing of the "delayed"
# directory under lonSockDir follows.

print $fh '<hr><a name="delayed"><h2>Delayed Messages</h2>';
print "buffers\n";

print $fh '<h3>Scanning Permanent Log</h3>';

$unsend=0;
{
    my $dfh=IO::File->new("$perlvar{'lonDaemons'}/logs/lonnet.perm.log");
    # A missing perm log simply means there is nothing to scan.
    if ($dfh) {
        while (my $entry=<$dfh>) {
            my ($time,$sdf,$dserv,$dcmd)=split(/:/,$entry);
            next unless defined($sdf);
            if ($sdf eq 'F') {
                # Goes into the report; it used to be printed to STDOUT.
                print $fh "<b>Failed: $time, $dserv, $dcmd</b><br>";
                $warnings++;
            }
            if ($sdf eq 'S') { $unsend--; }
            if ($sdf eq 'D') { $unsend++; }
        }
        $dfh->close();
    }
}
print $fh "Total unsend messages: <b>$unsend</b><p>\n";
$warnings=$warnings+5*$unsend;

print $fh "<h3>Outgoing Buffer</h3>";

if (open(my $listing,'-|',"ls -lF $perlvar{'lonSockDir'}/delayed")) {
    while (my $entry=<$listing>) {
        print $fh "$entry<br>";
    }
    close($listing);
}
796:
# ------------------------------------------------------------------------- End
# Weighted total: a notice counts 1, a warning 4 and an error 100.  The
# closing brace ends the block that holds the report handle $fh.
print $fh qq{<a name=errcount>\n};
$totalcount=100*$errors+4*$warnings+$notices;
errout($fh);
$now=time;
$date=localtime($now);
print $fh "<h1>Total Error Count: $totalcount</h1>",
          "<hr>$date ($now)</body></html>\n";
print "writing done\n";
}
807:
# Move the finished report into place as index.html.  A failed rename is
# reported on STDOUT, since index.html then still holds the previous report.
rename("$statusdir/newstatus.html","$statusdir/index.html")
    or print "Could not rename newstatus.html to index.html: $!\n";

# Mail the page to both configured addresses once the weighted total
# exceeds 200.
if ($totalcount>200) {
    print "mailing\n";
    $emailto="$perlvar{'lonAdmEMail'},$perlvar{'lonSysEMail'}";
    $subj="LON: $perlvar{'lonHostID'} E:$errors W:$warnings N:$notices";
    # List form: the arguments reach metasend as they are, with no shell
    # in between to re-interpret addresses or subject.
    system('metasend','-b','-t',$emailto,'-s',$subj,
           '-f',"$statusdir/index.html",'-m','text/html');
}
1;
818:
819:
820:
821:
822:
823:
824:
825:
FreeBSD-CVSweb <freebsd-cvsweb@FreeBSD.org>