--- loncom/loncron 2002/09/09 13:59:16 1.33 +++ loncom/loncron 2003/07/30 16:49:27 1.41 @@ -9,13 +9,9 @@ # # 7/14,7/15,7/19,7/21,7/22,11/18, # 2/8 Gerd Kortemeyer -# 12/6/2000,12/8 Scott Harrison # 12/23 Gerd Kortemeyer # YEAR=2001 -# 1/10/2001, 2/12/, 2/26, 3/15, 04/11, 04/21,8/27 Scott Harrison # 09/04,09/06,11/26 Gerd Kortemeyer -# YEAR=2002 -# 5/11/2002 Scott Harrison $|=1; @@ -135,6 +131,7 @@ $date=localtime($now); { my $fh=IO::File->new(">$statusdir/newstatus.html"); +my %simplestatus=(); print $fh (<<ENDHEADERS); <html> @@ -154,6 +151,7 @@ print $fh (<<ENDHEADERS); <li><a href="#lonsql">lonsql</a> <li><a href="#lond">lond</a> <li><a href="#lonc">lonc</a> +<li><a href="#lonhttpd">lonhttpd</a> <li><a href="#lonnet">lonnet</a> <li><a href="#connections">Connections</a> <li><a href="#delayed">Delayed Messages</a> @@ -219,7 +217,7 @@ while ($line=<DFH>) { } elsif ($usage>60) { $notices++; } - if ($usage>95) { $warnings++; $warnings++ } + if ($usage>95) { $warnings++; $warnings++; $simplestatus{'diskfull'}++; } } close (DFH); print $fh "</pre>"; @@ -319,8 +317,6 @@ print $fh "</pre>"; # ---------------------------------------------------------------------- lonsql my $restartflag=1; -if ($perlvar{'lonRole'} eq "library") { - print $fh '<hr><a name="lonsql"><h2>lonsql</h2><h3>Log</h3><pre>'; print "lonsql\n"; if (-e "$perlvar{'lonDaemons'}/logs/lonsql.log"){ @@ -355,6 +351,7 @@ if ($perlvar{'lonRole'} eq "library") { } } if ($restartflag==1) { + $simplestatus{'lonsql'}='off'; $errors++; print $fh '<br><font color="red">Killall lonsql: '. system('killall lonsql').' - '; @@ -374,6 +371,7 @@ if ($perlvar{'lonRole'} eq "library") { sleep 2; if (kill 0 => $lonsqlpid) { print $fh "<h3>lonsql at pid $lonsqlpid responding</h3>"; + $simplestatus{'lonsql'}='restarted'; } else { $errors++; $errors++; print $fh "<h3>lonsql at pid $lonsqlpid not responding</h3>"; @@ -406,7 +404,7 @@ if ($perlvar{'lonRole'} eq "library") { $atime,$mtime,$ctime, $blksize,$blocks)=stat($fname); - if ($size>40000) { + if ($size>200000) { print $fh "Rotating logs ...<p>"; rename("$fname.2","$fname.3"); rename("$fname.1","$fname.2"); @@ -414,7 +412,6 @@ if ($perlvar{'lonRole'} eq "library") { } &errout($fh); -} # ------------------------------------------------------------------------ lond print $fh '<hr><a name="lond"><h2>lond</h2><h3>Log</h3><pre>'; @@ -452,6 +449,7 @@ if (-e $londfile) { } } if ($restartflag==1) { + $simplestatus{'lond'}='off'; $errors++; print $fh '<br><font color="red">Killall lond: '. system('killall lond').' - '; @@ -470,6 +468,7 @@ if ($restartflag==1) { sleep 2; if (kill 0 => $londpid) { print $fh "<h3>lond at pid $londpid responding</h3>"; + $simplestatus{'lond'}='restarted'; } else { $errors++; $errors++; print $fh "<h3>lond at pid $londpid not responding</h3>"; @@ -548,6 +547,7 @@ if (-e $loncfile) { } } if ($restartflag==1) { + $simplestatus{'lonc'}='off'; $errors++; print $fh '<br><font color="red">Killall lonc: '. system('killall lonc').' - '; @@ -566,6 +566,7 @@ if ($restartflag==1) { sleep 2; if (kill 0 => $loncpid) { print $fh "<h3>lonc at pid $loncpid responding</h3>"; + $simplestatus{'lonc'}='restarted'; } else { $errors++; $errors++; print $fh "<h3>lonc at pid $loncpid not responding</h3>"; @@ -607,6 +608,104 @@ if ($size>40000) { &errout($fh); +# -------------------------------------------------------------------- lonhttpd + +print $fh '<hr><a name="lonhttpd"><h2>lonhttpd</h2><h3>Log</h3><pre>'; +print "lonhttpd\n"; + +if (-e "$perlvar{'lonDaemons'}/logs/lonhttpd.log"){ +open (DFH,"tail -n25 $perlvar{'lonDaemons'}/logs/lonhttpd.log|"); +while ($line=<DFH>) { + print $fh "$line"; + if ($line=~/INFO/) { $notices++; } + if ($line=~/WARNING/) { $notices++; } + if ($line=~/CRITICAL/) { $warnings++; } +}; +close (DFH); +} +print $fh "</pre>"; + +my $lonhttpdfile="$perlvar{'lonDaemons'}/logs/lonhttpd.pid"; + +$restartflag=1; +if (-e $lonhttpdfile) { + my $lfh=IO::File->new("$lonhttpdfile"); + my $lonhttpdpid=<$lfh>; + chomp($lonhttpdpid); + if (kill 0 => $lonhttpdpid) { + print $fh "<h3>lonhttpd at pid $lonhttpdpid responding</h3>"; + $restartflag=0; + } else { + $errors++; + print $fh "<h3>lonhttpd at pid $lonhttpdpid not responding</h3>"; + # Solution: kill parent and children processes, remove .pid and restart + $restartflag=1; + print $fh + "<h3>Decided to clean up stale .pid file and restart lonhttpd</h3>"; + } +} +if ($restartflag==1) { + $simplestatus{'lonhttpd'}='off'; + $errors++; + print $fh '<br><font color="red">Killall lonhttpd: '. + system('killall lonhttpd').' - '; + sleep 2; + print $fh unlink($lonhttpdfile).' - '.system('killall -9 lonhttpd'). + '</font><br>'; + print $fh "<h3>lonhttpd not running, trying to start</h3>"; + system( + "$perlvar{'lonDaemons'}/lonhttpd 2>>$perlvar{'lonDaemons'}/logs/lonhttpd_errors"); + sleep 2; + if (-e $lonhttpdfile) { + print $fh "Seems like it started ...<p>"; + my $lfh=IO::File->new("$lonhttpdfile"); + my $lonhttpdpid=<$lfh>; + chomp($lonhttpdpid); + sleep 2; + if (kill 0 => $lonhttpdpid) { + print $fh "<h3>lonhttpd at pid $lonhttpdpid responding</h3>"; + $simplestatus{'lonhttpd'}='restarted'; + } else { + $errors++; $errors++; + print $fh "<h3>lonhttpd at pid $lonhttpdpid not responding</h3>"; + print $fh "Give it one more try ...<p>"; + system( + "$perlvar{'lonDaemons'}/lonhttpd 2>>$perlvar{'lonDaemons'}/logs/lonhttpd_errors"); + sleep 2; + } + } else { + print $fh "Seems like that did not work!<p>"; + $errors++; + } + if (-e "$perlvar{'lonDaemons'}/logs/lonhttpd.log") { + print $fh "<p><pre>"; + open (DFH,"tail -n100 $perlvar{'lonDaemons'}/logs/lonhttpd.log|"); + while ($line=<DFH>) { + print $fh "$line"; + if ($line=~/WARNING/) { $notices++; } + if ($line=~/CRITICAL/) { $notices++; } + }; + close (DFH); + print $fh "</pre>"; + } +} + +$fname="$perlvar{'lonDaemons'}/logs/lonhttpd.log"; + + my ($dev,$ino,$mode,$nlink, + $uid,$gid,$rdev,$size, + $atime,$mtime,$ctime, + $blksize,$blocks)=stat($fname); + +if ($size>40000) { + print $fh "Rotating logs ...<p>"; + rename("$fname.2","$fname.3"); + rename("$fname.1","$fname.2"); + rename("$fname","$fname.1"); +} + + +&errout($fh); # ---------------------------------------------------------------------- lonnet print $fh '<hr><a name="lonnet"><h2>lonnet</h2><h3>Temp Log</h3><pre>'; @@ -689,6 +788,7 @@ $unsend=0; print $fh "Total unsend messages: <b>$unsend</b><p>\n"; $warnings=$warnings+5*$unsend; +if ($unsend) { $simplestatus{'unsend'}=$unsend; } print $fh "<h3>Outgoing Buffer</h3>"; open (DFH,"ls -lF $perlvar{'lonSockDir'}/delayed|"); @@ -706,13 +806,28 @@ $now=time; $date=localtime($now); print $fh "<hr>$date ($now)</body></html>\n"; print "writing done\n"; +$fh->close(); } +if ($errors) { $simplestatus{'errors'}=$errors; } +if ($warnings) { $simplestatus{'warnings'}=$warnings; } +if ($notices) { $simplestatus{'notices'}=$notices; } +$simplestatus{'time'}=time; rename ("$statusdir/newstatus.html","$statusdir/index.html"); - +{ +my $sfh=IO::File->new(">$statusdir/loncron_simple.txt"); +foreach (keys %simplestatus) { + print $sfh $_.'='.$simplestatus{$_}.'&'; +} +print $sfh "\n"; +$sfh->close(); +} if ($totalcount>200) { print "mailing\n"; - $emailto="$perlvar{'lonAdmEMail'},$perlvar{'lonSysEMail'}"; + $emailto="$perlvar{'lonAdmEMail'}"; + if ($totalcount>1000) { + $emailto.=",$perlvar{'lonSysEMail'}"; + } $subj="LON: $perlvar{'lonHostID'} E:$errors W:$warnings N:$notices"; system( "metasend -b -t $emailto -s '$subj' -f $statusdir/index.html -m text/html");