--- loncom/loncron 2001/04/11 13:37:39 1.19 +++ loncom/loncron 2001/08/27 13:54:50 1.22 @@ -9,13 +9,20 @@ # # 7/14,7/15,7/19,7/21,7/22,11/18, # 2/8 Gerd Kortemeyer -# Dec 00 Scott Harrison +# 12/6/2000,12/8 Scott Harrison # 12/23 Gerd Kortemeyer -# 02/12/2001, 04/11/2001 Scott Harrison +# YEAR=2001 +# 1/10/2001, 2/12/, 2/26, 3/15, 04/11, 04/21,8/27 Scott Harrison use IO::File; use IO::Socket; +my $qflag=0; +if (@ARGV) { + my $arg=shift @ARGV; + $qflag=1 if $arg eq 'quick'; +} + # -------------------------------------------------- Non-critical communication sub reply { my ($cmd,$server)=@_; @@ -277,9 +284,8 @@ print $fh ""; # ---------------------------------------------------------------------- lonsql -# -# Do not run for now -# + +my $restartflag=1; if ($perlvar{'lonRole'} eq "library") { print $fh '
'; @@ -304,22 +310,42 @@ if ($perlvar{'lonRole'} eq "library") { chomp($lonsqlpid); if (kill 0 => $lonsqlpid) { print $fh ""; my $londfile="$perlvar{'lonDaemons'}/logs/lond.pid"; -my $restartflag=1; +$restartflag=1; if (-e $londfile) { my $lfh=IO::File->new("$londfile"); my $londpid=<$lfh>; @@ -416,13 +442,13 @@ if ($restartflag==1) { print $fh "lonsql at pid $lonsqlpid responding
"; + $restartflag=0; } else { $errors++; $errors++; print $fh "lonsql at pid $lonsqlpid not responding
"; + # Intelligently handle this. + # Possibility #1: there is no process + # Solution: remove .pid file and restart + if (getpgrp($lonsqlpid)==-1) { + unlink($lonsqlfile); + $restartflag=1; + } + else { + # Possibility #2: there is a live process that is not + # responding for an unknown reason + # Solution: kill parent and children processes, remove .pid + # and restart + `killall -9 lonsql`; + unlink($lonsqlfile); + $restartflag=1; + } } - } else { + print $fh + "Deciding to clean up stale .pid file and restart lonsql
"; + } + if ($restartflag==1) { $errors++; print $fh "lonsql not running, trying to start
"; system( "$perlvar{'lonDaemons'}/lonsql 2>>$perlvar{'lonDaemons'}/logs/lonsql_errors"); - sleep 120; + sleep 120 unless $qflag; if (-e $lonsqlfile) { print $fh "Seems like it started ..."; my $lfh=IO::File->new("$lonsqlfile"); my $lonsqlpid=<$lfh>; chomp($lonsqlpid); - sleep 30; + sleep 30 unless $qflag; if (kill 0 => $lonsqlpid) { print $fh "
lonsql at pid $lonsqlpid responding
"; } else { @@ -328,7 +354,7 @@ if ($perlvar{'lonRole'} eq "library") { print $fh "Give it one more try ..."; system( "$perlvar{'lonDaemons'}/lonsql 2>>$perlvar{'lonDaemons'}/logs/lonsql_errors"); - sleep 120; + sleep 120 unless $qflag; } } else { print $fh "Seems like that did not work!
"; @@ -381,7 +407,7 @@ print $fh "
"; my $lfh=IO::File->new("$londfile"); my $londpid=<$lfh>; chomp($londpid); - sleep 30; + sleep 30 unless $qflag; if (kill 0 => $londpid) { print $fh "
"; system( "$perlvar{'lonDaemons'}/lond 2>>$perlvar{'lonDaemons'}/logs/lond_errors"); - sleep 120; + sleep 120 unless $qflag; } } else { print $fh "Seems like that did not work!
"; @@ -519,13 +545,13 @@ if ($restartflag==1) { print $fh "
"; my $lfh=IO::File->new("$loncfile"); my $loncpid=<$lfh>; chomp($loncpid); - sleep 30; + sleep 30 unless $qflag; if (kill 0 => $loncpid) { print $fh "
"; system( "$perlvar{'lonDaemons'}/lonc 2>>$perlvar{'lonDaemons'}/logs/lonc_errors"); - sleep 120; + sleep 120 unless $qflag; } } else { print $fh "Seems like that did not work!
"; @@ -674,7 +700,8 @@ if ($totalcount>200) { $emailto="$perlvar{'lonAdmEMail'},$perlvar{'lonSysEMail'}"; $subj="LON: $perlvar{'lonHostID'} E:$errors W:$warnings N:$notices"; system( - "metasend -b -t $emailto -s '$subj' -f $statusdir/index.html -m text/html"); + "metasend -b -t $emailto -s '$subj' -f $statusdir/index.html -m text/html") + unless $qflag; } 1;