Diff for /loncom/loncron between versions 1.29 and 1.43

version 1.29, 2002/05/27 19:21:59 version 1.43, 2003/09/11 19:49:59
Line 9 Line 9
 #  #
 # 7/14,7/15,7/19,7/21,7/22,11/18,  # 7/14,7/15,7/19,7/21,7/22,11/18,
 # 2/8 Gerd Kortemeyer  # 2/8 Gerd Kortemeyer
 # 12/6/2000,12/8 Scott Harrison  
 # 12/23 Gerd Kortemeyer  # 12/23 Gerd Kortemeyer
 # YEAR=2001  # YEAR=2001
 # 1/10/2001, 2/12/, 2/26, 3/15, 04/11, 04/21,8/27 Scott Harrison  
 # 09/04,09/06,11/26 Gerd Kortemeyer  # 09/04,09/06,11/26 Gerd Kortemeyer
 # YEAR=2002  
 # 5/11/2002 Scott Harrison  
   
 $|=1;  $|=1;
   
Line 53  sub errout { Line 49  sub errout {
 ENDERROUT  ENDERROUT
 }  }
   
   sub start_daemon {
       my ($fh,$daemon,$pidfile) = @_;
       system("$perlvar{'lonDaemons'}/$daemon 2>>$perlvar{'lonDaemons'}/logs/${daemon}_errors");
       sleep 2;
       if (-e $pidfile) {
    print $fh "Seems like it started ...<p>";
    my $lfh=IO::File->new("$pidfile");
    my $daemonpid=<$lfh>;
    chomp($daemonpid);
    sleep 2;
    if (kill 0 => $daemonpid) {
       return 1;
    } else {
       return 0;
    }
       }
       print $fh "Seems like that did not work!<p>";
       $errors++;
       return 0;
   }
   
   sub checkon_daemon {
       my ($fh,$daemon,$maxsize,$sendusr1)=@_;
   
       print $fh '<hr><a name="'.$daemon.'"><h2>'.$daemon.'</h2><h3>Log</h3><pre>';
       printf("%-10s ",$daemon);
       if (-e "$perlvar{'lonDaemons'}/logs/$daemon.log"){
    open (DFH,"tail -n25 $perlvar{'lonDaemons'}/logs/$daemon.log|");
    while ($line=<DFH>) { 
       print $fh "$line";
       if ($line=~/INFO/) { $notices++; }
       if ($line=~/WARNING/) { $notices++; }
       if ($line=~/CRITICAL/) { $warnings++; }
    };
    close (DFH);
       }
       print $fh "</pre>";
       
       my $pidfile="$perlvar{'lonDaemons'}/logs/$daemon.pid";
       
       my $restartflag=1;
       
       if (-e $pidfile) {
    my $lfh=IO::File->new("$pidfile");
    my $daemonpid=<$lfh>;
    chomp($daemonpid);
    if (kill 0 => $daemonpid) {
       print $fh "<h3>$daemon at pid $daemonpid responding";
       if ($sendusr1) { print $fh ", sending USR1"; }
       print $fh "</h3>";
       if ($sendusr1) { kill USR1 => $daemonpid; }
       $restartflag=0;
       print "running\n";
    } else {
       $errors++;
       print $fh "<h3>$daemon at pid $daemonpid not responding</h3>";
       $restartflag=1;
       print $fh "<h3>Decided to clean up stale .pid file and restart $daemon</h3>";
    }
       }
       if ($restartflag==1) {
    $simplestatus{$daemon}='off';
    $errors++;
    print $fh '<br><font color="red">Killall '.$daemon.': '.
       `killall $daemon 2>&1`.' - ';
    sleep 2;
    print $fh unlink($pidfile).' - '.
       `killall -9 $daemon 2>&1`.
       '</font><br>';
    print $fh "<h3>$daemon not running, trying to start</h3>";
   
    if (&start_daemon($fh,$daemon,$pidfile)) {
       print $fh "<h3>$daemon at pid $daemonpid responding</h3>";
       $simplestatus{$daemon}='restarted';
       print "started\n";
    } else {
       $errors++;
       print $fh "<h3>$daemon at pid $daemonpid not responding</h3>";
       print $fh "Give it one more try ...<p>";
       print " ";
       if (&start_daemon($fh,$daemon,$pidfile)) {
    print $fh "<h3>$daemon at pid $daemonpid responding</h3>";
    $simplestatus{$daemon}='restarted';
    print "started\n";
       } else {
    print " failed\n";
    $simplestatus{$daemon}='failed';
    $errors++; $errors++;
    print $fh "<h3>$daemon at pid $daemonpid not responding</h3>";
    print $fh "Unable to start $daemon<p>";
       }
    }
   
    if (-e "$perlvar{'lonDaemons'}/logs/$daemon.log"){
       print $fh "<p><pre>";
       open (DFH,"tail -n100 $perlvar{'lonDaemons'}/logs/$daemon.log|");
       while ($line=<DFH>) { 
    print $fh "$line";
    if ($line=~/WARNING/) { $notices++; }
    if ($line=~/CRITICAL/) { $notices++; }
       };
       close (DFH);
       print $fh "</pre>";
    }
       }
       
       $fname="$perlvar{'lonDaemons'}/logs/$daemon.log";
       
       my ($dev,$ino,$mode,$nlink,
    $uid,$gid,$rdev,$size,
    $atime,$mtime,$ctime,
    $blksize,$blocks)=stat($fname);
       
       if ($size>$maxsize) {
    print $fh "Rotating logs ...<p>";
    rename("$fname.2","$fname.3");
    rename("$fname.1","$fname.2");
    rename("$fname","$fname.1");
       }
   
       &errout($fh);
   }
 # ================================================================ Main Program  # ================================================================ Main Program
   
 # --------------------------------- Read loncapa_apache.conf and loncapa.conf  # --------------------------------- Read loncapa_apache.conf and loncapa.conf
 my $perlvarref=LONCAPA::Configuration::read_conf('loncapa_apache.conf',  my $perlvarref=LONCAPA::Configuration::read_conf('loncapa.conf');
                                                  'loncapa.conf');  
 %perlvar=%{$perlvarref};  %perlvar=%{$perlvarref};
 undef $perlvarref;  undef $perlvarref;
 delete $perlvar{'lonReceipt'}; # remove since sensitive and not needed  delete $perlvar{'lonReceipt'}; # remove since sensitive and not needed
Line 66  delete $perlvar{'lonSqlAccess'}; # remov Line 183  delete $perlvar{'lonSqlAccess'}; # remov
 # --------------------------------------- Make sure that LON-CAPA is configured  # --------------------------------------- Make sure that LON-CAPA is configured
 # I only test for one thing here (lonHostID).  This is just a safeguard.  # I only test for one thing here (lonHostID).  This is just a safeguard.
 if ('{[[[[lonHostID]]]]}' eq $perlvar{'lonHostID'}) {  if ('{[[[[lonHostID]]]]}' eq $perlvar{'lonHostID'}) {
    print("Unconfigured machine.\n");      print("Unconfigured machine.\n");
    $emailto=$perlvar{'lonSysEMail'};      $emailto=$perlvar{'lonSysEMail'};
    $hostname=`/bin/hostname`;      $hostname=`/bin/hostname`;
    chop $hostname;      chop $hostname;
    $hostname=~s/[^\w\.]//g; # make sure is safe to pass through shell      $hostname=~s/[^\w\.]//g; # make sure is safe to pass through shell
    $subj="LON: Unconfigured machine $hostname";      $subj="LON: Unconfigured machine $hostname";
    system("echo 'Unconfigured machine $hostname.' |\      system("echo 'Unconfigured machine $hostname.' |\
  mailto $emailto -s '$subj' > /dev/null");   mailto $emailto -s '$subj' > /dev/null");
     exit 1;      exit 1;
 }  }
Line 80  if ('{[[[[lonHostID]]]]}' eq $perlvar{'l Line 197  if ('{[[[[lonHostID]]]]}' eq $perlvar{'l
 # ----------------------------- Make sure this process is running from user=www  # ----------------------------- Make sure this process is running from user=www
 my $wwwid=getpwnam('www');  my $wwwid=getpwnam('www');
 if ($wwwid!=$<) {  if ($wwwid!=$<) {
    print("User ID mismatch.  This program must be run as user 'www'\n");      print("User ID mismatch.  This program must be run as user 'www'\n");
    $emailto="$perlvar{'lonAdmEMail'},$perlvar{'lonSysEMail'}";      $emailto="$perlvar{'lonAdmEMail'},$perlvar{'lonSysEMail'}";
    $subj="LON: $perlvar{'lonHostID'} User ID mismatch";      $subj="LON: $perlvar{'lonHostID'} User ID mismatch";
    system("echo 'User ID mismatch.  loncron must be run as user www.' |\      system("echo 'User ID mismatch.  loncron must be run as user www.' |\
  mailto $emailto -s '$subj' > /dev/null");   mailto $emailto -s '$subj' > /dev/null");
    exit 1;      exit 1;
 }  }
   
 # ------------------------------------------------------------- Read hosts file  # ------------------------------------------------------------- Read hosts file
 {  {
     my $config=IO::File->new("$perlvar{'lonTabDir'}/hosts.tab");      my $config=IO::File->new("$perlvar{'lonTabDir'}/hosts.tab");
       
     while (my $configline=<$config>) {      while (my $configline=<$config>) {
        my ($id,$domain,$role,$name,$ip)=split(/:/,$configline);   my ($id,$domain,$role,$name,$ip,$domdescr)=split(/:/,$configline);
        $hostname{$id}=$name;   if ($id && $domain && $role && $name && $ip) {
        $hostdom{$id}=$domain;      $hostname{$id}=$name;
        $hostrole{$id}=$role;      $hostdom{$id}=$domain;
        $hostip{$id}=$ip;      $hostip{$id}=$ip;
        if (($role eq 'library') && ($id ne $perlvar{'lonHostID'})) {      $hostrole{$id}=$role;
    $libserv{$id}=$name;      if ($domdescr) { $domaindescription{$domain}=$domdescr; }
        }      if (($role eq 'library') && ($id ne $perlvar{'lonHostID'})) {
    $libserv{$id}=$name;
       }
    } else {
       if ($configline) {
   # &logthis("Skipping hosts.tab line -$configline-");
       }
    }
     }      }
 }  }
   
 # ------------------------------------------------------ Read spare server file  # ------------------------------------------------------ Read spare server file
 {  {
     my $config=IO::File->new("$perlvar{'lonTabDir'}/spare.tab");      my $config=IO::File->new("$perlvar{'lonTabDir'}/spare.tab");
       
     while (my $configline=<$config>) {      while (my $configline=<$config>) {
        chomp($configline);   chomp($configline);
        if (($configline) && ($configline ne $perlvar{'lonHostID'})) {   if (($configline) && ($configline ne $perlvar{'lonHostID'})) {
           $spareid{$configline}=1;      $spareid{$configline}=1;
        }   }
     }      }
 }  }
   
Line 128  $now=time; Line 252  $now=time;
 $date=localtime($now);  $date=localtime($now);
   
 {  {
 my $fh=IO::File->new(">$statusdir/newstatus.html");      my $fh=IO::File->new(">$statusdir/newstatus.html");
       my %simplestatus=();
 print $fh (<<ENDHEADERS);      
       print $fh (<<ENDHEADERS);
 <html>  <html>
 <head>  <head>
 <title>LON Status Report $perlvar{'lonHostID'}</title>  <title>LON Status Report $perlvar{'lonHostID'}</title>
Line 148  print $fh (<<ENDHEADERS); Line 273  print $fh (<<ENDHEADERS);
 <li><a href="#lonsql">lonsql</a>  <li><a href="#lonsql">lonsql</a>
 <li><a href="#lond">lond</a>  <li><a href="#lond">lond</a>
 <li><a href="#lonc">lonc</a>  <li><a href="#lonc">lonc</a>
   <li><a href="#lonhttpd">lonhttpd</a>
 <li><a href="#lonnet">lonnet</a>  <li><a href="#lonnet">lonnet</a>
 <li><a href="#connections">Connections</a>  <li><a href="#connections">Connections</a>
 <li><a href="#delayed">Delayed Messages</a>  <li><a href="#delayed">Delayed Messages</a>
Line 160  print $fh (<<ENDHEADERS); Line 286  print $fh (<<ENDHEADERS);
 <table border=2>  <table border=2>
 ENDHEADERS  ENDHEADERS
   
 foreach $varname (keys %perlvar) {      foreach $varname (sort(keys(%perlvar))) {
     print $fh "<tr><td>$varname</td><td>$perlvar{$varname}</td></tr>\n";   print $fh "<tr><td>$varname</td><td>$perlvar{$varname}</td></tr>\n";
 }      }
 print $fh "</table><h3>Hosts</h3><table border=2>";      print $fh "</table><h3>Hosts</h3><table border=2>";
 foreach $id (keys %hostname) {      foreach $id (sort(keys(%hostname))) {
 print $fh    print $fh 
     "<tr><td>$id</td><td>$hostdom{$id}</td><td>$hostrole{$id}</td>";      "<tr><td>$id</td><td>$hostdom{$id}</td><td>$hostrole{$id}</td>";
 print $fh "<td>$hostname{$id}</td><td>$hostip{$id}</td></tr>\n";   print $fh "<td>$hostname{$id}</td><td>$hostip{$id}</td></tr>\n";
 }      }
 print $fh "</table><h3>Spare Hosts</h3><ol>";      print $fh "</table><h3>Spare Hosts</h3><ol>";
 foreach $id (keys %spareid) {      foreach $id (sort(keys(%spareid))) {
     print $fh "<li>$id\n";   print $fh "<li>$id\n";
 }      }
       
 print $fh "</ol>\n";      print $fh "</ol>\n";
   
 # --------------------------------------------------------------------- Machine  # --------------------------------------------------------------------- Machine
       
       print $fh '<hr><a name="machine"><h2>Machine Information</h2>';
       print $fh "<h3>loadavg</h3>";
       
       open (LOADAVGH,"/proc/loadavg");
       $loadavg=<LOADAVGH>;
       close (LOADAVGH);
       
       print $fh "<tt>$loadavg</tt>";
       
       @parts=split(/\s+/,$loadavg);
       if ($parts[1]>4.0) {
    $errors++;
       } elsif ($parts[1]>2.0) {
    $warnings++;
       } elsif ($parts[1]>1.0) {
    $notices++;
       }
   
 print $fh '<hr><a name="machine"><h2>Machine Information</h2>';      print $fh "<h3>df</h3>";
 print $fh "<h3>loadavg</h3>";      print $fh "<pre>";
   
 open (LOADAVGH,"/proc/loadavg");      open (DFH,"df|");
 $loadavg=<LOADAVGH>;      while ($line=<DFH>) { 
 close (LOADAVGH);   print $fh "$line"; 
    @parts=split(/\s+/,$line);
    $usage=$parts[4];
    $usage=~s/\W//g;
    if ($usage>90) { 
       $warnings++;
       $notices++; 
    } elsif ($usage>80) {
       $warnings++;
    } elsif ($usage>60) {
       $notices++;
    }
    if ($usage>95) { $warnings++; $warnings++; $simplestatus{'diskfull'}++; }
       }
       close (DFH);
       print $fh "</pre>";
   
 print $fh "<tt>$loadavg</tt>";  
   
 @parts=split(/\s+/,$loadavg);      print $fh "<h3>ps</h3>";
 if ($parts[1]>4.0) {      print $fh "<pre>";
     $errors++;      $psproc=0;
 } elsif ($parts[1]>2.0) {  
     $warnings++;      open (PSH,"ps -aux|");
 } elsif ($parts[1]>1.0) {      while ($line=<PSH>) { 
     $notices++;   print $fh "$line"; 
 }   $psproc++;
       }
 print $fh "<h3>df</h3>";      close (PSH);
 print $fh "<pre>";      print $fh "</pre>";
   
 open (DFH,"df|");  
 while ($line=<DFH>) {   
    print $fh "$line";   
    @parts=split(/\s+/,$line);  
    $usage=$parts[4];  
    $usage=~s/\W//g;  
    if ($usage>90) {   
       $warnings++;  
       $notices++;   
    } elsif ($usage>80) {  
       $warnings++;  
    } elsif ($usage>60) {  
       $notices++;  
    }  
    if ($usage>95) { $warnings++; $warnings++ }  
 }  
 close (DFH);  
 print $fh "</pre>";  
   
   
 print $fh "<h3>ps</h3>";  
 print $fh "<pre>";  
 $psproc=0;  
   
 open (PSH,"ps -aux|");  
 while ($line=<PSH>) {   
    print $fh "$line";   
    $psproc++;  
 }  
 close (PSH);  
 print $fh "</pre>";  
   
 if ($psproc>200) { $notices++; }      if ($psproc>200) { $notices++; }
 if ($psproc>250) { $notices++; }      if ($psproc>250) { $notices++; }
   
 &errout($fh);      &errout($fh);
   
 # --------------------------------------------------------------- clean out tmp  # --------------------------------------------------------------- clean out tmp
 print $fh '<hr><a name="tmp"><h2>Temporary Files</h2>';      print $fh '<hr><a name="tmp"><h2>Temporary Files</h2>';
 $cleaned=0;      $cleaned=0;
 $old=0;      $old=0;
 while ($fname=<$perlvar{'lonDaemons'}/tmp/*>) {      while ($fname=<$perlvar{'lonDaemons'}/tmp/*>) {
                           my ($dev,$ino,$mode,$nlink,   my ($dev,$ino,$mode,$nlink,
                               $uid,$gid,$rdev,$size,      $uid,$gid,$rdev,$size,
                               $atime,$mtime,$ctime,      $atime,$mtime,$ctime,
                               $blksize,$blocks)=stat($fname);      $blksize,$blocks)=stat($fname);
                           $now=time;   $now=time;
                           $since=$now-$mtime;   $since=$now-$mtime;
                           if ($since>$perlvar{'lonExpire'}) {   if ($since>$perlvar{'lonExpire'}) {
                               $line='';      $line='';
                               if (open(PROBE,$fname)) {      if (open(PROBE,$fname)) {
   $line=<PROBE>;   $line=<PROBE>;
                                   close(PROBE);   close(PROBE);
       }      }
       unless ($line=~/^CHECKOUTTOKEN\&/) {      unless ($line=~/^CHECKOUTTOKEN\&/) {
                                  $cleaned++;   $cleaned++;
                                  unlink("$fname");   unlink("$fname");
       } else {      } else {
   if ($since>100*$perlvar{'lonExpire'}) {   if ($since>365*$perlvar{'lonExpire'}) {
                                      $cleaned++;      $cleaned++;
                                      unlink("$fname");      unlink("$fname");
  } else { $old++; }   } else { $old++; }
                               }      }
                           }   }
           
 }      }
 print $fh "Cleaned up ".$cleaned." files (".$old." old checkout tokens).";      print $fh "Cleaned up ".$cleaned." files (".$old." old checkout tokens).";
   
 # ------------------------------------------------------------ clean out lonIDs  # ------------------------------------------------------------ clean out lonIDs
 print $fh '<hr><a name="tokens"><h2>Session Tokens</h2>';      print $fh '<hr><a name="tokens"><h2>Session Tokens</h2>';
 $cleaned=0;      $cleaned=0;
 $active=0;      $active=0;
 while ($fname=<$perlvar{'lonIDsDir'}/*>) {      while ($fname=<$perlvar{'lonIDsDir'}/*>) {
                           my ($dev,$ino,$mode,$nlink,   my ($dev,$ino,$mode,$nlink,
                               $uid,$gid,$rdev,$size,      $uid,$gid,$rdev,$size,
                               $atime,$mtime,$ctime,      $atime,$mtime,$ctime,
                               $blksize,$blocks)=stat($fname);      $blksize,$blocks)=stat($fname);
                           $now=time;   $now=time;
                           $since=$now-$mtime;   $since=$now-$mtime;
                           if ($since>$perlvar{'lonExpire'}) {   if ($since>$perlvar{'lonExpire'}) {
                               $cleaned++;      $cleaned++;
                               print $fh "Unlinking $fname<br>";      print $fh "Unlinking $fname<br>";
                               unlink("$fname");      unlink("$fname");
                           } else {   } else {
                               $active++;      $active++;
                           }   }
       
 }      }
 print $fh "<p>Cleaned up ".$cleaned." stale session token(s).";      print $fh "<p>Cleaned up ".$cleaned." stale session token(s).";
 print $fh "<h3>$active open session(s)</h3>";      print $fh "<h3>$active open session(s)</h3>";
   
 # ----------------------------------------------------------------------- httpd  # ----------------------------------------------------------------------- httpd
   
 print $fh '<hr><a name="httpd"><h2>httpd</h2><h3>Access Log</h3><pre>';      print $fh '<hr><a name="httpd"><h2>httpd</h2><h3>Access Log</h3><pre>';
       
       open (DFH,"tail -n25 /etc/httpd/logs/access_log|");
       while ($line=<DFH>) { print $fh "$line" };
       close (DFH);
   
 open (DFH,"tail -n25 /etc/httpd/logs/access_log|");      print $fh "</pre><h3>Error Log</h3><pre>";
 while ($line=<DFH>) { print $fh "$line" };  
 close (DFH);      open (DFH,"tail -n25 /etc/httpd/logs/error_log|");
       while ($line=<DFH>) { 
 print $fh "</pre><h3>Error Log</h3><pre>";   print $fh "$line";
    if ($line=~/\[error\]/) { $notices++; } 
 open (DFH,"tail -n25 /etc/httpd/logs/error_log|");      };
 while ($line=<DFH>) {       close (DFH);
    print $fh "$line";      print $fh "</pre>";
    if ($line=~/\[error\]/) { $notices++; }       &errout($fh);
 };  
 close (DFH);  
 print $fh "</pre>";  
 &errout($fh);  
   
   
 # ---------------------------------------------------------------------- lonsql  # ---------------------------------------------------------------------- lonsql
   
 my $restartflag=1;      &checkon_daemon($fh,'lonsql',200000);
 if ($perlvar{'lonRole'} eq "library") {  
   # ------------------------------------------------------------------------ lond
   
       &checkon_daemon($fh,'lond',40000,1);
   
   # ------------------------------------------------------------------------ lonc
   
       &checkon_daemon($fh,'lonc',40000,1);
   
     print $fh '<hr><a name="lonsql"><h2>lonsql</h2><h3>Log</h3><pre>';  # -------------------------------------------------------------------- lonhttpd
     print "lonsql\n";  
     if (-e "$perlvar{'lonDaemons'}/logs/lonsql.log"){      &checkon_daemon($fh,'lonhttpd',40000);
  open (DFH,"tail -n100 $perlvar{'lonDaemons'}/logs/lonsql.log|");  
   # ---------------------------------------------------------------------- lonnet
   
       print $fh '<hr><a name="lonnet"><h2>lonnet</h2><h3>Temp Log</h3><pre>';
       print "checking logs\n";
       if (-e "$perlvar{'lonDaemons'}/logs/lonnet.log"){
    open (DFH,"tail -n50 $perlvar{'lonDaemons'}/logs/lonnet.log|");
  while ($line=<DFH>) {    while ($line=<DFH>) { 
     print $fh "$line";      print $fh "$line";
     if ($line=~/INFO/) { $notices++; }  
     if ($line=~/WARNING/) { $notices++; }  
     if ($line=~/CRITICAL/) { $warnings++; }  
  };   };
  close (DFH);   close (DFH);
     }      }
     print $fh "</pre>";      print $fh "</pre><h3>Perm Log</h3><pre>";
           
     my $lonsqlfile="$perlvar{'lonDaemons'}/logs/lonsql.pid";      if (-e "$perlvar{'lonDaemons'}/logs/lonnet.perm.log") {
     open(DFH,"tail -n10 $perlvar{'lonDaemons'}/logs/lonnet.perm.log|");
     $restartflag=1;   while ($line=<DFH>) { 
          print $fh "$line";
     if (-e $lonsqlfile) {   };
  my $lfh=IO::File->new("$lonsqlfile");   close (DFH);
  my $lonsqlpid=<$lfh>;      } else { print $fh "No perm log\n" }
  chomp($lonsqlpid);  
  if (kill 0 => $lonsqlpid) {  
     print $fh "<h3>lonsql at pid $lonsqlpid responding</h3>";  
     $restartflag=0;  
  } else {  
     $errors++; $errors++;  
     print $fh "<h3>lonsql at pid $lonsqlpid not responding</h3>";  
  $restartflag=1;  
  print $fh   
     "<h3>Decided to clean up stale .pid file and restart lonsql</h3>";  
  }  
     }  
     if ($restartflag==1) {  
  $errors++;  
          print $fh '<br><font color="red">Killall lonsql: '.  
                     system('killall lonsql').' - ';  
                     sleep 60;  
                     print $fh unlink($lonsqlfile).' - '.  
                               system('killall -9 lonsql').  
                     '</font><br>';  
  print $fh "<h3>lonsql not running, trying to start</h3>";  
  system(  
  "$perlvar{'lonDaemons'}/lonsql 2>>$perlvar{'lonDaemons'}/logs/lonsql_errors");  
  sleep 10;  
  if (-e $lonsqlfile) {  
     print $fh "Seems like it started ...<p>";  
     my $lfh=IO::File->new("$lonsqlfile");  
     my $lonsqlpid=<$lfh>;  
     chomp($lonsqlpid);  
     sleep 30;  
     if (kill 0 => $lonsqlpid) {  
  print $fh "<h3>lonsql at pid $lonsqlpid responding</h3>";  
     } else {  
  $errors++; $errors++;  
  print $fh "<h3>lonsql at pid $lonsqlpid not responding</h3>";  
  print $fh "Give it one more try ...<p>";  
  system(  
  "$perlvar{'lonDaemons'}/lonsql 2>>$perlvar{'lonDaemons'}/logs/lonsql_errors");  
  sleep 10;  
     }  
  } else {  
     print $fh "Seems like that did not work!<p>";  
     $errors++;  
  }  
  if (-e "$perlvar{'lonDaemons'}/logs/lonsql.log"){  
     print $fh "<p><pre>";  
     open (DFH,"tail -n100 $perlvar{'lonDaemons'}/logs/lonsql.log|");  
     while ($line=<DFH>) {   
  print $fh "$line";  
  if ($line=~/WARNING/) { $notices++; }  
  if ($line=~/CRITICAL/) { $notices++; }  
     };  
     close (DFH);  
     print $fh "</pre>";  
  }  
     }  
   
     $fname="$perlvar{'lonDaemons'}/logs/lonsql.log";      $fname="$perlvar{'lonDaemons'}/logs/lonnet.log";
   
     my ($dev,$ino,$mode,$nlink,      my ($dev,$ino,$mode,$nlink,
  $uid,$gid,$rdev,$size,   $uid,$gid,$rdev,$size,
Line 407  if ($perlvar{'lonRole'} eq "library") { Line 487  if ($perlvar{'lonRole'} eq "library") {
  rename("$fname","$fname.1");   rename("$fname","$fname.1");
     }      }
   
       print $fh "</pre>";
     &errout($fh);      &errout($fh);
 }  # ----------------------------------------------------------------- Connections
 # ------------------------------------------------------------------------ lond  
   
 print $fh '<hr><a name="lond"><h2>lond</h2><h3>Log</h3><pre>';      print $fh '<hr><a name="connections"><h2>Connections</h2>';
 print "lond\n";      print "testing connections\n";
       print $fh "<table border=2>";
       foreach $tryserver (sort(keys(%hostname))) {
    print(".");
    $answer=reply("pong",$tryserver);
    if ($answer eq "$tryserver:$perlvar{'lonHostID'}") {
       $result="<b>ok</b>";
    } else {
       $result=$answer;
       $warnings++;
       if ($answer eq 'con_lost') { $warnings++; }
    }
    if ($answer =~ /con_lost/) { print(" $tryserver down\n"); }
    print $fh "<tr><td>$tryserver</td><td>$result</td></tr>\n";
   
 if (-e "$perlvar{'lonDaemons'}/logs/lond.log"){      }
 open (DFH,"tail -n25 $perlvar{'lonDaemons'}/logs/lond.log|");      print $fh "</table>";
 while ($line=<DFH>) {   
    print $fh "$line";  
    if ($line=~/INFO/) { $notices++; }  
    if ($line=~/WARNING/) { $notices++; }  
    if ($line=~/CRITICAL/) { $warnings++; }  
 };  
 close (DFH);  
 }  
 print $fh "</pre>";  
   
 my $londfile="$perlvar{'lonDaemons'}/logs/lond.pid";  
   
 $restartflag=1;  
 if (-e $londfile) {      
    my $lfh=IO::File->new("$londfile");  
    my $londpid=<$lfh>;  
    chomp($londpid);  
    if (kill 0 => $londpid) {  
       print $fh "<h3>lond at pid $londpid responding, sending USR1</h3>";  
       kill USR1 => $londpid;  
       $restartflag=0;  
    } else {  
       $errors++;  
       print $fh "<h3>lond at pid $londpid not responding</h3>";  
       $restartflag=1;  
       print $fh   
   "<h3>Decided to clean up stale .pid file and restart lond</h3>";  
    }  
 }   
 if ($restartflag==1) {  
    $errors++;  
   print $fh '<br><font color="red">Killall lond: '.  
                     system('killall lond').' - ';  
           sleep 60;  
           print $fh unlink($londfile).' - '.system('killall -9 lond').  
                     '</font><br>';  
    print $fh "<h3>lond not running, trying to start</h3>";  
    system(  
      "$perlvar{'lonDaemons'}/lond 2>>$perlvar{'lonDaemons'}/logs/lond_errors");  
    sleep 10;  
    if (-e $londfile) {  
        print $fh "Seems like it started ...<p>";  
        my $lfh=IO::File->new("$londfile");  
        my $londpid=<$lfh>;  
        chomp($londpid);  
        sleep 30;  
        if (kill 0 => $londpid) {  
           print $fh "<h3>lond at pid $londpid responding</h3>";  
        } else {  
           $errors++; $errors++;  
           print $fh "<h3>lond at pid $londpid not responding</h3>";  
           print $fh "Give it one more try ...<p>";  
   system(  
  "$perlvar{'lonDaemons'}/lond 2>>$perlvar{'lonDaemons'}/logs/lond_errors");  
           sleep 10;  
        }  
    } else {  
        print $fh "Seems like that did not work!<p>";  
        $errors++;  
    }  
    if (-e "$perlvar{'lonDaemons'}/logs/lond.log"){  
     print $fh "<p><pre>";  
     open (DFH,"tail -n100 $perlvar{'lonDaemons'}/logs/lond.log|");  
     while ($line=<DFH>) {   
       print $fh "$line";  
       if ($line=~/WARNING/) { $notices++; }  
       if ($line=~/CRITICAL/) { $notices++; }  
     };  
     close (DFH);  
     print $fh "</pre>";  
    }  
 }  
   
 $fname="$perlvar{'lonDaemons'}/logs/lond.log";      &errout($fh);
   # ------------------------------------------------------------ Delayed messages
   
                           my ($dev,$ino,$mode,$nlink,      print $fh '<hr><a name="delayed"><h2>Delayed Messages</h2>';
                               $uid,$gid,$rdev,$size,      print "checking buffers\n";
                               $atime,$mtime,$ctime,  
                               $blksize,$blocks)=stat($fname);  
   
 if ($size>40000) {      print $fh '<h3>Scanning Permanent Log</h3>';
     print $fh "Rotating logs ...<p>";  
     rename("$fname.2","$fname.3");  
     rename("$fname.1","$fname.2");  
     rename("$fname","$fname.1");  
 }  
   
 &errout($fh);      $unsend=0;
 # ------------------------------------------------------------------------ lonc      {
    my $dfh=IO::File->new("$perlvar{'lonDaemons'}/logs/lonnet.perm.log");
    while ($line=<$dfh>) {
       ($time,$sdf,$dserv,$dcmd)=split(/:/,$line);
       if ($sdf eq 'F') { 
    $local=localtime($time);
    print $fh "<b>Failed: $time, $dserv, $dcmd</b><br>";
    $warnings++;
       }
       if ($sdf eq 'S') { $unsend--; }
       if ($sdf eq 'D') { $unsend++; }
    }
       }
       print $fh "Total unsend messages: <b>$unsend</b><p>\n";
       $warnings=$warnings+5*$unsend;
   
 print $fh '<hr><a name="lonc"><h2>lonc</h2><h3>Log</h3><pre>';      if ($unsend) { $simplestatus{'unsend'}=$unsend; }
 print "lonc\n";      print $fh "<h3>Outgoing Buffer</h3>";
   
 if (-e "$perlvar{'lonDaemons'}/logs/lonc.log"){      open (DFH,"ls -lF $perlvar{'lonSockDir'}/delayed|");
 open (DFH,"tail -n25 $perlvar{'lonDaemons'}/logs/lonc.log|");  
 while ($line=<DFH>) {   
    print $fh "$line";  
    if ($line=~/INFO/) { $notices++; }  
    if ($line=~/WARNING/) { $notices++; }  
    if ($line=~/CRITICAL/) { $warnings++; }  
 };  
 close (DFH);  
 }  
 print $fh "</pre>";  
   
 my $loncfile="$perlvar{'lonDaemons'}/logs/lonc.pid";  
   
 $restartflag=1;  
 if (-e $loncfile) {  
    my $lfh=IO::File->new("$loncfile");  
    my $loncpid=<$lfh>;  
    chomp($loncpid);  
    if (kill 0 => $loncpid) {  
       print $fh "<h3>lonc at pid $loncpid responding, sending USR1</h3>";  
       kill USR1 => $loncpid;  
       $restartflag=0;  
    } else {  
       $errors++;  
       print $fh "<h3>lonc at pid $loncpid not responding</h3>";  
       # Solution: kill parent and children processes, remove .pid and restart  
   $restartflag=1;  
       print $fh   
   "<h3>Decided to clean up stale .pid file and restart lonc</h3>";  
    }  
 }   
 if ($restartflag==1) {  
    $errors++;  
   print $fh '<br><font color="red">Killall lonc: '.  
             system('killall lonc').' - ';  
           sleep 60;  
           print $fh unlink($loncfile).' - '.system('killall -9 lonc').  
                     '</font><br>';  
    print $fh "<h3>lonc not running, trying to start</h3>";  
  system(  
  "$perlvar{'lonDaemons'}/lonc 2>>$perlvar{'lonDaemons'}/logs/lonc_errors");  
    sleep 10;  
    if (-e $loncfile) {  
        print $fh "Seems like it started ...<p>";  
        my $lfh=IO::File->new("$loncfile");  
        my $loncpid=<$lfh>;  
        chomp($loncpid);  
        sleep 30;  
        if (kill 0 => $loncpid) {  
           print $fh "<h3>lonc at pid $loncpid responding</h3>";  
        } else {  
           $errors++; $errors++;  
           print $fh "<h3>lonc at pid $loncpid not responding</h3>";  
           print $fh "Give it one more try ...<p>";  
    system(  
  "$perlvar{'lonDaemons'}/lonc 2>>$perlvar{'lonDaemons'}/logs/lonc_errors");  
           sleep 10;  
        }  
    } else {  
        print $fh "Seems like that did not work!<p>";  
        $errors++;  
    }  
    if (-e "$perlvar{'lonDaemons'}/logs/lonc.log") {  
     print $fh "<p><pre>";  
     open (DFH,"tail -n100 $perlvar{'lonDaemons'}/logs/lonc.log|");  
     while ($line=<DFH>) {       while ($line=<DFH>) { 
       print $fh "$line";   print $fh "$line<br>";
       if ($line=~/WARNING/) { $notices++; }  
       if ($line=~/CRITICAL/) { $notices++; }  
     };      };
     close (DFH);      close (DFH);
     print $fh "</pre>";  
    }  
 }  
   
 $fname="$perlvar{'lonDaemons'}/logs/lonc.log";  
   
                           my ($dev,$ino,$mode,$nlink,  
                               $uid,$gid,$rdev,$size,  
                               $atime,$mtime,$ctime,  
                               $blksize,$blocks)=stat($fname);  
   
 if ($size>40000) {  
     print $fh "Rotating logs ...<p>";  
     rename("$fname.2","$fname.3");  
     rename("$fname.1","$fname.2");  
     rename("$fname","$fname.1");  
 }  
   
      
 &errout($fh);  
 # ---------------------------------------------------------------------- lonnet  
   
 print $fh '<hr><a name="lonnet"><h2>lonnet</h2><h3>Temp Log</h3><pre>';  
 print "lonnet\n";  
 if (-e "$perlvar{'lonDaemons'}/logs/lonnet.log"){  
 open (DFH,"tail -n50 $perlvar{'lonDaemons'}/logs/lonnet.log|");  
 while ($line=<DFH>) {   
     print $fh "$line";  
 };  
 close (DFH);  
 }  
 print $fh "</pre><h3>Perm Log</h3><pre>";  
   
 if (-e "$perlvar{'lonDaemons'}/logs/lonnet.perm.log") {  
     open(DFH,"tail -n10 $perlvar{'lonDaemons'}/logs/lonnet.perm.log|");  
 while ($line=<DFH>) {   
    print $fh "$line";  
 };  
 close (DFH);  
 } else { print $fh "No perm log\n" }  
   
 $fname="$perlvar{'lonDaemons'}/logs/lonnet.log";  
   
                           my ($dev,$ino,$mode,$nlink,  
                               $uid,$gid,$rdev,$size,  
                               $atime,$mtime,$ctime,  
                               $blksize,$blocks)=stat($fname);  
   
 if ($size>40000) {  
     print $fh "Rotating logs ...<p>";  
     rename("$fname.2","$fname.3");  
     rename("$fname.1","$fname.2");  
     rename("$fname","$fname.1");  
 }  
   
 print $fh "</pre>";  
 &errout($fh);  
 # ----------------------------------------------------------------- Connections  
   
 print $fh '<hr><a name="connections"><h2>Connections</h2>';  
   
 print $fh "<table border=2>";  
 foreach $tryserver (keys %hostname) {  
   
     $answer=reply("pong",$tryserver);  
     if ($answer eq "$tryserver:$perlvar{'lonHostID'}") {  
  $result="<b>ok</b>";  
     } else {  
         $result=$answer;  
         $warnings++;  
         if ($answer eq 'con_lost') { $warnings++; }  
     }  
     print $fh "<tr><td>$tryserver</td><td>$result</td></tr>\n";  
   
 }  
 print $fh "</table>";  
   
 &errout($fh);  
 # ------------------------------------------------------------ Delayed messages  
   
 print $fh '<hr><a name="delayed"><h2>Delayed Messages</h2>';  
 print "buffers\n";  
   
 print $fh '<h3>Scanning Permanent Log</h3>';  
   
 $unsend=0;  
 {  
     my $dfh=IO::File->new("$perlvar{'lonDaemons'}/logs/lonnet.perm.log");  
     while ($line=<$dfh>) {  
  ($time,$sdf,$dserv,$dcmd)=split(/:/,$line);  
         if ($sdf eq 'F') {   
     $local=localtime($time);  
             print "<b>Failed: $time, $dserv, $dcmd</b><br>";  
             $warnings++;  
         }  
         if ($sdf eq 'S') { $unsend--; }  
         if ($sdf eq 'D') { $unsend++; }  
     }  
 }  
 print $fh "Total unsend messages: <b>$unsend</b><p>\n";  
 $warnings=$warnings+5*$unsend;  
   
 print $fh "<h3>Outgoing Buffer</h3>";  
   
 open (DFH,"ls -lF $perlvar{'lonSockDir'}/delayed|");  
 while ($line=<DFH>) {   
     print $fh "$line<br>";  
 };  
 close (DFH);  
   
 # ------------------------------------------------------------------------- End  # ------------------------------------------------------------------------- End
 print $fh "<a name=errcount>\n";      print $fh "<a name=errcount>\n";
 $totalcount=$notices+4*$warnings+100*$errors;      $totalcount=$notices+4*$warnings+100*$errors;
 &errout($fh);      &errout($fh);
 print $fh "<h1>Total Error Count: $totalcount</h1>";      print $fh "<h1>Total Error Count: $totalcount</h1>";
 $now=time;      $now=time;
 $date=localtime($now);      $date=localtime($now);
 print $fh "<hr>$date ($now)</body></html>\n";      print $fh "<hr>$date ($now)</body></html>\n";
 print "writing done\n";      print "lon-status webpage updated\n";
 }      $fh->close();
   }
   if ($errors) { $simplestatus{'errors'}=$errors; }
   if ($warnings) { $simplestatus{'warnings'}=$warnings; }
   if ($notices) { $simplestatus{'notices'}=$notices; }
   $simplestatus{'time'}=time;
   
 rename ("$statusdir/newstatus.html","$statusdir/index.html");  rename ("$statusdir/newstatus.html","$statusdir/index.html");
   {
       my $sfh=IO::File->new(">$statusdir/loncron_simple.txt");
       foreach (keys %simplestatus) {
    print $sfh $_.'='.$simplestatus{$_}.'&';
       }
       print $sfh "\n";
       $sfh->close();
   }
 if ($totalcount>200) {  if ($totalcount>200) {
    print "mailing\n";      print "sending mail\n";
    $emailto="$perlvar{'lonAdmEMail'},$perlvar{'lonSysEMail'}";      $emailto="$perlvar{'lonAdmEMail'}";
    $subj="LON: $perlvar{'lonHostID'} E:$errors W:$warnings N:$notices";       if ($totalcount>1000) {
    system(   $emailto.=",$perlvar{'lonSysEMail'}";
  "metasend -b -t $emailto -s '$subj' -f $statusdir/index.html -m text/html");      }
       $subj="LON: $perlvar{'lonHostID'} E:$errors W:$warnings N:$notices"; 
       system("metasend -b -t $emailto -s '$subj' -f $statusdir/index.html -m text/html");
 }  }
 1;  1;
   

Removed from v.1.29  
changed lines
  Added in v.1.43


FreeBSD-CVSweb <freebsd-cvsweb@FreeBSD.org>