Annotation of loncom/loncron, revision 1.37

1.1       albertel    1: #!/usr/bin/perl
                      2: 
                      3: # The LearningOnline Network
                      4: # Housekeeping program, started by cron
                      5: #
                      6: # (TCP networking package
                      7: # 6/1/99,6/2,6/10,6/11,6/12,6/14,6/26,6/28,6/29,6/30,
                      8: # 7/1,7/2,7/9,7/10,7/12 Gerd Kortemeyer)
                      9: #
1.3       www        10: # 7/14,7/15,7/19,7/21,7/22,11/18,
                     11: # 2/8 Gerd Kortemeyer
1.11      www        12: # 12/23 Gerd Kortemeyer
1.22      harris41   13: # YEAR=2001
1.25      www        14: # 09/04,09/06,11/26 Gerd Kortemeyer
1.24      www        15: 
                     16: $|=1;
1.1       albertel   17: 
1.26      harris41   18: use lib '/home/httpd/lib/perl/';
                     19: use LONCAPA::Configuration;
                     20: 
1.1       albertel   21: use IO::File;
                     22: use IO::Socket;
                     23: 
                     24: # -------------------------------------------------- Non-critical communication
                     25: sub reply {
                     26:     my ($cmd,$server)=@_;
                     27:     my $peerfile="$perlvar{'lonSockDir'}/$server";
                     28:     my $client=IO::Socket::UNIX->new(Peer    =>"$peerfile",
                     29:                                      Type    => SOCK_STREAM,
                     30:                                      Timeout => 10)
                     31:        or return "con_lost";
                     32:     print $client "$cmd\n";
                     33:     my $answer=<$client>;
                     34:     chomp($answer);
                     35:     if (!$answer) { $answer="con_lost"; }
                     36:     return $answer;
                     37: }
                     38: 
                     39: # --------------------------------------------------------- Output error status
                     40: 
                     41: sub errout {
                     42:    my $fh=shift;
                     43:    print $fh (<<ENDERROUT);
                     44:      <p><table border=2 bgcolor="#CCCCCC">
                     45:      <tr><td>Notices</td><td>$notices</td></tr>
                     46:      <tr><td>Warnings</td><td>$warnings</td></tr>
                     47:      <tr><td>Errors</td><td>$errors</td></tr>
                     48:      </table><p><a href="#top">Top</a><p>
                     49: ENDERROUT
                     50: }
                     51: 
                     52: # ================================================================ Main Program
                     53: 
1.27      matthew    54: # --------------------------------- Read loncapa_apache.conf and loncapa.conf
# Load the configuration returned by read_conf('loncapa.conf') into the
# global %perlvar, release the reference, and drop the two entries that
# are sensitive and not needed by this script.
my $perlvarref=LONCAPA::Configuration::read_conf('loncapa.conf');
%perlvar=%$perlvarref;
undef $perlvarref;
delete @perlvar{'lonReceipt','lonSqlAccess'}; # sensitive and not needed
1.13      harris41   60: 
1.14      harris41   61: # --------------------------------------- Make sure that LON-CAPA is configured
                     62: # I only test for one thing here (lonHostID).  This is just a safeguard.
                     63: if ('{[[[[lonHostID]]]]}' eq $perlvar{'lonHostID'}) {
1.15      harris41   64:    print("Unconfigured machine.\n");
1.14      harris41   65:    $emailto=$perlvar{'lonSysEMail'};
                     66:    $hostname=`/bin/hostname`;
                     67:    chop $hostname;
                     68:    $hostname=~s/[^\w\.]//g; # make sure is safe to pass through shell
                     69:    $subj="LON: Unconfigured machine $hostname";
                     70:    system("echo 'Unconfigured machine $hostname.' |\
                     71:  mailto $emailto -s '$subj' > /dev/null");
                     72:     exit 1;
                     73: }
                     74: 
1.13      harris41   75: # ----------------------------- Make sure this process is running from user=www
                     76: my $wwwid=getpwnam('www');
                     77: if ($wwwid!=$<) {
1.14      harris41   78:    print("User ID mismatch.  This program must be run as user 'www'\n");
1.13      harris41   79:    $emailto="$perlvar{'lonAdmEMail'},$perlvar{'lonSysEMail'}";
                     80:    $subj="LON: $perlvar{'lonHostID'} User ID mismatch";
                     81:    system("echo 'User ID mismatch.  loncron must be run as user www.' |\
                     82:  mailto $emailto -s '$subj' > /dev/null");
1.14      harris41   83:    exit 1;
1.1       albertel   84: }
                     85: 
                     86: # ------------------------------------------------------------- Read hosts file
                     87: {
                     88:     my $config=IO::File->new("$perlvar{'lonTabDir'}/hosts.tab");
                     89: 
                     90:     while (my $configline=<$config>) {
1.31      albertel   91: 	my ($id,$domain,$role,$name,$ip,$domdescr)=split(/:/,$configline);
                     92: 	if ($id && $domain && $role && $name && $ip) {
                     93: 	    $hostname{$id}=$name;
                     94: 	    $hostdom{$id}=$domain;
                     95: 	    $hostip{$id}=$ip;
                     96: 	    $hostrole{$id}=$role;
                     97: 	    if ($domdescr) { $domaindescription{$domain}=$domdescr; }
                     98: 	    if (($role eq 'library') && ($id ne $perlvar{'lonHostID'})) {
                     99: 		$libserv{$id}=$name;
                    100: 	    }
                    101: 	} else {
                    102: 	    if ($configline) {
                    103: #		&logthis("Skipping hosts.tab line -$configline-");
                    104: 	    }
                    105: 	}
1.1       albertel  106:     }
                    107: }
                    108: 
                    109: # ------------------------------------------------------ Read spare server file
                    110: {
                    111:     my $config=IO::File->new("$perlvar{'lonTabDir'}/spare.tab");
                    112: 
                    113:     while (my $configline=<$config>) {
                    114:        chomp($configline);
                    115:        if (($configline) && ($configline ne $perlvar{'lonHostID'})) {
                    116:           $spareid{$configline}=1;
                    117:        }
                    118:     }
                    119: }
                    120: 
                    121: # ---------------------------------------------------------------- Start report
                    122: 
                    123: $statusdir="/home/httpd/html/lon-status";
                    124: 
                    125: $errors=0;
                    126: $warnings=0;
                    127: $notices=0;
                    128: 
                    129: $now=time;
                    130: $date=localtime($now);
                    131: 
                    132: {
                    133: my $fh=IO::File->new(">$statusdir/newstatus.html");
                    134: 
                    135: print $fh (<<ENDHEADERS);
                    136: <html>
                    137: <head>
                    138: <title>LON Status Report $perlvar{'lonHostID'}</title>
                    139: </head>
1.3       www       140: <body bgcolor="#AAAAAA">
1.1       albertel  141: <a name="top">
                    142: <h1>LON Status Report $perlvar{'lonHostID'}</h1>
                    143: <h2>$date ($now)</h2>
                    144: <ol>
                    145: <li><a href="#configuration">Configuration</a>
                    146: <li><a href="#machine">Machine Information</a>
1.11      www       147: <li><a href="#tmp">Temporary Files</a>
                    148: <li><a href="#tokens">Session Tokens</a>
1.1       albertel  149: <li><a href="#httpd">httpd</a>
1.11      www       150: <li><a href="#lonsql">lonsql</a>
1.1       albertel  151: <li><a href="#lond">lond</a>
                    152: <li><a href="#lonc">lonc</a>
1.34      www       153: <li><a href="#lonhttpd">lonhttpd</a>
1.1       albertel  154: <li><a href="#lonnet">lonnet</a>
                    155: <li><a href="#connections">Connections</a>
                    156: <li><a href="#delayed">Delayed Messages</a>
                    157: <li><a href="#errcount">Error Count</a>
                    158: </ol>
                    159: <hr>
                    160: <a name="configuration">
                    161: <h2>Configuration</h2>
                    162: <h3>PerlVars</h3>
                    163: <table border=2>
                    164: ENDHEADERS
                    165: 
1.31      albertel  166: foreach $varname (sort(keys(%perlvar))) {
1.1       albertel  167:     print $fh "<tr><td>$varname</td><td>$perlvar{$varname}</td></tr>\n";
                    168: }
                    169: print $fh "</table><h3>Hosts</h3><table border=2>";
1.31      albertel  170: foreach $id (sort(keys(%hostname))) {
                    171:     print $fh 
                    172: 	"<tr><td>$id</td><td>$hostdom{$id}</td><td>$hostrole{$id}</td>";
                    173:     print $fh "<td>$hostname{$id}</td><td>$hostip{$id}</td></tr>\n";
1.1       albertel  174: }
                    175: print $fh "</table><h3>Spare Hosts</h3><ol>";
1.31      albertel  176: foreach $id (sort(keys(%spareid))) {
1.1       albertel  177:     print $fh "<li>$id\n";
                    178: }
                    179: 
                    180: print $fh "</ol>\n";
                    181: 
                    182: # --------------------------------------------------------------------- Machine
                    183: 
                    184: print $fh '<hr><a name="machine"><h2>Machine Information</h2>';
                    185: print $fh "<h3>loadavg</h3>";
                    186: 
                    187: open (LOADAVGH,"/proc/loadavg");
                    188: $loadavg=<LOADAVGH>;
                    189: close (LOADAVGH);
                    190: 
                    191: print $fh "<tt>$loadavg</tt>";
                    192: 
                    193: @parts=split(/\s+/,$loadavg);
1.4       www       194: if ($parts[1]>4.0) {
1.1       albertel  195:     $errors++;
                    196: } elsif ($parts[1]>2.0) {
                    197:     $warnings++;
                    198: } elsif ($parts[1]>1.0) {
                    199:     $notices++;
                    200: }
                    201: 
                    202: print $fh "<h3>df</h3>";
                    203: print $fh "<pre>";
                    204: 
                    205: open (DFH,"df|");
                    206: while ($line=<DFH>) { 
                    207:    print $fh "$line"; 
                    208:    @parts=split(/\s+/,$line);
                    209:    $usage=$parts[4];
                    210:    $usage=~s/\W//g;
                    211:    if ($usage>90) { 
1.24      www       212:       $warnings++;
                    213:       $notices++; 
1.1       albertel  214:    } elsif ($usage>80) {
                    215:       $warnings++;
                    216:    } elsif ($usage>60) {
                    217:       $notices++;
                    218:    }
1.4       www       219:    if ($usage>95) { $warnings++; $warnings++ }
1.1       albertel  220: }
                    221: close (DFH);
                    222: print $fh "</pre>";
1.24      www       223: 
                    224: 
                    225: print $fh "<h3>ps</h3>";
                    226: print $fh "<pre>";
                    227: $psproc=0;
                    228: 
                    229: open (PSH,"ps -aux|");
                    230: while ($line=<PSH>) { 
                    231:    print $fh "$line"; 
                    232:    $psproc++;
                    233: }
                    234: close (PSH);
                    235: print $fh "</pre>";
                    236: 
                    237: if ($psproc>200) { $notices++; }
                    238: if ($psproc>250) { $notices++; }
                    239: 
1.1       albertel  240: &errout($fh);
1.11      www       241: 
                    242: # --------------------------------------------------------------- clean out tmp
                    243: print $fh '<hr><a name="tmp"><h2>Temporary Files</h2>';
                    244: $cleaned=0;
1.29      www       245: $old=0;
1.11      www       246: while ($fname=<$perlvar{'lonDaemons'}/tmp/*>) {
                    247:                           my ($dev,$ino,$mode,$nlink,
                    248:                               $uid,$gid,$rdev,$size,
                    249:                               $atime,$mtime,$ctime,
                    250:                               $blksize,$blocks)=stat($fname);
                    251:                           $now=time;
                    252:                           $since=$now-$mtime;
                    253:                           if ($since>$perlvar{'lonExpire'}) {
1.29      www       254:                               $line='';
                    255:                               if (open(PROBE,$fname)) {
                    256: 				  $line=<PROBE>;
                    257:                                   close(PROBE);
                    258: 			      }
                    259: 			      unless ($line=~/^CHECKOUTTOKEN\&/) {
                    260:                                  $cleaned++;
                    261:                                  unlink("$fname");
                    262: 			      } else {
1.32      www       263: 				  if ($since>365*$perlvar{'lonExpire'}) {
1.29      www       264:                                      $cleaned++;
                    265:                                      unlink("$fname");
                    266: 				 } else { $old++; }
                    267:                               }
1.11      www       268:                           }
                    269:     
                    270: }
1.29      www       271: print $fh "Cleaned up ".$cleaned." files (".$old." old checkout tokens).";
1.11      www       272: 
                    273: # ------------------------------------------------------------ clean out lonIDs
                    274: print $fh '<hr><a name="tokens"><h2>Session Tokens</h2>';
                    275: $cleaned=0;
                    276: $active=0;
                    277: while ($fname=<$perlvar{'lonIDsDir'}/*>) {
                    278:                           my ($dev,$ino,$mode,$nlink,
                    279:                               $uid,$gid,$rdev,$size,
                    280:                               $atime,$mtime,$ctime,
                    281:                               $blksize,$blocks)=stat($fname);
                    282:                           $now=time;
                    283:                           $since=$now-$mtime;
                    284:                           if ($since>$perlvar{'lonExpire'}) {
                    285:                               $cleaned++;
                    286:                               print $fh "Unlinking $fname<br>";
                    287:                               unlink("$fname");
                    288:                           } else {
                    289:                               $active++;
                    290:                           }
                    291:     
                    292: }
                    293: print $fh "<p>Cleaned up ".$cleaned." stale session token(s).";
                    294: print $fh "<h3>$active open session(s)</h3>";
                    295: 
1.1       albertel  296: # ----------------------------------------------------------------------- httpd
                    297: 
                    298: print $fh '<hr><a name="httpd"><h2>httpd</h2><h3>Access Log</h3><pre>';
                    299: 
1.23      www       300: open (DFH,"tail -n25 /etc/httpd/logs/access_log|");
1.1       albertel  301: while ($line=<DFH>) { print $fh "$line" };
                    302: close (DFH);
                    303: 
                    304: print $fh "</pre><h3>Error Log</h3><pre>";
                    305: 
1.23      www       306: open (DFH,"tail -n25 /etc/httpd/logs/error_log|");
1.1       albertel  307: while ($line=<DFH>) { 
                    308:    print $fh "$line";
                    309:    if ($line=~/\[error\]/) { $notices++; } 
                    310: };
                    311: close (DFH);
                    312: print $fh "</pre>";
                    313: &errout($fh);
1.5       harris41  314: 
                    315: 
1.11      www       316: # ---------------------------------------------------------------------- lonsql
1.22      harris41  317: 
                    318: my $restartflag=1;
1.18      harris41  319: if ($perlvar{'lonRole'} eq "library") {
1.5       harris41  320: 
1.11      www       321:     print $fh '<hr><a name="lonsql"><h2>lonsql</h2><h3>Log</h3><pre>';
1.23      www       322:     print "lonsql\n";
1.5       harris41  323:     if (-e "$perlvar{'lonDaemons'}/logs/lonsql.log"){
                    324: 	open (DFH,"tail -n100 $perlvar{'lonDaemons'}/logs/lonsql.log|");
                    325: 	while ($line=<DFH>) { 
                    326: 	    print $fh "$line";
                    327: 	    if ($line=~/INFO/) { $notices++; }
                    328: 	    if ($line=~/WARNING/) { $notices++; }
                    329: 	    if ($line=~/CRITICAL/) { $warnings++; }
                    330: 	};
                    331: 	close (DFH);
                    332:     }
                    333:     print $fh "</pre>";
                    334:     
                    335:     my $lonsqlfile="$perlvar{'lonDaemons'}/logs/lonsql.pid";
1.23      www       336:  
                    337:     $restartflag=1;
                    338:    
1.5       harris41  339:     if (-e $lonsqlfile) {
                    340: 	my $lfh=IO::File->new("$lonsqlfile");
                    341: 	my $lonsqlpid=<$lfh>;
                    342: 	chomp($lonsqlpid);
                    343: 	if (kill 0 => $lonsqlpid) {
                    344: 	    print $fh "<h3>lonsql at pid $lonsqlpid responding</h3>";
1.22      harris41  345: 	    $restartflag=0;
1.5       harris41  346: 	} else {
                    347: 	    $errors++; $errors++;
                    348: 	    print $fh "<h3>lonsql at pid $lonsqlpid not responding</h3>";
1.22      harris41  349: 		$restartflag=1;
1.23      www       350: 	print $fh 
                    351: 	    "<h3>Decided to clean up stale .pid file and restart lonsql</h3>";
1.5       harris41  352: 	}
1.22      harris41  353:     }
                    354:     if ($restartflag==1) {
1.5       harris41  355: 	$errors++;
1.23      www       356: 	         print $fh '<br><font color="red">Killall lonsql: '.
                    357:                     system('killall lonsql').' - ';
1.30      albertel  358:                     sleep 2;
1.23      www       359:                     print $fh unlink($lonsqlfile).' - '.
                    360:                               system('killall -9 lonsql').
                    361:                     '</font><br>';
1.5       harris41  362: 	print $fh "<h3>lonsql not running, trying to start</h3>";
1.16      harris41  363: 	system(
                    364:  "$perlvar{'lonDaemons'}/lonsql 2>>$perlvar{'lonDaemons'}/logs/lonsql_errors");
1.30      albertel  365: 	sleep 2;
1.5       harris41  366: 	if (-e $lonsqlfile) {
                    367: 	    print $fh "Seems like it started ...<p>";
                    368: 	    my $lfh=IO::File->new("$lonsqlfile");
                    369: 	    my $lonsqlpid=<$lfh>;
                    370: 	    chomp($lonsqlpid);
1.30      albertel  371: 	    sleep 2;
1.5       harris41  372: 	    if (kill 0 => $lonsqlpid) {
                    373: 		print $fh "<h3>lonsql at pid $lonsqlpid responding</h3>";
                    374: 	    } else {
                    375: 		$errors++; $errors++;
                    376: 		print $fh "<h3>lonsql at pid $lonsqlpid not responding</h3>";
                    377: 		print $fh "Give it one more try ...<p>";
1.16      harris41  378: 		system(
                    379:  "$perlvar{'lonDaemons'}/lonsql 2>>$perlvar{'lonDaemons'}/logs/lonsql_errors");
1.30      albertel  380: 		sleep 2;
1.5       harris41  381: 	    }
                    382: 	} else {
                    383: 	    print $fh "Seems like that did not work!<p>";
                    384: 	    $errors++;
                    385: 	}
                    386: 	if (-e "$perlvar{'lonDaemons'}/logs/lonsql.log"){
                    387: 	    print $fh "<p><pre>";
                    388: 	    open (DFH,"tail -n100 $perlvar{'lonDaemons'}/logs/lonsql.log|");
                    389: 	    while ($line=<DFH>) { 
                    390: 		print $fh "$line";
                    391: 		if ($line=~/WARNING/) { $notices++; }
                    392: 		if ($line=~/CRITICAL/) { $notices++; }
                    393: 	    };
                    394: 	    close (DFH);
                    395: 	    print $fh "</pre>";
                    396: 	}
                    397:     }
                    398: 
                    399:     $fname="$perlvar{'lonDaemons'}/logs/lonsql.log";
                    400: 
                    401:     my ($dev,$ino,$mode,$nlink,
                    402: 	$uid,$gid,$rdev,$size,
                    403: 	$atime,$mtime,$ctime,
                    404: 	$blksize,$blocks)=stat($fname);
                    405: 
                    406:     if ($size>40000) {
                    407: 	print $fh "Rotating logs ...<p>";
                    408: 	rename("$fname.2","$fname.3");
                    409: 	rename("$fname.1","$fname.2");
                    410: 	rename("$fname","$fname.1");
                    411:     }
                    412: 
                    413:     &errout($fh);
                    414: }
1.1       albertel  415: # ------------------------------------------------------------------------ lond
                    416: 
                    417: print $fh '<hr><a name="lond"><h2>lond</h2><h3>Log</h3><pre>';
1.23      www       418: print "lond\n";
1.1       albertel  419: 
                    420: if (-e "$perlvar{'lonDaemons'}/logs/lond.log"){
1.23      www       421: open (DFH,"tail -n25 $perlvar{'lonDaemons'}/logs/lond.log|");
1.1       albertel  422: while ($line=<DFH>) { 
                    423:    print $fh "$line";
1.3       www       424:    if ($line=~/INFO/) { $notices++; }
1.4       www       425:    if ($line=~/WARNING/) { $notices++; }
                    426:    if ($line=~/CRITICAL/) { $warnings++; }
1.1       albertel  427: };
                    428: close (DFH);
                    429: }
                    430: print $fh "</pre>";
                    431: 
                    432: my $londfile="$perlvar{'lonDaemons'}/logs/lond.pid";
                    433: 
1.22      harris41  434: $restartflag=1;
1.7       harris41  435: if (-e $londfile) {    
1.1       albertel  436:    my $lfh=IO::File->new("$londfile");
                    437:    my $londpid=<$lfh>;
                    438:    chomp($londpid);
                    439:    if (kill 0 => $londpid) {
1.25      www       440:       print $fh "<h3>lond at pid $londpid responding, sending USR1</h3>";
                    441:       kill USR1 => $londpid;
1.7       harris41  442:       $restartflag=0;
1.1       albertel  443:    } else {
1.8       harris41  444:       $errors++;
1.1       albertel  445:       print $fh "<h3>lond at pid $londpid not responding</h3>";
1.23      www       446:       $restartflag=1;
1.8       harris41  447:       print $fh 
1.23      www       448: 	  "<h3>Decided to clean up stale .pid file and restart lond</h3>";
1.1       albertel  449:    }
1.7       harris41  450: } 
                    451: if ($restartflag==1) {
1.1       albertel  452:    $errors++;
1.23      www       453: 	  print $fh '<br><font color="red">Killall lond: '.
                    454:                     system('killall lond').' - ';
1.30      albertel  455:           sleep 2;
1.23      www       456:           print $fh unlink($londfile).' - '.system('killall -9 lond').
                    457:                     '</font><br>';
1.1       albertel  458:    print $fh "<h3>lond not running, trying to start</h3>";
1.16      harris41  459:    system(
                    460:      "$perlvar{'lonDaemons'}/lond 2>>$perlvar{'lonDaemons'}/logs/lond_errors");
1.30      albertel  461:    sleep 2;
1.1       albertel  462:    if (-e $londfile) {
                    463:        print $fh "Seems like it started ...<p>";
                    464:        my $lfh=IO::File->new("$londfile");
                    465:        my $londpid=<$lfh>;
                    466:        chomp($londpid);
1.30      albertel  467:        sleep 2;
1.1       albertel  468:        if (kill 0 => $londpid) {
                    469:           print $fh "<h3>lond at pid $londpid responding</h3>";
                    470:        } else {
                    471:           $errors++; $errors++;
                    472:           print $fh "<h3>lond at pid $londpid not responding</h3>";
                    473:           print $fh "Give it one more try ...<p>";
1.16      harris41  474: 	  system(
                    475:  "$perlvar{'lonDaemons'}/lond 2>>$perlvar{'lonDaemons'}/logs/lond_errors");
1.30      albertel  476:           sleep 2;
1.1       albertel  477:        }
                    478:    } else {
                    479:        print $fh "Seems like that did not work!<p>";
                    480:        $errors++;
                    481:    }
1.3       www       482:    if (-e "$perlvar{'lonDaemons'}/logs/lond.log"){
                    483:     print $fh "<p><pre>";
                    484:     open (DFH,"tail -n100 $perlvar{'lonDaemons'}/logs/lond.log|");
                    485:     while ($line=<DFH>) { 
                    486:       print $fh "$line";
1.4       www       487:       if ($line=~/WARNING/) { $notices++; }
                    488:       if ($line=~/CRITICAL/) { $notices++; }
1.3       www       489:     };
                    490:     close (DFH);
                    491:     print $fh "</pre>";
                    492:    }
1.1       albertel  493: }
                    494: 
                    495: $fname="$perlvar{'lonDaemons'}/logs/lond.log";
                    496: 
                    497:                           my ($dev,$ino,$mode,$nlink,
                    498:                               $uid,$gid,$rdev,$size,
                    499:                               $atime,$mtime,$ctime,
                    500:                               $blksize,$blocks)=stat($fname);
                    501: 
                    502: if ($size>40000) {
                    503:     print $fh "Rotating logs ...<p>";
                    504:     rename("$fname.2","$fname.3");
                    505:     rename("$fname.1","$fname.2");
                    506:     rename("$fname","$fname.1");
                    507: }
                    508: 
                    509: &errout($fh);
                    510: # ------------------------------------------------------------------------ lonc
                    511: 
                    512: print $fh '<hr><a name="lonc"><h2>lonc</h2><h3>Log</h3><pre>';
1.23      www       513: print "lonc\n";
1.1       albertel  514: 
                    515: if (-e "$perlvar{'lonDaemons'}/logs/lonc.log"){
1.23      www       516: open (DFH,"tail -n25 $perlvar{'lonDaemons'}/logs/lonc.log|");
1.1       albertel  517: while ($line=<DFH>) { 
                    518:    print $fh "$line";
1.3       www       519:    if ($line=~/INFO/) { $notices++; }
1.4       www       520:    if ($line=~/WARNING/) { $notices++; }
                    521:    if ($line=~/CRITICAL/) { $warnings++; }
1.1       albertel  522: };
                    523: close (DFH);
                    524: }
                    525: print $fh "</pre>";
                    526: 
                    527: my $loncfile="$perlvar{'lonDaemons'}/logs/lonc.pid";
                    528: 
1.7       harris41  529: $restartflag=1;
1.1       albertel  530: if (-e $loncfile) {
                    531:    my $lfh=IO::File->new("$loncfile");
                    532:    my $loncpid=<$lfh>;
                    533:    chomp($loncpid);
                    534:    if (kill 0 => $loncpid) {
                    535:       print $fh "<h3>lonc at pid $loncpid responding, sending USR1</h3>";
                    536:       kill USR1 => $loncpid;
1.7       harris41  537:       $restartflag=0;
1.1       albertel  538:    } else {
1.8       harris41  539:       $errors++;
1.1       albertel  540:       print $fh "<h3>lonc at pid $loncpid not responding</h3>";
1.10      harris41  541:       # Solution: kill parent and children processes, remove .pid and restart
1.8       harris41  542: 	  $restartflag=1;
                    543:       print $fh 
1.23      www       544: 	  "<h3>Decided to clean up stale .pid file and restart lonc</h3>";
1.1       albertel  545:    }
1.7       harris41  546: } 
                    547: if ($restartflag==1) {
1.1       albertel  548:    $errors++;
1.23      www       549: 	  print $fh '<br><font color="red">Killall lonc: '.
                    550: 	            system('killall lonc').' - ';
1.30      albertel  551:           sleep 2;
1.23      www       552:           print $fh unlink($loncfile).' - '.system('killall -9 lonc').
                    553:                     '</font><br>';
1.1       albertel  554:    print $fh "<h3>lonc not running, trying to start</h3>";
1.16      harris41  555: 	system(
1.17      harris41  556:  "$perlvar{'lonDaemons'}/lonc 2>>$perlvar{'lonDaemons'}/logs/lonc_errors");
1.30      albertel  557:    sleep 2;
1.1       albertel  558:    if (-e $loncfile) {
                    559:        print $fh "Seems like it started ...<p>";
                    560:        my $lfh=IO::File->new("$loncfile");
                    561:        my $loncpid=<$lfh>;
                    562:        chomp($loncpid);
1.30      albertel  563:        sleep 2;
1.1       albertel  564:        if (kill 0 => $loncpid) {
                    565:           print $fh "<h3>lonc at pid $loncpid responding</h3>";
                    566:        } else {
                    567:           $errors++; $errors++;
                    568:           print $fh "<h3>lonc at pid $loncpid not responding</h3>";
                    569:           print $fh "Give it one more try ...<p>";
1.16      harris41  570:  	  system(
1.17      harris41  571:  "$perlvar{'lonDaemons'}/lonc 2>>$perlvar{'lonDaemons'}/logs/lonc_errors");
1.30      albertel  572:           sleep 2;
1.1       albertel  573:        }
                    574:    } else {
                    575:        print $fh "Seems like that did not work!<p>";
                    576:        $errors++;
                    577:    }
1.3       www       578:    if (-e "$perlvar{'lonDaemons'}/logs/lonc.log") {
                    579:     print $fh "<p><pre>";
                    580:     open (DFH,"tail -n100 $perlvar{'lonDaemons'}/logs/lonc.log|");
                    581:     while ($line=<DFH>) { 
                    582:       print $fh "$line";
1.4       www       583:       if ($line=~/WARNING/) { $notices++; }
                    584:       if ($line=~/CRITICAL/) { $notices++; }
1.3       www       585:     };
                    586:     close (DFH);
                    587:     print $fh "</pre>";
                    588:    }
1.1       albertel  589: }
                    590: 
                    591: $fname="$perlvar{'lonDaemons'}/logs/lonc.log";
1.34      www       592: 
                    593:                           my ($dev,$ino,$mode,$nlink,
                    594:                               $uid,$gid,$rdev,$size,
                    595:                               $atime,$mtime,$ctime,
                    596:                               $blksize,$blocks)=stat($fname);
                    597: 
                    598: if ($size>40000) {
                    599:     print $fh "Rotating logs ...<p>";
                    600:     rename("$fname.2","$fname.3");
                    601:     rename("$fname.1","$fname.2");
                    602:     rename("$fname","$fname.1");
                    603: }
                    604: 
                    605:    
                    606: &errout($fh);
                    607: # -------------------------------------------------------------------- lonhttpd
                    608: 
                    609: print $fh '<hr><a name="lonhttpd"><h2>lonhttpd</h2><h3>Log</h3><pre>';
                    610: print "lonhttpd\n";
                    611: 
                    612: if (-e "$perlvar{'lonDaemons'}/logs/lonhttpd.log"){
                    613: open (DFH,"tail -n25 $perlvar{'lonDaemons'}/logs/lonhttpd.log|");
                    614: while ($line=<DFH>) { 
                    615:    print $fh "$line";
                    616:    if ($line=~/INFO/) { $notices++; }
                    617:    if ($line=~/WARNING/) { $notices++; }
                    618:    if ($line=~/CRITICAL/) { $warnings++; }
                    619: };
                    620: close (DFH);
                    621: }
                    622: print $fh "</pre>";
                    623: 
                    624: my $lonhttpdfile="$perlvar{'lonDaemons'}/logs/lonhttpd.pid";
                    625: 
                    626: $restartflag=1;
                    627: if (-e $lonhttpdfile) {
                    628:    my $lfh=IO::File->new("$lonhttpdfile");
                    629:    my $lonhttpdpid=<$lfh>;
                    630:    chomp($lonhttpdpid);
                    631:    if (kill 0 => $lonhttpdpid) {
1.35      albertel  632:       print $fh "<h3>lonhttpd at pid $lonhttpdpid responding</h3>";
1.34      www       633:       $restartflag=0;
                    634:    } else {
                    635:       $errors++;
                    636:       print $fh "<h3>lonhttpd at pid $lonhttpdpid not responding</h3>";
                    637:       # Solution: kill parent and children processes, remove .pid and restart
                    638: 	  $restartflag=1;
                    639:       print $fh 
                    640: 	  "<h3>Decided to clean up stale .pid file and restart lonhttpd</h3>";
                    641:    }
                    642: } 
                    643: if ($restartflag==1) {
                    644:    $errors++;
                    645: 	  print $fh '<br><font color="red">Killall lonhttpd: '.
                    646: 	            system('killall lonhttpd').' - ';
                    647:           sleep 2;
                    648:           print $fh unlink($lonhttpdfile).' - '.system('killall -9 lonhttpd').
                    649:                     '</font><br>';
                    650:    print $fh "<h3>lonhttpd not running, trying to start</h3>";
                    651: 	system(
                    652:  "$perlvar{'lonDaemons'}/lonhttpd 2>>$perlvar{'lonDaemons'}/logs/lonhttpd_errors");
                    653:    sleep 2;
                    654:    if (-e $lonhttpdfile) {
                    655:        print $fh "Seems like it started ...<p>";
                    656:        my $lfh=IO::File->new("$lonhttpdfile");
                    657:        my $lonhttpdpid=<$lfh>;
                    658:        chomp($lonhttpdpid);
                    659:        sleep 2;
                    660:        if (kill 0 => $lonhttpdpid) {
                    661:           print $fh "<h3>lonhttpd at pid $lonhttpdpid responding</h3>";
                    662:        } else {
                    663:           $errors++; $errors++;
                    664:           print $fh "<h3>lonhttpd at pid $lonhttpdpid not responding</h3>";
                    665:           print $fh "Give it one more try ...<p>";
                    666:  	  system(
                    667:  "$perlvar{'lonDaemons'}/lonhttpd 2>>$perlvar{'lonDaemons'}/logs/lonhttpd_errors");
                    668:           sleep 2;
                    669:        }
                    670:    } else {
                    671:        print $fh "Seems like that did not work!<p>";
                    672:        $errors++;
                    673:    }
                    674:    if (-e "$perlvar{'lonDaemons'}/logs/lonhttpd.log") {
                    675:     print $fh "<p><pre>";
                    676:     open (DFH,"tail -n100 $perlvar{'lonDaemons'}/logs/lonhttpd.log|");
                    677:     while ($line=<DFH>) { 
                    678:       print $fh "$line";
                    679:       if ($line=~/WARNING/) { $notices++; }
                    680:       if ($line=~/CRITICAL/) { $notices++; }
                    681:     };
                    682:     close (DFH);
                    683:     print $fh "</pre>";
                    684:    }
                    685: }
                    686: 
                    687: $fname="$perlvar{'lonDaemons'}/logs/lonhttpd.log";
1.1       albertel  688: 
                    689:                           my ($dev,$ino,$mode,$nlink,
                    690:                               $uid,$gid,$rdev,$size,
                    691:                               $atime,$mtime,$ctime,
                    692:                               $blksize,$blocks)=stat($fname);
                    693: 
                    694: if ($size>40000) {
                    695:     print $fh "Rotating logs ...<p>";
                    696:     rename("$fname.2","$fname.3");
                    697:     rename("$fname.1","$fname.2");
                    698:     rename("$fname","$fname.1");
                    699: }
                    700: 
                    701:    
                    702: &errout($fh);
                    703: # ---------------------------------------------------------------------- lonnet
                    704: 
                    705: print $fh '<hr><a name="lonnet"><h2>lonnet</h2><h3>Temp Log</h3><pre>';
1.23      www       706: print "lonnet\n";
1.1       albertel  707: if (-e "$perlvar{'lonDaemons'}/logs/lonnet.log"){
                    708: open (DFH,"tail -n50 $perlvar{'lonDaemons'}/logs/lonnet.log|");
                    709: while ($line=<DFH>) { 
                    710:     print $fh "$line";
                    711: };
                    712: close (DFH);
                    713: }
1.11      www       714: print $fh "</pre><h3>Perm Log</h3><pre>";
1.1       albertel  715: 
                    716: if (-e "$perlvar{'lonDaemons'}/logs/lonnet.perm.log") {
                    717:     open(DFH,"tail -n10 $perlvar{'lonDaemons'}/logs/lonnet.perm.log|");
                    718: while ($line=<DFH>) { 
                    719:    print $fh "$line";
                    720: };
                    721: close (DFH);
                    722: } else { print $fh "No perm log\n" }
                    723: 
                    724: $fname="$perlvar{'lonDaemons'}/logs/lonnet.log";
                    725: 
                    726:                           my ($dev,$ino,$mode,$nlink,
                    727:                               $uid,$gid,$rdev,$size,
                    728:                               $atime,$mtime,$ctime,
                    729:                               $blksize,$blocks)=stat($fname);
                    730: 
                    731: if ($size>40000) {
                    732:     print $fh "Rotating logs ...<p>";
                    733:     rename("$fname.2","$fname.3");
                    734:     rename("$fname.1","$fname.2");
                    735:     rename("$fname","$fname.1");
                    736: }
                    737: 
                    738: print $fh "</pre>";
                    739: &errout($fh);
                    740: # ----------------------------------------------------------------- Connections
                    741: 
                    742: print $fh '<hr><a name="connections"><h2>Connections</h2>';
                    743: 
                    744: print $fh "<table border=2>";
1.31      albertel  745: foreach $tryserver (sort(keys(%hostname))) {
1.1       albertel  746: 
                    747:     $answer=reply("pong",$tryserver);
                    748:     if ($answer eq "$tryserver:$perlvar{'lonHostID'}") {
                    749: 	$result="<b>ok</b>";
                    750:     } else {
                    751:         $result=$answer;
                    752:         $warnings++;
                    753:         if ($answer eq 'con_lost') { $warnings++; }
                    754:     }
                    755:     print $fh "<tr><td>$tryserver</td><td>$result</td></tr>\n";
                    756: 
                    757: }
                    758: print $fh "</table>";
                    759: 
                    760: &errout($fh);
                    761: # ------------------------------------------------------------ Delayed messages
                    762: 
                    763: print $fh '<hr><a name="delayed"><h2>Delayed Messages</h2>';
1.23      www       764: print "buffers\n";
1.1       albertel  765: 
                    766: print $fh '<h3>Scanning Permanent Log</h3>';
                    767: 
                    768: $unsend=0;
                    769: {
                    770:     my $dfh=IO::File->new("$perlvar{'lonDaemons'}/logs/lonnet.perm.log");
                    771:     while ($line=<$dfh>) {
                    772: 	($time,$sdf,$dserv,$dcmd)=split(/:/,$line);
                    773:         if ($sdf eq 'F') { 
                    774: 	    $local=localtime($time);
                    775:             print "<b>Failed: $time, $dserv, $dcmd</b><br>";
                    776:             $warnings++;
                    777:         }
                    778:         if ($sdf eq 'S') { $unsend--; }
                    779:         if ($sdf eq 'D') { $unsend++; }
                    780:     }
                    781: }
                    782: print $fh "Total unsend messages: <b>$unsend</b><p>\n";
                    783: $warnings=$warnings+5*$unsend;
                    784: 
                    785: print $fh "<h3>Outgoing Buffer</h3>";
                    786: 
                    787: open (DFH,"ls -lF $perlvar{'lonSockDir'}/delayed|");
                    788: while ($line=<DFH>) { 
                    789:     print $fh "$line<br>";
                    790: };
                    791: close (DFH);
                    792: 
                    793: # ------------------------------------------------------------------------- End
                    794: print $fh "<a name=errcount>\n";
                    795: $totalcount=$notices+4*$warnings+100*$errors;
                    796: &errout($fh);
                    797: print $fh "<h1>Total Error Count: $totalcount</h1>";
                    798: $now=time;
                    799: $date=localtime($now);
                    800: print $fh "<hr>$date ($now)</body></html>\n";
1.23      www       801: print "writing done\n";
1.1       albertel  802: }
                    803: 
                    804: rename ("$statusdir/newstatus.html","$statusdir/index.html");
                    805: 
                    806: if ($totalcount>200) {
1.23      www       807:    print "mailing\n";
1.37    ! www       808:    $emailto="$perlvar{'lonAdmEMail'}";
        !           809:    if ($totalcount>600) {
        !           810:       $emailto.=",$perlvar{'lonSysEMail'}";
        !           811:    }
1.1       albertel  812:    $subj="LON: $perlvar{'lonHostID'} E:$errors W:$warnings N:$notices"; 
                    813:    system(
1.24      www       814:  "metasend -b -t $emailto -s '$subj' -f $statusdir/index.html -m text/html");
1.1       albertel  815: }
                    816: 1;
                    817: 
                    818: 
                    819: 
                    820: 
                    821: 
                    822: 
                    823: 
                    824: 

FreeBSD-CVSweb <freebsd-cvsweb@FreeBSD.org>