Annotation of loncom/loncron, revision 1.35

1.1       albertel    1: #!/usr/bin/perl
                      2: 
                      3: # The LearningOnline Network
                      4: # Housekeeping program, started by cron
                      5: #
                      6: # (TCP networking package
                      7: # 6/1/99,6/2,6/10,6/11,6/12,6/14,6/26,6/28,6/29,6/30,
                      8: # 7/1,7/2,7/9,7/10,7/12 Gerd Kortemeyer)
                      9: #
1.3       www        10: # 7/14,7/15,7/19,7/21,7/22,11/18,
                     11: # 2/8 Gerd Kortemeyer
1.20      harris41   12: # 12/6/2000,12/8 Scott Harrison
1.11      www        13: # 12/23 Gerd Kortemeyer
1.22      harris41   14: # YEAR=2001
                     15: # 1/10/2001, 2/12/, 2/26, 3/15, 04/11, 04/21,8/27 Scott Harrison
1.25      www        16: # 09/04,09/06,11/26 Gerd Kortemeyer
1.26      harris41   17: # YEAR=2002
                     18: # 5/11/2002 Scott Harrison
1.24      www        19: 
                     20: $|=1;
1.1       albertel   21: 
1.26      harris41   22: use lib '/home/httpd/lib/perl/';
                     23: use LONCAPA::Configuration;
                     24: 
1.1       albertel   25: use IO::File;
                     26: use IO::Socket;
                     27: 
                     28: # -------------------------------------------------- Non-critical communication
                     29: sub reply {
                     30:     my ($cmd,$server)=@_;
                     31:     my $peerfile="$perlvar{'lonSockDir'}/$server";
                     32:     my $client=IO::Socket::UNIX->new(Peer    =>"$peerfile",
                     33:                                      Type    => SOCK_STREAM,
                     34:                                      Timeout => 10)
                     35:        or return "con_lost";
                     36:     print $client "$cmd\n";
                     37:     my $answer=<$client>;
                     38:     chomp($answer);
                     39:     if (!$answer) { $answer="con_lost"; }
                     40:     return $answer;
                     41: }
                     42: 
                     43: # --------------------------------------------------------- Output error status
                     44: 
                     45: sub errout {
                     46:    my $fh=shift;
                     47:    print $fh (<<ENDERROUT);
                     48:      <p><table border=2 bgcolor="#CCCCCC">
                     49:      <tr><td>Notices</td><td>$notices</td></tr>
                     50:      <tr><td>Warnings</td><td>$warnings</td></tr>
                     51:      <tr><td>Errors</td><td>$errors</td></tr>
                     52:      </table><p><a href="#top">Top</a><p>
                     53: ENDERROUT
                     54: }
                     55: 
                     56: # ================================================================ Main Program
                     57: 
1.27      matthew    58: # --------------------------------- Read loncapa_apache.conf and loncapa.conf
# read_conf() hands back a reference to the settings hash; it is copied into
# the global %perlvar that the rest of this script reads.
my $perlvarref=LONCAPA::Configuration::read_conf('loncapa.conf');
unless ($perlvarref && %{$perlvarref}) {
    # Going on with no settings would build every directory name used below
    # (status page, tmp and session-token cleanup) from empty strings.
    print("Could not read the LON-CAPA configuration (loncapa.conf).\n");
    exit 1;
}
%perlvar=%{$perlvarref};
undef $perlvarref;
# Remove since sensitive and not needed: the whole of %perlvar is printed
# into the status report.
delete @perlvar{'lonReceipt','lonSqlAccess'};
1.13      harris41   64: 
1.14      harris41   65: # --------------------------------------- Make sure that LON-CAPA is configured
                     66: # I only test for one thing here (lonHostID).  This is just a safeguard.
                     67: if ('{[[[[lonHostID]]]]}' eq $perlvar{'lonHostID'}) {
1.15      harris41   68:    print("Unconfigured machine.\n");
1.14      harris41   69:    $emailto=$perlvar{'lonSysEMail'};
                     70:    $hostname=`/bin/hostname`;
                     71:    chop $hostname;
                     72:    $hostname=~s/[^\w\.]//g; # make sure is safe to pass through shell
                     73:    $subj="LON: Unconfigured machine $hostname";
                     74:    system("echo 'Unconfigured machine $hostname.' |\
                     75:  mailto $emailto -s '$subj' > /dev/null");
                     76:     exit 1;
                     77: }
                     78: 
1.13      harris41   79: # ----------------------------- Make sure this process is running from user=www
                     80: my $wwwid=getpwnam('www');
                     81: if ($wwwid!=$<) {
1.14      harris41   82:    print("User ID mismatch.  This program must be run as user 'www'\n");
1.13      harris41   83:    $emailto="$perlvar{'lonAdmEMail'},$perlvar{'lonSysEMail'}";
                     84:    $subj="LON: $perlvar{'lonHostID'} User ID mismatch";
                     85:    system("echo 'User ID mismatch.  loncron must be run as user www.' |\
                     86:  mailto $emailto -s '$subj' > /dev/null");
1.14      harris41   87:    exit 1;
1.1       albertel   88: }
                     89: 
                     90: # ------------------------------------------------------------- Read hosts file
                     91: {
                     92:     my $config=IO::File->new("$perlvar{'lonTabDir'}/hosts.tab");
                     93: 
                     94:     while (my $configline=<$config>) {
1.31      albertel   95: 	my ($id,$domain,$role,$name,$ip,$domdescr)=split(/:/,$configline);
                     96: 	if ($id && $domain && $role && $name && $ip) {
                     97: 	    $hostname{$id}=$name;
                     98: 	    $hostdom{$id}=$domain;
                     99: 	    $hostip{$id}=$ip;
                    100: 	    $hostrole{$id}=$role;
                    101: 	    if ($domdescr) { $domaindescription{$domain}=$domdescr; }
                    102: 	    if (($role eq 'library') && ($id ne $perlvar{'lonHostID'})) {
                    103: 		$libserv{$id}=$name;
                    104: 	    }
                    105: 	} else {
                    106: 	    if ($configline) {
                    107: #		&logthis("Skipping hosts.tab line -$configline-");
                    108: 	    }
                    109: 	}
1.1       albertel  110:     }
                    111: }
                    112: 
                    113: # ------------------------------------------------------ Read spare server file
                    114: {
                    115:     my $config=IO::File->new("$perlvar{'lonTabDir'}/spare.tab");
                    116: 
                    117:     while (my $configline=<$config>) {
                    118:        chomp($configline);
                    119:        if (($configline) && ($configline ne $perlvar{'lonHostID'})) {
                    120:           $spareid{$configline}=1;
                    121:        }
                    122:     }
                    123: }
                    124: 
                    125: # ---------------------------------------------------------------- Start report
                    126: 
                    127: $statusdir="/home/httpd/html/lon-status";
                    128: 
                    129: $errors=0;
                    130: $warnings=0;
                    131: $notices=0;
                    132: 
                    133: $now=time;
                    134: $date=localtime($now);
                    135: 
                    136: {
                    137: my $fh=IO::File->new(">$statusdir/newstatus.html");
                    138: 
                    139: print $fh (<<ENDHEADERS);
                    140: <html>
                    141: <head>
                    142: <title>LON Status Report $perlvar{'lonHostID'}</title>
                    143: </head>
1.3       www       144: <body bgcolor="#AAAAAA">
1.1       albertel  145: <a name="top">
                    146: <h1>LON Status Report $perlvar{'lonHostID'}</h1>
                    147: <h2>$date ($now)</h2>
                    148: <ol>
                    149: <li><a href="#configuration">Configuration</a>
                    150: <li><a href="#machine">Machine Information</a>
1.11      www       151: <li><a href="#tmp">Temporary Files</a>
                    152: <li><a href="#tokens">Session Tokens</a>
1.1       albertel  153: <li><a href="#httpd">httpd</a>
1.11      www       154: <li><a href="#lonsql">lonsql</a>
1.1       albertel  155: <li><a href="#lond">lond</a>
                    156: <li><a href="#lonc">lonc</a>
1.34      www       157: <li><a href="#lonhttpd">lonhttpd</a>
1.1       albertel  158: <li><a href="#lonnet">lonnet</a>
                    159: <li><a href="#connections">Connections</a>
                    160: <li><a href="#delayed">Delayed Messages</a>
                    161: <li><a href="#errcount">Error Count</a>
                    162: </ol>
                    163: <hr>
                    164: <a name="configuration">
                    165: <h2>Configuration</h2>
                    166: <h3>PerlVars</h3>
                    167: <table border=2>
                    168: ENDHEADERS
                    169: 
# One table row per configuration setting, sorted by name.
for my $varname (sort(keys(%perlvar))) {
    print $fh '<tr><td>'.$varname.'</td><td>'.$perlvar{$varname}."</td></tr>\n";
}

# Known hosts: id, domain, role, name and IP address.
print $fh "</table><h3>Hosts</h3><table border=2>";
for my $id (sort(keys(%hostname))) {
    print $fh '<tr><td>'.$id.'</td><td>'.$hostdom{$id}.'</td><td>'.
              $hostrole{$id}.'</td>';
    print $fh '<td>'.$hostname{$id}.'</td><td>'.$hostip{$id}."</td></tr>\n";
}

# Spare hosts as a numbered list.
print $fh "</table><h3>Spare Hosts</h3><ol>";
for my $id (sort(keys(%spareid))) {
    print $fh '<li>'.$id."\n";
}

print $fh "</ol>\n";
                    185: 
                    186: # --------------------------------------------------------------------- Machine
                    187: 
                    188: print $fh '<hr><a name="machine"><h2>Machine Information</h2>';
                    189: print $fh "<h3>loadavg</h3>";
                    190: 
                    191: open (LOADAVGH,"/proc/loadavg");
                    192: $loadavg=<LOADAVGH>;
                    193: close (LOADAVGH);
                    194: 
                    195: print $fh "<tt>$loadavg</tt>";
                    196: 
                    197: @parts=split(/\s+/,$loadavg);
1.4       www       198: if ($parts[1]>4.0) {
1.1       albertel  199:     $errors++;
                    200: } elsif ($parts[1]>2.0) {
                    201:     $warnings++;
                    202: } elsif ($parts[1]>1.0) {
                    203:     $notices++;
                    204: }
                    205: 
                    206: print $fh "<h3>df</h3>";
                    207: print $fh "<pre>";
                    208: 
                    209: open (DFH,"df|");
                    210: while ($line=<DFH>) { 
                    211:    print $fh "$line"; 
                    212:    @parts=split(/\s+/,$line);
                    213:    $usage=$parts[4];
                    214:    $usage=~s/\W//g;
                    215:    if ($usage>90) { 
1.24      www       216:       $warnings++;
                    217:       $notices++; 
1.1       albertel  218:    } elsif ($usage>80) {
                    219:       $warnings++;
                    220:    } elsif ($usage>60) {
                    221:       $notices++;
                    222:    }
1.4       www       223:    if ($usage>95) { $warnings++; $warnings++ }
1.1       albertel  224: }
                    225: close (DFH);
                    226: print $fh "</pre>";
1.24      www       227: 
                    228: 
                    229: print $fh "<h3>ps</h3>";
                    230: print $fh "<pre>";
                    231: $psproc=0;
                    232: 
                    233: open (PSH,"ps -aux|");
                    234: while ($line=<PSH>) { 
                    235:    print $fh "$line"; 
                    236:    $psproc++;
                    237: }
                    238: close (PSH);
                    239: print $fh "</pre>";
                    240: 
                    241: if ($psproc>200) { $notices++; }
                    242: if ($psproc>250) { $notices++; }
                    243: 
1.1       albertel  244: &errout($fh);
1.11      www       245: 
                    246: # --------------------------------------------------------------- clean out tmp
                    247: print $fh '<hr><a name="tmp"><h2>Temporary Files</h2>';
                    248: $cleaned=0;
1.29      www       249: $old=0;
1.11      www       250: while ($fname=<$perlvar{'lonDaemons'}/tmp/*>) {
                    251:                           my ($dev,$ino,$mode,$nlink,
                    252:                               $uid,$gid,$rdev,$size,
                    253:                               $atime,$mtime,$ctime,
                    254:                               $blksize,$blocks)=stat($fname);
                    255:                           $now=time;
                    256:                           $since=$now-$mtime;
                    257:                           if ($since>$perlvar{'lonExpire'}) {
1.29      www       258:                               $line='';
                    259:                               if (open(PROBE,$fname)) {
                    260: 				  $line=<PROBE>;
                    261:                                   close(PROBE);
                    262: 			      }
                    263: 			      unless ($line=~/^CHECKOUTTOKEN\&/) {
                    264:                                  $cleaned++;
                    265:                                  unlink("$fname");
                    266: 			      } else {
1.32      www       267: 				  if ($since>365*$perlvar{'lonExpire'}) {
1.29      www       268:                                      $cleaned++;
                    269:                                      unlink("$fname");
                    270: 				 } else { $old++; }
                    271:                               }
1.11      www       272:                           }
                    273:     
                    274: }
1.29      www       275: print $fh "Cleaned up ".$cleaned." files (".$old." old checkout tokens).";
1.11      www       276: 
                    277: # ------------------------------------------------------------ clean out lonIDs
                    278: print $fh '<hr><a name="tokens"><h2>Session Tokens</h2>';
                    279: $cleaned=0;
                    280: $active=0;
                    281: while ($fname=<$perlvar{'lonIDsDir'}/*>) {
                    282:                           my ($dev,$ino,$mode,$nlink,
                    283:                               $uid,$gid,$rdev,$size,
                    284:                               $atime,$mtime,$ctime,
                    285:                               $blksize,$blocks)=stat($fname);
                    286:                           $now=time;
                    287:                           $since=$now-$mtime;
                    288:                           if ($since>$perlvar{'lonExpire'}) {
                    289:                               $cleaned++;
                    290:                               print $fh "Unlinking $fname<br>";
                    291:                               unlink("$fname");
                    292:                           } else {
                    293:                               $active++;
                    294:                           }
                    295:     
                    296: }
                    297: print $fh "<p>Cleaned up ".$cleaned." stale session token(s).";
                    298: print $fh "<h3>$active open session(s)</h3>";
                    299: 
1.1       albertel  300: # ----------------------------------------------------------------------- httpd
                    301: 
                    302: print $fh '<hr><a name="httpd"><h2>httpd</h2><h3>Access Log</h3><pre>';
                    303: 
1.23      www       304: open (DFH,"tail -n25 /etc/httpd/logs/access_log|");
1.1       albertel  305: while ($line=<DFH>) { print $fh "$line" };
                    306: close (DFH);
                    307: 
                    308: print $fh "</pre><h3>Error Log</h3><pre>";
                    309: 
1.23      www       310: open (DFH,"tail -n25 /etc/httpd/logs/error_log|");
1.1       albertel  311: while ($line=<DFH>) { 
                    312:    print $fh "$line";
                    313:    if ($line=~/\[error\]/) { $notices++; } 
                    314: };
                    315: close (DFH);
                    316: print $fh "</pre>";
                    317: &errout($fh);
1.5       harris41  318: 
                    319: 
1.11      www       320: # ---------------------------------------------------------------------- lonsql
1.22      harris41  321: 
                    322: my $restartflag=1;
1.18      harris41  323: if ($perlvar{'lonRole'} eq "library") {
1.5       harris41  324: 
1.11      www       325:     print $fh '<hr><a name="lonsql"><h2>lonsql</h2><h3>Log</h3><pre>';
1.23      www       326:     print "lonsql\n";
1.5       harris41  327:     if (-e "$perlvar{'lonDaemons'}/logs/lonsql.log"){
                    328: 	open (DFH,"tail -n100 $perlvar{'lonDaemons'}/logs/lonsql.log|");
                    329: 	while ($line=<DFH>) { 
                    330: 	    print $fh "$line";
                    331: 	    if ($line=~/INFO/) { $notices++; }
                    332: 	    if ($line=~/WARNING/) { $notices++; }
                    333: 	    if ($line=~/CRITICAL/) { $warnings++; }
                    334: 	};
                    335: 	close (DFH);
                    336:     }
                    337:     print $fh "</pre>";
                    338:     
                    339:     my $lonsqlfile="$perlvar{'lonDaemons'}/logs/lonsql.pid";
1.23      www       340:  
                    341:     $restartflag=1;
                    342:    
1.5       harris41  343:     if (-e $lonsqlfile) {
                    344: 	my $lfh=IO::File->new("$lonsqlfile");
                    345: 	my $lonsqlpid=<$lfh>;
                    346: 	chomp($lonsqlpid);
                    347: 	if (kill 0 => $lonsqlpid) {
                    348: 	    print $fh "<h3>lonsql at pid $lonsqlpid responding</h3>";
1.22      harris41  349: 	    $restartflag=0;
1.5       harris41  350: 	} else {
                    351: 	    $errors++; $errors++;
                    352: 	    print $fh "<h3>lonsql at pid $lonsqlpid not responding</h3>";
1.22      harris41  353: 		$restartflag=1;
1.23      www       354: 	print $fh 
                    355: 	    "<h3>Decided to clean up stale .pid file and restart lonsql</h3>";
1.5       harris41  356: 	}
1.22      harris41  357:     }
                    358:     if ($restartflag==1) {
1.5       harris41  359: 	$errors++;
1.23      www       360: 	         print $fh '<br><font color="red">Killall lonsql: '.
                    361:                     system('killall lonsql').' - ';
1.30      albertel  362:                     sleep 2;
1.23      www       363:                     print $fh unlink($lonsqlfile).' - '.
                    364:                               system('killall -9 lonsql').
                    365:                     '</font><br>';
1.5       harris41  366: 	print $fh "<h3>lonsql not running, trying to start</h3>";
1.16      harris41  367: 	system(
                    368:  "$perlvar{'lonDaemons'}/lonsql 2>>$perlvar{'lonDaemons'}/logs/lonsql_errors");
1.30      albertel  369: 	sleep 2;
1.5       harris41  370: 	if (-e $lonsqlfile) {
                    371: 	    print $fh "Seems like it started ...<p>";
                    372: 	    my $lfh=IO::File->new("$lonsqlfile");
                    373: 	    my $lonsqlpid=<$lfh>;
                    374: 	    chomp($lonsqlpid);
1.30      albertel  375: 	    sleep 2;
1.5       harris41  376: 	    if (kill 0 => $lonsqlpid) {
                    377: 		print $fh "<h3>lonsql at pid $lonsqlpid responding</h3>";
                    378: 	    } else {
                    379: 		$errors++; $errors++;
                    380: 		print $fh "<h3>lonsql at pid $lonsqlpid not responding</h3>";
                    381: 		print $fh "Give it one more try ...<p>";
1.16      harris41  382: 		system(
                    383:  "$perlvar{'lonDaemons'}/lonsql 2>>$perlvar{'lonDaemons'}/logs/lonsql_errors");
1.30      albertel  384: 		sleep 2;
1.5       harris41  385: 	    }
                    386: 	} else {
                    387: 	    print $fh "Seems like that did not work!<p>";
                    388: 	    $errors++;
                    389: 	}
                    390: 	if (-e "$perlvar{'lonDaemons'}/logs/lonsql.log"){
                    391: 	    print $fh "<p><pre>";
                    392: 	    open (DFH,"tail -n100 $perlvar{'lonDaemons'}/logs/lonsql.log|");
                    393: 	    while ($line=<DFH>) { 
                    394: 		print $fh "$line";
                    395: 		if ($line=~/WARNING/) { $notices++; }
                    396: 		if ($line=~/CRITICAL/) { $notices++; }
                    397: 	    };
                    398: 	    close (DFH);
                    399: 	    print $fh "</pre>";
                    400: 	}
                    401:     }
                    402: 
                    403:     $fname="$perlvar{'lonDaemons'}/logs/lonsql.log";
                    404: 
                    405:     my ($dev,$ino,$mode,$nlink,
                    406: 	$uid,$gid,$rdev,$size,
                    407: 	$atime,$mtime,$ctime,
                    408: 	$blksize,$blocks)=stat($fname);
                    409: 
                    410:     if ($size>40000) {
                    411: 	print $fh "Rotating logs ...<p>";
                    412: 	rename("$fname.2","$fname.3");
                    413: 	rename("$fname.1","$fname.2");
                    414: 	rename("$fname","$fname.1");
                    415:     }
                    416: 
                    417:     &errout($fh);
                    418: }
1.1       albertel  419: # ------------------------------------------------------------------------ lond
                    420: 
                    421: print $fh '<hr><a name="lond"><h2>lond</h2><h3>Log</h3><pre>';
1.23      www       422: print "lond\n";
1.1       albertel  423: 
                    424: if (-e "$perlvar{'lonDaemons'}/logs/lond.log"){
1.23      www       425: open (DFH,"tail -n25 $perlvar{'lonDaemons'}/logs/lond.log|");
1.1       albertel  426: while ($line=<DFH>) { 
                    427:    print $fh "$line";
1.3       www       428:    if ($line=~/INFO/) { $notices++; }
1.4       www       429:    if ($line=~/WARNING/) { $notices++; }
                    430:    if ($line=~/CRITICAL/) { $warnings++; }
1.1       albertel  431: };
                    432: close (DFH);
                    433: }
                    434: print $fh "</pre>";
                    435: 
                    436: my $londfile="$perlvar{'lonDaemons'}/logs/lond.pid";
                    437: 
1.22      harris41  438: $restartflag=1;
1.7       harris41  439: if (-e $londfile) {    
1.1       albertel  440:    my $lfh=IO::File->new("$londfile");
                    441:    my $londpid=<$lfh>;
                    442:    chomp($londpid);
                    443:    if (kill 0 => $londpid) {
1.25      www       444:       print $fh "<h3>lond at pid $londpid responding, sending USR1</h3>";
                    445:       kill USR1 => $londpid;
1.7       harris41  446:       $restartflag=0;
1.1       albertel  447:    } else {
1.8       harris41  448:       $errors++;
1.1       albertel  449:       print $fh "<h3>lond at pid $londpid not responding</h3>";
1.23      www       450:       $restartflag=1;
1.8       harris41  451:       print $fh 
1.23      www       452: 	  "<h3>Decided to clean up stale .pid file and restart lond</h3>";
1.1       albertel  453:    }
1.7       harris41  454: } 
                    455: if ($restartflag==1) {
1.1       albertel  456:    $errors++;
1.23      www       457: 	  print $fh '<br><font color="red">Killall lond: '.
                    458:                     system('killall lond').' - ';
1.30      albertel  459:           sleep 2;
1.23      www       460:           print $fh unlink($londfile).' - '.system('killall -9 lond').
                    461:                     '</font><br>';
1.1       albertel  462:    print $fh "<h3>lond not running, trying to start</h3>";
1.16      harris41  463:    system(
                    464:      "$perlvar{'lonDaemons'}/lond 2>>$perlvar{'lonDaemons'}/logs/lond_errors");
1.30      albertel  465:    sleep 2;
1.1       albertel  466:    if (-e $londfile) {
                    467:        print $fh "Seems like it started ...<p>";
                    468:        my $lfh=IO::File->new("$londfile");
                    469:        my $londpid=<$lfh>;
                    470:        chomp($londpid);
1.30      albertel  471:        sleep 2;
1.1       albertel  472:        if (kill 0 => $londpid) {
                    473:           print $fh "<h3>lond at pid $londpid responding</h3>";
                    474:        } else {
                    475:           $errors++; $errors++;
                    476:           print $fh "<h3>lond at pid $londpid not responding</h3>";
                    477:           print $fh "Give it one more try ...<p>";
1.16      harris41  478: 	  system(
                    479:  "$perlvar{'lonDaemons'}/lond 2>>$perlvar{'lonDaemons'}/logs/lond_errors");
1.30      albertel  480:           sleep 2;
1.1       albertel  481:        }
                    482:    } else {
                    483:        print $fh "Seems like that did not work!<p>";
                    484:        $errors++;
                    485:    }
1.3       www       486:    if (-e "$perlvar{'lonDaemons'}/logs/lond.log"){
                    487:     print $fh "<p><pre>";
                    488:     open (DFH,"tail -n100 $perlvar{'lonDaemons'}/logs/lond.log|");
                    489:     while ($line=<DFH>) { 
                    490:       print $fh "$line";
1.4       www       491:       if ($line=~/WARNING/) { $notices++; }
                    492:       if ($line=~/CRITICAL/) { $notices++; }
1.3       www       493:     };
                    494:     close (DFH);
                    495:     print $fh "</pre>";
                    496:    }
1.1       albertel  497: }
                    498: 
                    499: $fname="$perlvar{'lonDaemons'}/logs/lond.log";
                    500: 
                    501:                           my ($dev,$ino,$mode,$nlink,
                    502:                               $uid,$gid,$rdev,$size,
                    503:                               $atime,$mtime,$ctime,
                    504:                               $blksize,$blocks)=stat($fname);
                    505: 
                    506: if ($size>40000) {
                    507:     print $fh "Rotating logs ...<p>";
                    508:     rename("$fname.2","$fname.3");
                    509:     rename("$fname.1","$fname.2");
                    510:     rename("$fname","$fname.1");
                    511: }
                    512: 
                    513: &errout($fh);
                    514: # ------------------------------------------------------------------------ lonc
                    515: 
                    516: print $fh '<hr><a name="lonc"><h2>lonc</h2><h3>Log</h3><pre>';
1.23      www       517: print "lonc\n";
1.1       albertel  518: 
                    519: if (-e "$perlvar{'lonDaemons'}/logs/lonc.log"){
1.23      www       520: open (DFH,"tail -n25 $perlvar{'lonDaemons'}/logs/lonc.log|");
1.1       albertel  521: while ($line=<DFH>) { 
                    522:    print $fh "$line";
1.3       www       523:    if ($line=~/INFO/) { $notices++; }
1.4       www       524:    if ($line=~/WARNING/) { $notices++; }
                    525:    if ($line=~/CRITICAL/) { $warnings++; }
1.1       albertel  526: };
                    527: close (DFH);
                    528: }
                    529: print $fh "</pre>";
                    530: 
                    531: my $loncfile="$perlvar{'lonDaemons'}/logs/lonc.pid";
                    532: 
1.7       harris41  533: $restartflag=1;
1.1       albertel  534: if (-e $loncfile) {
                    535:    my $lfh=IO::File->new("$loncfile");
                    536:    my $loncpid=<$lfh>;
                    537:    chomp($loncpid);
                    538:    if (kill 0 => $loncpid) {
                    539:       print $fh "<h3>lonc at pid $loncpid responding, sending USR1</h3>";
                    540:       kill USR1 => $loncpid;
1.7       harris41  541:       $restartflag=0;
1.1       albertel  542:    } else {
1.8       harris41  543:       $errors++;
1.1       albertel  544:       print $fh "<h3>lonc at pid $loncpid not responding</h3>";
1.10      harris41  545:       # Solution: kill parent and children processes, remove .pid and restart
1.8       harris41  546: 	  $restartflag=1;
                    547:       print $fh 
1.23      www       548: 	  "<h3>Decided to clean up stale .pid file and restart lonc</h3>";
1.1       albertel  549:    }
1.7       harris41  550: } 
                    551: if ($restartflag==1) {
1.1       albertel  552:    $errors++;
1.23      www       553: 	  print $fh '<br><font color="red">Killall lonc: '.
                    554: 	            system('killall lonc').' - ';
1.30      albertel  555:           sleep 2;
1.23      www       556:           print $fh unlink($loncfile).' - '.system('killall -9 lonc').
                    557:                     '</font><br>';
1.1       albertel  558:    print $fh "<h3>lonc not running, trying to start</h3>";
1.16      harris41  559: 	system(
1.17      harris41  560:  "$perlvar{'lonDaemons'}/lonc 2>>$perlvar{'lonDaemons'}/logs/lonc_errors");
1.30      albertel  561:    sleep 2;
1.1       albertel  562:    if (-e $loncfile) {
                    563:        print $fh "Seems like it started ...<p>";
                    564:        my $lfh=IO::File->new("$loncfile");
                    565:        my $loncpid=<$lfh>;
                    566:        chomp($loncpid);
1.30      albertel  567:        sleep 2;
1.1       albertel  568:        if (kill 0 => $loncpid) {
                    569:           print $fh "<h3>lonc at pid $loncpid responding</h3>";
                    570:        } else {
                    571:           $errors++; $errors++;
                    572:           print $fh "<h3>lonc at pid $loncpid not responding</h3>";
                    573:           print $fh "Give it one more try ...<p>";
1.16      harris41  574:  	  system(
1.17      harris41  575:  "$perlvar{'lonDaemons'}/lonc 2>>$perlvar{'lonDaemons'}/logs/lonc_errors");
1.30      albertel  576:           sleep 2;
1.1       albertel  577:        }
                    578:    } else {
                    579:        print $fh "Seems like that did not work!<p>";
                    580:        $errors++;
                    581:    }
1.3       www       582:    if (-e "$perlvar{'lonDaemons'}/logs/lonc.log") {
                    583:     print $fh "<p><pre>";
                    584:     open (DFH,"tail -n100 $perlvar{'lonDaemons'}/logs/lonc.log|");
                    585:     while ($line=<DFH>) { 
                    586:       print $fh "$line";
1.4       www       587:       if ($line=~/WARNING/) { $notices++; }
                    588:       if ($line=~/CRITICAL/) { $notices++; }
1.3       www       589:     };
                    590:     close (DFH);
                    591:     print $fh "</pre>";
                    592:    }
1.1       albertel  593: }
                    594: 
                    595: $fname="$perlvar{'lonDaemons'}/logs/lonc.log";
1.34      www       596: 
                         # Rotate lonc.log once stat() reports a size above 40000 bytes.
                         # Only $size of the thirteen stat fields is read in this section.
                         # Up to three older generations are kept (.1, .2, .3); renaming .2
                         # onto .3 replaces whatever .3 existed before. The return values of
                         # rename() are not checked, so a failed rotation is silent.
                    597:                           my ($dev,$ino,$mode,$nlink,
                    598:                               $uid,$gid,$rdev,$size,
                    599:                               $atime,$mtime,$ctime,
                    600:                               $blksize,$blocks)=stat($fname);
                    601: 
                    602: if ($size>40000) {
                    603:     print $fh "Rotating logs ...<p>";
                    604:     rename("$fname.2","$fname.3");
                    605:     rename("$fname.1","$fname.2");
                    606:     rename("$fname","$fname.1");
                    607: }
                    608: 
                    609:    
                         # errout() is defined outside this section.
                         # NOTE(review): presumably writes the running counters to $fh - confirm.
                    610: &errout($fh);
                    611: # -------------------------------------------------------------------- lonhttpd
                         # Report section for the lonhttpd daemon, written to $fh:
                         #   1. copy the last 25 lines of lonhttpd.log into the report,
                         #   2. test the pid stored in lonhttpd.pid with signal 0,
                         #   3. if the daemon is not alive, kill leftovers and start it again,
                         #   4. rotate lonhttpd.log when it exceeds 40000 bytes.
                         # Counters $notices, $warnings and $errors are globals shared with
                         # the other sections of this script.
                    612: 
                    613: print $fh '<hr><a name="lonhttpd"><h2>lonhttpd</h2><h3>Log</h3><pre>';
                         # Progress marker on STDOUT (not part of the HTML report).
                    614: print "lonhttpd\n";
                    615: 
                         # Log tail: INFO and WARNING lines each add one notice, CRITICAL
                         # lines add one warning.
                    616: if (-e "$perlvar{'lonDaemons'}/logs/lonhttpd.log"){
                    617: open (DFH,"tail -n25 $perlvar{'lonDaemons'}/logs/lonhttpd.log|");
                    618: while ($line=<DFH>) { 
                    619:    print $fh "$line";
                    620:    if ($line=~/INFO/) { $notices++; }
                    621:    if ($line=~/WARNING/) { $notices++; }
                    622:    if ($line=~/CRITICAL/) { $warnings++; }
                    623: };
                    624: close (DFH);
                    625: }
                    626: print $fh "</pre>";
                    627: 
                    628: my $lonhttpdfile="$perlvar{'lonDaemons'}/logs/lonhttpd.pid";
                    629: 
                         # Default to restarting; the flag is cleared only when the pid file
                         # exists and the recorded process accepts signal 0 (kill 0 delivers
                         # no signal, it only tests whether the pid can be signalled).
                    630: $restartflag=1;
                    631: if (-e $lonhttpdfile) {
                    632:    my $lfh=IO::File->new("$lonhttpdfile");
                    633:    my $lonhttpdpid=<$lfh>;
                    634:    chomp($lonhttpdpid);
                    635:    if (kill 0 => $lonhttpdpid) {
1.35    ! albertel  636:       print $fh "<h3>lonhttpd at pid $lonhttpdpid responding</h3>";
1.34      www       637:       $restartflag=0;
                    638:    } else {
                         # Stale pid file: counted as one error here and one more in the
                         # restart branch below.
                    639:       $errors++;
                    640:       print $fh "<h3>lonhttpd at pid $lonhttpdpid not responding</h3>";
                    641:       # Solution: kill parent and children processes, remove .pid and restart
                    642: 	  $restartflag=1;
                    643:       print $fh 
                    644: 	  "<h3>Decided to clean up stale .pid file and restart lonhttpd</h3>";
                    645:    }
                    646: } 
                    647: if ($restartflag==1) {
                    648:    $errors++;
                         # The numeric return values of system() and unlink() are written
                         # into the report as-is, separated by ' - '. Order matters: polite
                         # killall, wait 2s, remove the pid file, then killall -9.
                    649: 	  print $fh '<br><font color="red">Killall lonhttpd: '.
                    650: 	            system('killall lonhttpd').' - ';
                    651:           sleep 2;
                    652:           print $fh unlink($lonhttpdfile).' - '.system('killall -9 lonhttpd').
                    653:                     '</font><br>';
                    654:    print $fh "<h3>lonhttpd not running, trying to start</h3>";
                         # Start the daemon; its stderr is appended to logs/lonhttpd_errors.
                    655: 	system(
                    656:  "$perlvar{'lonDaemons'}/lonhttpd 2>>$perlvar{'lonDaemons'}/logs/lonhttpd_errors");
                    657:    sleep 2;
                         # A reappearing pid file is taken as a sign that the start worked;
                         # the pid in it is then probed again with signal 0.
                    658:    if (-e $lonhttpdfile) {
                    659:        print $fh "Seems like it started ...<p>";
                    660:        my $lfh=IO::File->new("$lonhttpdfile");
                    661:        my $lonhttpdpid=<$lfh>;
                    662:        chomp($lonhttpdpid);
                    663:        sleep 2;
                    664:        if (kill 0 => $lonhttpdpid) {
                    665:           print $fh "<h3>lonhttpd at pid $lonhttpdpid responding</h3>";
                    666:        } else {
                         # Two more errors, then a single second start attempt whose
                         # outcome is not checked.
                    667:           $errors++; $errors++;
                    668:           print $fh "<h3>lonhttpd at pid $lonhttpdpid not responding</h3>";
                    669:           print $fh "Give it one more try ...<p>";
                    670:  	  system(
                    671:  "$perlvar{'lonDaemons'}/lonhttpd 2>>$perlvar{'lonDaemons'}/logs/lonhttpd_errors");
                    672:           sleep 2;
                    673:        }
                    674:    } else {
                    675:        print $fh "Seems like that did not work!<p>";
                    676:        $errors++;
                    677:    }
                         # After a restart, show the last 100 log lines. Here both WARNING
                         # and CRITICAL lines count as notices.
                         # NOTE(review): the 25-line tail above counts CRITICAL as a warning;
                         # confirm the difference is intended.
                    678:    if (-e "$perlvar{'lonDaemons'}/logs/lonhttpd.log") {
                    679:     print $fh "<p><pre>";
                    680:     open (DFH,"tail -n100 $perlvar{'lonDaemons'}/logs/lonhttpd.log|");
                    681:     while ($line=<DFH>) { 
                    682:       print $fh "$line";
                    683:       if ($line=~/WARNING/) { $notices++; }
                    684:       if ($line=~/CRITICAL/) { $notices++; }
                    685:     };
                    686:     close (DFH);
                    687:     print $fh "</pre>";
                    688:    }
                    689: }
                    690: 
                    691: $fname="$perlvar{'lonDaemons'}/logs/lonhttpd.log";
1.1       albertel  692: 
                         # Rotate lonhttpd.log above 40000 bytes, keeping generations .1-.3.
                         # Only $size of the stat fields is read in this section.
                    693:                           my ($dev,$ino,$mode,$nlink,
                    694:                               $uid,$gid,$rdev,$size,
                    695:                               $atime,$mtime,$ctime,
                    696:                               $blksize,$blocks)=stat($fname);
                    697: 
                    698: if ($size>40000) {
                    699:     print $fh "Rotating logs ...<p>";
                    700:     rename("$fname.2","$fname.3");
                    701:     rename("$fname.1","$fname.2");
                    702:     rename("$fname","$fname.1");
                    703: }
                    704: 
                    705:    
                    706: &errout($fh);
                    707: # ---------------------------------------------------------------------- lonnet
                         # Report section for the lonnet logs: shows the last 50 lines of
                         # lonnet.log ("Temp Log") and the last 10 lines of lonnet.perm.log
                         # ("Perm Log"), then rotates lonnet.log above 40000 bytes. No
                         # counters are changed while copying these log lines.
                    708: 
                    709: print $fh '<hr><a name="lonnet"><h2>lonnet</h2><h3>Temp Log</h3><pre>';
                         # Progress marker on STDOUT (not part of the HTML report).
1.23      www       710: print "lonnet\n";
1.1       albertel  711: if (-e "$perlvar{'lonDaemons'}/logs/lonnet.log"){
                    712: open (DFH,"tail -n50 $perlvar{'lonDaemons'}/logs/lonnet.log|");
                    713: while ($line=<DFH>) { 
                    714:     print $fh "$line";
                    715: };
                    716: close (DFH);
                    717: }
1.11      www       718: print $fh "</pre><h3>Perm Log</h3><pre>";
1.1       albertel  719: 
                         # A missing permanent log is reported in the page, not counted as
                         # a warning or error.
                    720: if (-e "$perlvar{'lonDaemons'}/logs/lonnet.perm.log") {
                    721:     open(DFH,"tail -n10 $perlvar{'lonDaemons'}/logs/lonnet.perm.log|");
                    722: while ($line=<DFH>) { 
                    723:    print $fh "$line";
                    724: };
                    725: close (DFH);
                    726: } else { print $fh "No perm log\n" }
                    727: 
                    728: $fname="$perlvar{'lonDaemons'}/logs/lonnet.log";
                    729: 
                         # Only lonnet.log is rotated here (generations .1-.3); the permanent
                         # log is left alone. Only $size of the stat fields is read.
                    730:                           my ($dev,$ino,$mode,$nlink,
                    731:                               $uid,$gid,$rdev,$size,
                    732:                               $atime,$mtime,$ctime,
                    733:                               $blksize,$blocks)=stat($fname);
                    734: 
                    735: if ($size>40000) {
                    736:     print $fh "Rotating logs ...<p>";
                    737:     rename("$fname.2","$fname.3");
                    738:     rename("$fname.1","$fname.2");
                    739:     rename("$fname","$fname.1");
                    740: }
                    741: 
                         # Closes the <pre> opened for the Perm Log, so a "Rotating logs"
                         # message above lands inside that <pre>.
                    742: print $fh "</pre>";
                    743: &errout($fh);
                    744: # ----------------------------------------------------------------- Connections
                         # Sends "pong" to every key of %hostname (in sorted order) through
                         # reply() and tabulates the answers. The expected answer is
                         # "<server>:<lonHostID of this machine>". Any other answer costs one
                         # warning and is shown verbatim; the answer 'con_lost' costs a second
                         # warning on top.
                    745: 
                    746: print $fh '<hr><a name="connections"><h2>Connections</h2>';
                    747: 
                    748: print $fh "<table border=2>";
1.31      albertel  749: foreach $tryserver (sort(keys(%hostname))) {
1.1       albertel  750: 
                    751:     $answer=reply("pong",$tryserver);
                    752:     if ($answer eq "$tryserver:$perlvar{'lonHostID'}") {
                    753: 	$result="<b>ok</b>";
                    754:     } else {
                         # NOTE(review): $answer is placed into the HTML table without
                         # escaping - confirm remote answers cannot contain markup.
                    755:         $result=$answer;
                    756:         $warnings++;
                    757:         if ($answer eq 'con_lost') { $warnings++; }
                    758:     }
                    759:     print $fh "<tr><td>$tryserver</td><td>$result</td></tr>\n";
                    760: 
                    761: }
                    762: print $fh "</table>";
                    763: 
                    764: &errout($fh);
                    765: # ------------------------------------------------------------ Delayed messages
                         # Scans lonnet.perm.log and lists the delayed-message directory.
                         # Each log line is split on ':' into time, status flag, server and
                         # command. Flag 'F' is reported as a failure and costs one warning,
                         # 'D' increments and 'S' decrements the $unsend tally. Every unsent
                         # message then adds five warnings.
                    766: 
                    767: print $fh '<hr><a name="delayed"><h2>Delayed Messages</h2>';
                         # Progress marker on STDOUT (not part of the HTML report).
1.23      www       768: print "buffers\n";
1.1       albertel  769: 
                    770: print $fh '<h3>Scanning Permanent Log</h3>';
                    771: 
                    772: $unsend=0;
                    773: {
                    774:     my $dfh=IO::File->new("$perlvar{'lonDaemons'}/logs/lonnet.perm.log");
                    775:     while ($line=<$dfh>) {
                    776: 	($time,$sdf,$dserv,$dcmd)=split(/:/,$line);
                    777:         if ($sdf eq 'F') { 
                         # $local is computed but not used anywhere in this section.
                    778: 	    $local=localtime($time);
                         # Fix: write the failure line to the report handle. It used to
                         # go to STDOUT, so the HTML fragment ended up in cron's output
                         # and was missing from the status page.
                    779:             print $fh "<b>Failed: $time, $dserv, $dcmd</b><br>";
                    780:             $warnings++;
                    781:         }
                    782:         if ($sdf eq 'S') { $unsend--; }
                    783:         if ($sdf eq 'D') { $unsend++; }
                    784:     }
                    785: }
                    786: print $fh "Total unsend messages: <b>$unsend</b><p>\n";
                         # NOTE(review): if the log holds more 'S' than 'D' lines, $unsend is
                         # negative and this lowers $warnings - confirm that is acceptable.
                    787: $warnings=$warnings+5*$unsend;
                    788: 
                    789: print $fh "<h3>Outgoing Buffer</h3>";
                    790: 
                         # Raw "ls -lF" listing of the delayed directory under lonSockDir.
                    791: open (DFH,"ls -lF $perlvar{'lonSockDir'}/delayed|");
                    792: while ($line=<DFH>) { 
                    793:     print $fh "$line<br>";
                    794: };
                    795: close (DFH);
                    796: 
                    797: # ------------------------------------------------------------------------- End
                         # Closes the report: computes the weighted total
                         # (1 per notice, 4 per warning, 100 per error), prints it with a
                         # timestamp (human-readable local time plus the epoch value) and
                         # ends the HTML document. $totalcount is a global and is read again
                         # after this block to decide whether to send mail.
                    798: print $fh "<a name=errcount>\n";
                    799: $totalcount=$notices+4*$warnings+100*$errors;
                    800: &errout($fh);
                    801: print $fh "<h1>Total Error Count: $totalcount</h1>";
                    802: $now=time;
                    803: $date=localtime($now);
                    804: print $fh "<hr>$date ($now)</body></html>\n";
                         # Progress marker on STDOUT (not part of the HTML report).
1.23      www       805: print "writing done\n";
1.1       albertel  806: }
                    807: 
                    808: rename ("$statusdir/newstatus.html","$statusdir/index.html");
                         # The rename above publishes the freshly written newstatus.html as
                         # index.html in $statusdir; its return value is not checked.
                    809: 
                         # When the weighted total exceeds 200, the page is mailed as
                         # text/html via metasend to the lonAdmEMail and lonSysEMail
                         # addresses. The subject carries the host id and the three counters.
                         # NOTE(review): the command is one shell string with $subj in single
                         # quotes and $emailto unquoted - confirm the configured values
                         # contain no quotes or whitespace.
                    810: if ($totalcount>200) {
1.23      www       811:    print "mailing\n";
1.1       albertel  812:    $emailto="$perlvar{'lonAdmEMail'},$perlvar{'lonSysEMail'}";
                    813:    $subj="LON: $perlvar{'lonHostID'} E:$errors W:$warnings N:$notices"; 
                    814:    system(
1.24      www       815:  "metasend -b -t $emailto -s '$subj' -f $statusdir/index.html -m text/html");
1.1       albertel  816: }
                    817: 1;
                    818: 
                    819: 
                    820: 
                    821: 
                    822: 
                    823: 
                    824: 
                    825: 

FreeBSD-CVSweb <freebsd-cvsweb@FreeBSD.org>