File:  [LON-CAPA] / loncom / xml / lontexconvert.pm
Revision 1.95: download - view: text, annotated - select for diffs
Mon Jan 12 04:46:48 2009 UTC (15 years, 4 months ago) by raeburn
Branches: MAIN
CVS tags: version_2_8_1, version_2_8_0, HEAD, GCI_1, BZ5434-fox
- Add linefeed to HTTP header.

    1: # The LearningOnline Network with CAPA
    2: # TeX Conversion Module
    3: #
    4: # $Id: lontexconvert.pm,v 1.95 2009/01/12 04:46:48 raeburn Exp $
    5: #
    6: # Copyright Michigan State University Board of Trustees
    7: #
    8: # This file is part of the LearningOnline Network with CAPA (LON-CAPA).
    9: #
   10: # LON-CAPA is free software; you can redistribute it and/or modify
   11: # it under the terms of the GNU General Public License as published by
   12: # the Free Software Foundation; either version 2 of the License, or
   13: # (at your option) any later version.
   14: #
   15: # LON-CAPA is distributed in the hope that it will be useful,
   16: # but WITHOUT ANY WARRANTY; without even the implied warranty of
   17: # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
   18: # GNU General Public License for more details.
   19: #
   20: # You should have received a copy of the GNU General Public License
   21: # along with LON-CAPA; if not, write to the Free Software
   22: # Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA
   23: #
   24: # /home/httpd/html/adm/gpl.txt
   25: #
   26: # http://www.lon-capa.org/
   27: #
   28: # Copyright for TtHfunc and TtMfunc by Ian Hutchinson. 
   29: # TtHfunc and TtMfunc (the "Code") may be compiled and linked into 
   30: # binary executable programs or libraries distributed by the 
   31: # Michigan State University (the "Licensee"), but any binaries so 
   32: # distributed are hereby licensed only for use in the context
   33: # of a program or computational system for which the Licensee is the 
   34: # primary author or distributor, and which performs substantial 
   35: # additional tasks beyond the translation of (La)TeX into HTML.
   36: # The C source of the Code may not be distributed by the Licensee
   37: # to any other parties under any circumstances.
   38: #
   39: 
   40: package Apache::lontexconvert;
   41: 
   42: use strict;
   43: use tth();
   44: use vars qw($errorstring);
   45: #use Apache::lonxml();
   46: use Apache::lonlocal;
   47: use Apache::lonnet;
   48: use lib '/home/httpd/lib/perl/';
   49: use LONCAPA;
   50: use URI::Escape;
   51: use IO::Socket::INET;
   52: use IO::Socket::SSL;
   53: 
   54: # ====================================================================== Header
   55: 
   # Initialize the tth/ttm TeX translator for the current request.
   #
   # Reads from %env:
   #   course.<request.course.id>.tthoptions - extra options; appended
   #       (after a single space) only if they contain a non-blank character
   #   browser.mathml  - true selects ttm (ttminit/ttmoptions), otherwise
   #                     tth (tthinit/tthoptions)
   #   browser.unicode - true selects the -u1 option, otherwise -u0
   sub init_tth {
       my $extra=$env{'course.'.$env{'request.course.id'}.'.tthoptions'};
       # Whitespace-only (or missing) course options contribute nothing.
       $extra=($extra =~ /\S/) ? ' '.$extra : '';
       my $flags='-L -u'.($env{'browser.unicode'} ? '1' : '0').$extra;
       if ($env{'browser.mathml'}) {
           &tth::ttminit();
           &tth::ttmoptions($flags);
       } else {
           &tth::tthinit();
           &tth::tthoptions($flags);
       }
   }
   79: 
   80: # ================================================================== Conversion
   81: 
   # Set to 1 once a conversion has gone wrong (SEGV, alarm timeout or an
   # evaluation error); tth_converted() checks it before converting.
   $Apache::lontexconvert::messedup=0;


   # Run tth (or ttm when $env{'browser.mathml'} is set) on a TeX string.
   #
   # Parameter: $texstring - reference to the TeX source
   # Returns:   (converted markup, accumulated tth/ttm error text)
   #
   # The conversion is bracketed by &Apache::lonxml::start_alarm() and
   # &Apache::lonxml::end_alarm().  Both signal handlers installed here set
   # the messedup flag and die, so callers should invoke this inside an eval.
   sub convert_real {
       my ($texstring)=@_;
       my ($html,$errors);
       local $SIG{SEGV}=sub {
           $Apache::lontexconvert::messedup=1;
           die;
       };
       local $SIG{ALRM}=sub {
           &Apache::lonnet::logthis("ALRM");
           $html='['.&mt("TeX unconverted due to errors").']';
           $Apache::lontexconvert::messedup=1;
           die &mt("TeX unconverted due to errors");
       };
       &Apache::lonxml::start_alarm();
       if (!$env{'browser.mathml'}) {
           # Plain HTML output through tth.
           $html=&tth::tth($$texstring);
           $errors.=&tth::ttherror();
           $html=~s-</font(\s*)>-</font>-g;
       } else {
           # MathML output through ttm, patched up to be well-formed XML.
           $html=&tth::ttm($$texstring);
           $html=~s/\<math\>/\<math xmlns=\"\&mathns\;\"\>/g;
           $html=~s/\<br\>/\<br\/\>/g;
           $html=~s/\<p\>/\<p\>\<\/p\>/g;
           $errors.=&tth::ttmerror();
       }
       # Drop the clear="all" attribute of a leading <br>, then trim.
       $html=~s/^\s*\<br clear\=\"all\"/\<br/s;
       $html=~s/^\s*//;
       $html=~s/\s*$//;
       #
       # \rightleftharpoons is not converted by tth; replace any that is
       # left in the output with the character U+21CC (&#8652;).  If we get
       # many more of these, we're going to need a translation sub.
       #
       my $harpoons=pack("U", 0x21cc);
       $html=~s/\\rightleftharpoons/$harpoons/g;

       &Apache::lonxml::end_alarm();
       return ($html,$errors);
   }
  121: 
  # Convert a TeX string with tth/ttm and return the resulting markup.
  #
  # Parameter: $texstring - reference to the TeX source; it is modified in
  #            place (a \documentstyle{article} prefix is prepended)
  # Returns:   the converted markup, or a bracketed placeholder message when
  #            an earlier conversion already failed or this one did not
  #            produce output
  #
  # Error text is stored in the package variable $errorstring.  After any
  # failure the messedup flag is set and the current Apache child is asked
  # to terminate via child_terminate().
  sub tth_converted {
      my $texstring=shift;
      my $xmlstring='['.&mt('UNDISPLAYABLE').']';
      return '['.&mt('TeX unconverted due to previous errors').']'
          if ($Apache::lontexconvert::messedup);

      $$texstring ='\\documentstyle{article}'.$$texstring;

      # convert_real() is reached through a string eval; see the POD entry
      # for convert_real() at the end of this file for the background.
      eval(<<'ENDCONV');
    ($xmlstring,$errorstring)=&convert_real($texstring)
ENDCONV
      if ($@) {
          $errorstring.=&mt("Evaluation Error: ").$@;
          $Apache::lontexconvert::messedup=1;
      }

      my $failed=($Apache::lontexconvert::messedup || &tth::tthmessedup() ||
                  $errorstring);
      return $xmlstring if (!$failed);

      &Apache::lonnet::logthis("Trying to kill myself");
      $Apache::lontexconvert::messedup=1;

      # Locate a request object: the one lonxml holds if it is a reference,
      # otherwise whatever Apache / Apache2::RequestUtil can provide.
      my $request;
      if (ref($Apache::lonxml::request)) {
          $request=$Apache::lonxml::request;
      } else {
          eval { $request=Apache->request; };
          if (!$request) {
              eval { $request=Apache2::RequestUtil->request; };
          }
      }
      if ($request) {
          $request->child_terminate();
      } else {
          &Apache::lonnet::logthis("Unable to find a request to do child_terminate on");
      }
      return $xmlstring;
  }
  158: 
  # Strip math-mode delimiters from a TeX string, in place.
  #
  # Removes every unescaped "$", every \( \) \[ \] and every \ensuremath.
  #
  # Parameter: $texstring - reference to the TeX source (modified)
  # Returns:   the empty string
  sub clean_out_math_mode {
      my ($texstring)=@_;
      foreach my $delimiter (qr/(?<!\\)\$/,
                             qr/\\[\)\(\]\[]/,
                             qr/\\ensuremath/) {
          $$texstring=~s/$delimiter//g;
      }
      return '';
  }
  166: 
  # Guess whether a TeX string is meant to be typeset in display mode.
  #
  # Parameter: $texstring - reference to the TeX source (not modified)
  # Returns:   1 if the string contains an unescaped "$$", a "\[" or a
  #            "\displaystyle"; 0 otherwise
  sub displaystyle {
      my ($texstring)=@_;
      # A negative lookbehind (rather than requiring some non-backslash
      # character in front) lets a "$$" at the very start of the string
      # count too, and matches how clean_out_math_mode() treats "\$".
      if ($$texstring=~/(?<!\\)\$\$/ ||
          $$texstring=~/\\\[/ ||
          $$texstring=~/\\displaystyle/) {
          return 1;
      }
      return 0;
  }
  175: 
  # Wrap a TeX string in the element jsMath looks for.
  #
  # Parameter: $texstring - reference to the TeX source; its math-mode
  #            delimiters are stripped in place
  # Returns:   the jsMath header (if it still has to be sent) followed by a
  #            <div class="math"> for display-mode TeX or a
  #            <span class="math"> otherwise
  sub jsMath_converted {
      my $texstring=shift;
      # Decide on the element before the delimiters are removed.
      my $tag=&displaystyle($texstring) ? 'div' : 'span';
      &clean_out_math_mode($texstring);
      my $output=&jsMath_header();
      $output.='<'.$tag.' class="math">'.$$texstring.'</'.$tag.'>';
      return $output;
  }
  184: 
  # Bookkeeping for the jsMath <script> header.
  #
  # A private stack holds one flag per nesting level: 0 while the header
  # has not been emitted at that level, 1 once it has.
  #   jsMath_reset()   - empties the stack
  #   jsMath_push()    - opens a new level (flag 0)
  #   jsMath_header()  - returns the header markup the first time it is
  #                      called at the current level, '' afterwards (and ''
  #                      plus a log entry if no level is open)
  #   jsMath_process() - closes the current level; returns the
  #                      jsMath.Process() script if the header was sent at
  #                      that level, '' otherwise
  #   jsMath_state($i) - returns the flag stored at stack index $i
  {
      my @header_sent_stack;

      sub jsMath_reset {
          undef(@header_sent_stack);
      }

      sub jsMath_push {
          push(@header_sent_stack,0);
      }

      sub jsMath_header {
          if (!@header_sent_stack) {
              &Apache::lonnet::logthis("mismatched calls of jsMath_header and jsMath_process");
              return '';
          }
          if ($header_sent_stack[-1]) {
              return '';
          }
          $header_sent_stack[-1]=1;
          # Assembled piecewise so the emitted whitespace does not depend
          # on how this source file is indented.
          my $setup=
              '<script type="text/javascript">'."\n".
              (' ' x 21).'function NoFontMessage () {}'."\n".
              (' ' x 21).'jsMath = {Parser: {prototype: {environments: {\'eqnarray*\' :[\'Array\',null,null,\'rcl\',[5/18,5/18],3,\'D\']}}}};'."\n".
              (' ' x 19).'</script>'."\n";
          my $loader=
              '<script type="text/javascript" src="/adm/jsMath/jsMath.js"></script>'."\n";
          return $setup.$loader;
      }

      sub jsMath_process {
          my $was_sent=pop(@header_sent_stack);
          if ($was_sent) {
              return "\n".
                  '<script type="text/javascript">jsMath.Process()</script>'."\n";
          }
          return '';
      }

      sub jsMath_state {
          my ($level) = @_;
          return $header_sent_stack[$level];
      }
  }
  218: 
  # Work out which TeX rendering engine to use.
  #
  # The first of these that applies wins:
  #   1. $env{'form.texengine'}, if present and not the empty string
  #   2. $env{'course.<request.course.id>.texengine'}, if a course id is
  #      set and that key exists
  #   3. $env{'environment.texengine'}, if that key exists
  #   4. the default, 'tth'
  sub tex_engine {
      if (exists($env{'form.texengine'}) && $env{'form.texengine'} ne '') {
          return $env{'form.texengine'};
      }
      my $course_id=$env{'request.course.id'};
      if ($course_id) {
          my $course_key='course.'.$course_id.'.texengine';
          return $env{$course_key} if (exists($env{$course_key}));
      }
      return $env{'environment.texengine'}
          if (exists($env{'environment.texengine'}));
      return 'tth';
  }
  234: 
  # Prepare math rendering for a new nesting level.
  #
  # Initializes tth, opens a new jsMath header level, and returns the
  # jsMath header when it is needed.
  #
  # Parameter: $inherit_jsmath - if true, the header is also returned when
  #            &jsMath_state(-2) is true
  # Returns:   the result of jsMath_header() when the selected engine is
  #            jsMath (compared case-insensitively) or the inherit rule
  #            applies; otherwise nothing
  sub init_math_support {
      my ($inherit_jsmath) = @_;
      &init_tth();
      &Apache::lontexconvert::jsMath_push();
      my $needs_header=(lc(&tex_engine()) eq 'jsmath');
      if (!$needs_header && $inherit_jsmath) {
          $needs_header=&jsMath_state(-2);
      }
      return if (!$needs_header);
      return &Apache::lontexconvert::jsMath_header();
  }
  245: 
  # Ask the local mimetex CGI for the vertical alignment of a rendered
  # expression.
  #
  # Sends an HTTP HEAD request for /cgi-bin/mimetex.cgi?<expression> to this
  # server (over SSL when the host's protocol is 'https') and looks for a
  # "Vertical-Align:" header in the response.
  #
  # Parameter: $esc_texstring - the URI-escaped TeX expression
  # Returns:   the integer from the last Vertical-Align header seen, or 0
  #            if there was none or no connection could be made
  #
  # The network exchange is bracketed by &Apache::lonxml::start_alarm() and
  # &Apache::lonxml::end_alarm().
  sub mimetex_valign {
      my ($esc_texstring)=@_;
      my $valign = 0;
      my $lonhost = $Apache::lonnet::perlvar{'lonHostID'};
      my $hostname = &Apache::lonnet::hostname($lonhost);
      my $protocol = $Apache::lonnet::protocol{$lonhost};
      my $path = '/cgi-bin/mimetex.cgi?'.$esc_texstring;
      my $socket;
      &Apache::lonxml::start_alarm();
      if ($protocol eq 'https') {
          $socket = IO::Socket::SSL->new(PeerAddr => $hostname,
                                         PeerPort => 'https(443)',
                                         Proto    => 'tcp');
      } else {
          $socket = IO::Socket::INET->new(PeerAddr => $hostname,
                                          PeerPort => 'http(80)',
                                          Proto    => 'tcp');
      }
      if ($socket) {
          my $headreq = "HEAD $path HTTP/1.0\r\nUser-Agent: Mozilla/5.0\r\n\r\n";
          print $socket $headreq;
          # Read into a lexical: while (<$socket>) would assign to the
          # global $_ without localizing it and could clobber the caller's.
          while (my $line = <$socket>) {
              # Accept only an optionally signed integer, so that stray
              # dashes can never end up in the CSS value built from this.
              if ($line =~ /Vertical\-Align\:\s*(-?\d+)/) {
                  $valign = $1;
              }
          }
          if ($protocol eq 'https') {
              $socket->close(SSL_no_shutdown => 1,
                             SSL_ctx_free => 1);
          } else {
              $socket->close();
          }
      }
      &Apache::lonxml::end_alarm();
      return $valign;
  }
  282: 
  # Render a TeX string as an <img> served by the mimetex CGI.
  #
  # Parameter: $texstring - reference to the TeX source; modified in place
  #            (math delimiters are stripped and, for display-mode input,
  #            "\displaystyle \Large " is prepended)
  # Returns:   an <img> tag whose src is /cgi-bin/mimetex.cgi?<escaped TeX>,
  #            vertically aligned as reported by mimetex_valign(), with the
  #            TeX source as alt text; wrapped in <center> for display mode
  sub mimetex_converted {
      my $texstring=shift;
      my $displaystyle=&displaystyle($texstring);

      &clean_out_math_mode($texstring);

      if ($displaystyle) {
          $$texstring='\\displaystyle \\Large '.$$texstring;
      }
      my $esc_texstring = &uri_escape($$texstring);
      my $valign = &mimetex_valign($esc_texstring);

      # The TeX source may come from entity-decoded message text, so
      # escape the characters that could end the attribute or open a tag.
      # Browsers decode these again, so the displayed alt text is unchanged.
      my $alt='$'.$$texstring.'$';
      $alt=~s/&/&amp;/g;
      $alt=~s/</&lt;/g;
      $alt=~s/>/&gt;/g;
      $alt=~s/"/&quot;/g;

      my $result='<img src="/cgi-bin/mimetex.cgi?'.$esc_texstring.'" style="vertical-align:'.$valign.'px" alt="'.$alt.'" />';
      if ($displaystyle) {
          $result='<center>'.$result.'</center>';
      }
      return $result;
  }
  300: 
  # Convert a TeX string with the requested (or configured) engine.
  #
  # Parameters: $string - reference to the TeX source
  #             $mode   - engine name; when empty, tex_engine() decides
  # Returns:    the markup produced by the selected converter
  #
  # The mode is matched case-insensitively as a substring.  "tth" is
  # checked first, then "jsmath", then "mimetex"; anything else falls back
  # to tth.
  sub converted {
      my ($string,$mode)=@_;
      $mode = &tex_engine() if ($mode eq '');
      if ($mode !~ /tth/i) {
          return &jsMath_converted($string)  if ($mode =~ /jsmath/i);
          return &mimetex_converted($string) if ($mode =~ /mimetex/i);
      }
      return &tth_converted($string);
  }
  313: 
  314: # ------------------------------------------------------------ Message display
  315: 
  # Prepare a TeX fragment taken from message text and convert it.
  #
  # <br> and <br /> tags become single spaces, HTML entities are decoded,
  # and the result is handed to converted() with the default engine.
  #
  # Parameter: $string - the fragment (a copy is worked on)
  # Returns:   whatever converted() returns for the cleaned-up fragment
  sub to_convert {
      my $fragment=shift;
      $fragment=~s/\<br\s*\/?\>/ /gs;
      my $decoded=&HTML::Entities::decode($fragment);
      return &converted(\$decoded);
  }
  323: 
  # Replace text emoticons with icon images.
  #
  # Parameter: $expression - the text to process
  # Returns:   the text with each recognized emoticon replaced by an <img>
  #            tag pointing at <lonIconsURL>/<name>.gif, or the text
  #            unchanged when $env{'browser.imagesuppress'} is 'on'
  sub smiley {
      my $expression=shift;
      if ($env{'browser.imagesuppress'} eq 'on') { return $expression; }
      # Ordered list of [pattern, icon name].  The order matters: the
      # "shocked" pattern can match ":-()" while "frowny" matches its
      # prefix ":-(", so iterating over a hash (whose key order is not
      # defined) could give either result.  "shocked" is tried first.
      my @smileys=(['\:\-\)'         => 'smiley'],
                   ['8\-\)'          => 'coolsmile'],
                   ['8\-(I|\|)'      => 'coolindiff'],
                   [':\-(I|\|)'      => 'neutral'],
                   ['\:\-(o|O|\(\))' => 'shocked'],
                   [':\-\('          => 'frowny'],
                   ['\;\-\)'         => 'wink'],
                   ['\:\-P'          => 'baeh'],
                   ['\:\-(\\\|\\/)'  => 'hrrm'],
                   ['\:\-D'          => 'bigsmile'],
                   ['\:\-C'          => 'angry'],
                   ['\:(\'|\`)\-\('  => 'cry'],
                   ['\:\-(X|\#)'     => 'lipsrsealed'],
                   ['\:\-S'          => 'huh']);
      my $iconpath=$Apache::lonnet::perlvar{'lonIconsURL'};
      foreach my $entry (@smileys) {
          my ($pattern,$icon)=@{$entry};
          $expression=~s/$pattern/\<img src="$iconpath\/${icon}.gif" \/\>/gs;
      }
      return $expression;
  }
  347: 
  # Render the <m>...</m> (TeX) and <algebra>...</algebra> sections of a
  # message.
  #
  # The message is split on <m>/</m> tags (written literally or with
  # &lt; &gt;, any case).  Pieces outside the tags go through smiley(),
  # pieces inside go through to_convert().  The result is then split on
  # <algebra> tags the same way: outside pieces are kept verbatim, inside
  # pieces go through algebra() with target 'web'.
  #
  # Parameters: $message - the message text
  #             $email   - if true, each converted piece is wrapped in
  #                        </pre><tt> ... </tt><pre>
  # Returns:    in list context ($outmessage,$errorstring); in scalar
  #             context the two concatenated
  #
  # Resets the package variable $errorstring and calls init_tth() first.
  sub msgtexconverted {
      my ($message,$email) = @_;
      $errorstring='';
      &init_tth();

      my ($before,$after)=('','');
      if ($email) {
          ($before,$after)=('</pre><tt>','</tt><pre>');
      }

      # Pieces at odd positions are the ones that were between tags.
      my @pieces=split(/(?:\&lt\;|\<)\/*m\s*(?:\&gt\;|\>)/i,$message);
      my $with_tex='';
      foreach my $idx (0..$#pieces) {
          if ($idx % 2) {
              $with_tex.=$before.&to_convert($pieces[$idx]).$after;
          } else {
              $with_tex.=&smiley($pieces[$idx]);
          }
      }

      @pieces=split(/(?:\&lt\;|\<)\/*algebra\s*(?:\&gt\;|\>)/i,
                    $with_tex);
      my $outmessage='';
      foreach my $idx (0..$#pieces) {
          if ($idx % 2) {
              $outmessage.=$before.&algebra($pieces[$idx],'web').$after;
          } else {
              $outmessage.=$pieces[$idx];
          }
      }

      if (wantarray) {
          return ($outmessage,$errorstring);
      }
      return $outmessage.$errorstring;
  }
  390: 
  # Convert an algebra expression to LaTeX and, for web targets, render it.
  #
  # Parameters: $string    - the algebra expression
  #             $target    - 'web' or 'analyze' renders the LaTeX through
  #                          converted(); any other value returns the LaTeX
  #             $style     - 'display' wraps the LaTeX in $$...$$, anything
  #                          else in \ensuremath{...}
  #             $parstack, $safeeval - passed to
  #                          &Apache::lonxml::get_param to look up the
  #                          'display' parameter (the rendering mode)
  # Returns:    the rendered markup or LaTeX; if the expression cannot be
  #             parsed, the parser's error is reported through
  #             &Apache::lonxml::error and a bracketed "unconverted"
  #             message is returned
  sub algebra {
      use AlgParser;

      my ($string,$target,$style,$parstack,$safeeval)=@_;
      my $parser = AlgParserWithImplicitExpand->new();
      $string=&prepare_algebra($string);
      my $ret = $parser->parse($string);
      my $result='['.&mt('Algebra unconverted due to previous errors').']';
      if ( ref($ret) ) {
          #$parser->tostring();
          $parser->normalize();
          my $latex=$parser->tolatex();
          $latex=&postprocess_algebra($latex);
          if ($style eq 'display') {
              # NOTE(review): the trailing "x" after the closing $$ looks
              # unintentional - confirm before removing it.
              $latex='$$'.$latex.'$$x';
          } else {
              # style is 'inline'
              $latex='\\ensuremath{'.$latex.'}';
          }
          if ($target eq 'web' || $target eq 'analyze') {
              my $display=&Apache::lonxml::get_param('display',$parstack,$safeeval);
              $result = &converted(\$latex,$display);
          } else {
              $result = $latex;
          }
      } else {
          &Apache::lonxml::error($parser->{'htmlerror'});
      }
      # Return explicitly: without this the parse-failure path returned
      # whatever &Apache::lonxml::error returned instead of the message.
      return $result;
  }
  421: 
  # Pre-process an algebra expression before it is parsed.
  #
  # Inserts " zeroplace " in front of a minus sign that directly follows
  # "<>", "<=", or ">=" plus one of "=", ">", "<" and optional spaces;
  # supposedly this makes deciding what is a minus sign easier.
  #
  # NOTE(review): only the third alternative takes the extra character and
  # the optional spaces.  That looks like a missing "|" in the pattern, but
  # the intent cannot be confirmed from this file, so it is left as is.
  #
  # Parameter: $string - the algebra expression
  # Returns:   the adjusted expression
  sub prepare_algebra {
      my $expression=shift;
      $expression =~ s/(\<\>|\<\=|\>\=[\=\>\<] *)-/$1 zeroplace -/g;
      return $expression;
  }
  430: 
  # Rewrite multi-argument function calls in parser-generated LaTeX into
  # conventional notation.
  #
  # Parameter: $string - the LaTeX to adjust
  # Returns:   the adjusted LaTeX
  sub postprocess_algebra {
      my ($string)=@_;

      # moodle had these and I don't know why, ignoring them for now
      # $string =~s/\\fun/ /g;

      # sqrt(3,4) means the 4th root of 3
      # (literal braces are escaped: an unescaped "{" after a literal
      # character is a fatal regex error in newer Perl versions)
      $string =~s/\\sqrt\{([^,]+),([^\}]+)\}/\\sqrt[$2]{$1}/gs;

      # log(3,4) means the log base 4 of 3
      $string =~s/\\log\\left\((.+?),(.+?)\\right\)/\\log_{$2}\\left($1\\right)/gs;

      # sin(x,2) means sin to the power 2 of x; likewise for cos, tan,
      # sec, csc, cot and their hyperbolic (h) forms
      $string =~s/\\((?:sin|cos|tan|sec|csc|cot)(?:h)?)\\left\((.+?),(.+?)\\right\)/\\$1^{$3}\\left($2\\right)/gs;

      # int(3,a,b) integral from a to b of 3
      $string =~s/\\int\\left\((.+?),(.+?),(.+?)\\right\)/\\int_{$2}^{$3}\\left($1\\right)/gs;

      # int( ... dx) -> ...
      # NOTE(review): this keeps only the integrand and drops both the
      # \int and the differential - confirm that is intended.
      $string =~s/\\int\\left\((.+?)d[a-z]\\right\)/$1/gs;

      # lim(f,x,a) limit of f as x goes to a
      $string =~s/\\lim\\left\((.+?),(.+?),(.+?)\\right\)/\\lim_{$2\\to $3}$1/gs;
      return $string;
  }
  456: 1;
  457: __END__
  458: 
  459: 
  460: =pod
  461: 
  462: =head1 NAME
  463: 
  464: Apache::lontexconvert - TeX conversion via tth/ttm, jsMath or mimetex
  465: 
  466: =head1 SYNOPSIS
  467: 
  468: Access to tth/ttm
  469: 
  470: This is part of the LearningOnline Network with CAPA project
  471: described at http://www.lon-capa.org.
  472: 
  473: 
  474: =head1 SUBROUTINES
  475: 
  476: =over
  477: 
  478: =item init_tth()
  479: 
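  480: Initializes tth (or ttm, for MathML-capable browsers) with the -L and -u options plus any course-specific tthoptions.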
  481: 
  482: =item convert_real()
  483: 
  484:  We need this routine because &converted can be called from inside
  485:  the safe space (through &xmlparse('<m>stuff</m>')), which does not
  486:  allow the alarm opcode. It must therefore be compiled before we enter
  487:  the safe space, since opcode checks only occur at compile time.
  488: 
  489: =item tth_converted()
  490: 
  491: 
  492: =item clean_out_math_mode()
  493: 
  494: 
  495: =item displaystyle()
  496: 
  497: 
  498: =item jsMath_converted()
  499: 
  500: 
  501: =item tex_engine()
  502: 
  503: 
  504: =item init_math_support()
  505: 
  506: 
  507: =item mimetex_converted()
  508: 
  509: 
  510: =item converted()
  511: 
  512: 
  513: =item to_convert()
  514: 
  515: Message display: replaces <br> tags with spaces, decodes HTML entities, and passes the result to converted().
  516: 
  517: =item smiley()
  518: 
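  519: Replaces text emoticons such as :-) with icon images, unless the browser.imagesuppress setting is 'on'.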
  520: 
  521: =item msgtexconverted()
  522: 
  523: =item algebra()
  524: 
  525: =item prepare_algebra()
  526: 
  527: =item postprocess_algebra()
  528: 
  529: =back
  530: 
  531: =cut
  532: 
  533: 
  534: 

FreeBSD-CVSweb <freebsd-cvsweb@FreeBSD.org>