1: # The LearningOnline Network with CAPA
2: # TeX Conversion Module
3: #
4: # $Id: lontexconvert.pm,v 1.119 2016/04/09 14:48:13 raeburn Exp $
5: #
6: # Copyright Michigan State University Board of Trustees
7: #
8: # This file is part of the LearningOnline Network with CAPA (LON-CAPA).
9: #
10: # LON-CAPA is free software; you can redistribute it and/or modify
11: # it under the terms of the GNU General Public License as published by
12: # the Free Software Foundation; either version 2 of the License, or
13: # (at your option) any later version.
14: #
15: # LON-CAPA is distributed in the hope that it will be useful,
16: # but WITHOUT ANY WARRANTY; without even the implied warranty of
17: # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
18: # GNU General Public License for more details.
19: #
20: # You should have received a copy of the GNU General Public License
21: # along with LON-CAPA; if not, write to the Free Software
22: # Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
23: #
24: # /home/httpd/html/adm/gpl.txt
25: #
26: # http://www.lon-capa.org/
27: #
28: # Copyright for TtHfunc and TtMfunc by Ian Hutchinson.
29: # TtHfunc and TtMfunc (the "Code") may be compiled and linked into
30: # binary executable programs or libraries distributed by the
31: # Michigan State University (the "Licensee"), but any binaries so
32: # distributed are hereby licensed only for use in the context
33: # of a program or computational system for which the Licensee is the
34: # primary author or distributor, and which performs substantial
35: # additional tasks beyond the translation of (La)TeX into HTML.
36: # The C source of the Code may not be distributed by the Licensee
37: # to any other parties under any circumstances.
38: #
39:
40: package Apache::lontexconvert;
41:
42: use strict;
43: use tth();
44: use vars qw($errorstring);
45: #use Apache::lonxml();
46: use Apache::lonlocal;
47: use Apache::lonnet;
48: use lib '/home/httpd/lib/perl/';
49: use LONCAPA;
50: use URI::Escape;
51: use IO::Socket::INET;
52:
53:
54: #
55: # Table of substitutions to unicode characters.
56: #
57:
# Strings looked for in converter output by convert_real(), each mapped to
# the code point of the character substituted for it.
my %unicode_harpoons = (
'\rightleftharpoons' => 0x21cc,
);

# Strings looked for in converter output by convert_real(), each mapped to
# the code point substituted for it when unicode output is used.
# NOTE(review): every key below is the empty string in this copy of the
# file, so all entries collapse into a single '' key.  The original key
# characters appear to have been lost; restore them from a pristine copy
# before relying on this table.
my %unicode_translations = (

# Brackets - unicode for browsers/OS which support it.

'' => 0x23a1,
'' => 0x23a2,
'' => 0x23a3,
'' => 0x23a4,
'' => 0x23a5,
'' => 0x23a6,

# Parens - unicode for browsers/OS which support it

'' => 0x239b,
'' => 0x239c,
'' => 0x239d,
'' => 0x239e,
'' => 0x239f,
'' => 0x23a0,

);

# Fallback for the same keys as %unicode_translations: convert_real() looks
# the key up here instead when it decides plain ASCII must be used.
# NOTE(review): the keys are empty strings here as well - see above.
my %ascii_8bit_translations = (

# Brackets - pure 8-bit ascii ugliness for browsers/OS which can't handle unicode

'' => 0x5b,
'' => 0x5b, # '['
'' => 0x5b,
'' => 0x5d, # ']'
'' => 0x5d,
'' => 0x5d,

# Parens - pure 8-bit ascii ugliness for browsers/OS which can't handle unicode

'' => 0x28,
'' => 0x28, # '('
'' => 0x28,
'' => 0x29,
'' => 0x29, # ')'
'' => 0x29,

);
105:
##
# Utility to replace every occurrence of a literal string with a single
# unicode character:
#
# @param input   - Input string
# @param pattern - Literal text to look for.  It is matched verbatim
#                  (regular expression metacharacters are escaped), so a
#                  TeX command such as '\rightleftharpoons' matches itself
#                  instead of being read as the escape \r followed by
#                  'ightleftharpoons'.
# @param unicode - Code point of the character substituted for pattern.
#
# @return string - resulting string.  The input is returned unchanged when
#                  pattern is empty or undefined, or unicode is undefined.
#
sub unicode_subst {
    my ($input, $pattern, $unicode) = @_;

    # An empty pattern would make s/// reuse the last successful pattern,
    # and an undefined code point would be packed as a NUL character.
    return $input if (!defined($pattern) || $pattern eq '');
    return $input if (!defined($unicode));

    my $char = pack('U', $unicode);

    $input =~ s/\Q$pattern\E/$char/g;

    return $input;
}
124:
125: # ====================================================================== Header
126:
# Initialise the tth (HTML) or ttm (MathML) converter for this request.
#
# Reads the course's 'tthoptions' setting and the browser.mathml and
# browser.unicode flags from %env.  The converter is given '-L -u1' when
# browser.unicode is set and '-L -u0' otherwise, followed by the course
# options if they contain anything other than whitespace.
sub init_tth {
    my $courseopts = $env{'course.'.$env{'request.course.id'}.'.tthoptions'};
    my $extra      = ($courseopts =~ /\S/) ? ' '.$courseopts : '';
    my $flags      = '-L -u'.($env{'browser.unicode'} ? '1' : '0').$extra;

    if ($env{'browser.mathml'}) {
        &tth::ttminit();
        &tth::ttmoptions($flags);
    } else {
        &tth::tthinit();
        &tth::tthoptions($flags);
    }
}
150:
151: # ================================================================== Conversion
152:
# Set to 1 when a conversion fails (SEGV, alarm, or an error reported to
# tth_converted); tth_converted() refuses to convert while it is set.
$Apache::lontexconvert::messedup=0;


# Run ttm (when browser.mathml is set) or tth on the TeX source referenced
# by $texstring, tidy the markup and apply the character substitution tables.
#
# Returns the list (converted markup, converter error text).
# A SEGV or an alarm raised during conversion sets the messedup flag and
# dies, so callers are expected to wrap this call in an eval.
sub convert_real {
    my ($texstring)=@_;
    my ($xmlstring,$errorstring);
    local $SIG{SEGV}=sub { $Apache::lontexconvert::messedup=1; die; };
    local $SIG{ALRM}=sub {
        &Apache::lonnet::logthis("ALRM");
        $xmlstring='['.&mt("TeX unconverted due to errors").']';
        $Apache::lontexconvert::messedup=1;
        die &mt("TeX unconverted due to errors");
    };

    &Apache::lonxml::start_alarm();
    if ($env{'browser.mathml'}) {
        $xmlstring=&tth::ttm($$texstring);
        for ($xmlstring) {
            s/\<math\>/\<math xmlns=\"\&mathns\;\"\>/g;
            s/\<br\>/\<br\/\>/g;
            s/\<p\>/\<p\>\<\/p\>/g;
        }
        $errorstring.=&tth::ttmerror();
    } else {
        $xmlstring=&tth::tth($$texstring);
        $errorstring.=&tth::ttherror();
        $xmlstring=~s{</font(\s*)>}{</font>}g;
    }
    # Trim the converter output: leading <br clear="all">, surrounding
    # whitespace, and a <br /> directly in front of a table.
    for ($xmlstring) {
        s/^\s*\<br clear\=\"all\"/\<br/s;
        s/^\s*//;
        s/\s*$//;
        s/^<br \/><table/<table/;
    }
    &Apache::lonxml::end_alarm();

    #
    # Several strings produced by tth require transliteration to unicode
    # equivalents to render reliably in browsers.  %unicode_translations
    # and %unicode_harpoons are tables of string->substitution which we
    # now apply.  (%ascii_8bit_translations is used instead for Windows
    # versions below 6.0 and for mobile devices.)
    #
    my $use_ascii;
    if ($env{'browser.mobile'}
        || (($env{'browser.os'} eq 'win')
            && $env{'browser.osversion'}
            && ($env{'browser.osversion'} < 6.0))) {
        $use_ascii = 1;
    }
    my $codes = $use_ascii ? \%ascii_8bit_translations
                           : \%unicode_translations;

    foreach my $pattern (keys(%unicode_translations)) {
        $xmlstring = &unicode_subst($xmlstring, $pattern, $codes->{$pattern});
    }
    foreach my $pattern (keys(%unicode_harpoons)) {
        $xmlstring = &unicode_subst($xmlstring, $pattern,
                                    $unicode_harpoons{$pattern});
    }

    return ($xmlstring,$errorstring);
}
215:
# Convert the TeX referenced by $texstring with tth/ttm and return the
# resulting markup.
#
# The referenced string is modified: '\documentstyle{article}' is prepended.
# If a previous conversion failed, a bracketed notice is returned without
# running the converter.  If this conversion fails (or tth reports it is
# messed up, or any error text was produced) the Apache child is asked to
# terminate after the request.
sub tth_converted {
    my ($texstring)=@_;
    my $xmlstring='['.&mt('UNDISPLAYABLE').']';
    return '['.&mt('TeX unconverted due to previous errors').']'
        if ($Apache::lontexconvert::messedup);

    $$texstring ='\\documentstyle{article}'.$$texstring;

    # String eval on purpose: the call is compiled only when it runs.
    eval(<<'ENDCONV');
($xmlstring,$errorstring)=&convert_real($texstring)
ENDCONV
    if ($@) {
        $errorstring.=&mt("Evaluation Error: ").$@;
        $Apache::lontexconvert::messedup=1;
    }

    my $failed = ($Apache::lontexconvert::messedup || &tth::tthmessedup()
                  || $errorstring);
    return $xmlstring unless ($failed);

    &Apache::lonnet::logthis("Trying to kill myself");
    $Apache::lontexconvert::messedup=1;

    if (ref($Apache::lonxml::request)) {
        $Apache::lonxml::request->child_terminate();
        return $xmlstring;
    }

    # No request object stored by lonxml: ask Apache for one, first via the
    # Apache class, then via Apache2::RequestUtil.
    my $request = eval { Apache->request };
    if (!$request) {
        $request = eval { Apache2::RequestUtil->request };
    }
    if ($request) {
        $request->child_terminate();
    } else {
        &Apache::lonnet::logthis("Unable to find a request to do child_terminate on");
    }
    return $xmlstring;
}
252:
# Strip math-mode delimiters from the TeX referenced by $texstring, in place:
# unescaped '$', the pairs \( \) and \[ \], and the \ensuremath command name.
# Always returns the empty string.
sub clean_out_math_mode {
    my ($texstring)=@_;
    for ($$texstring) {
        s/(?<!\\)\$//g;
        s/\\[\)\(\]\[]//g;
        s/\\ensuremath//g;
    }
    return '';
}
260:
# Guess whether the TeX referenced by $texstring is meant for display mode.
#
# Returns 1 if it contains an unescaped $$, a \[, \displaystyle or the word
# eqnarray; returns 0 otherwise.
sub displaystyle {
    my ($texstring)=@_;
    # The lookbehind (rather than a preceding non-backslash character) lets
    # a $$ at the very start of the string count as well.
    if ($$texstring=~/(?<!\\)\$\$/ ||
        $$texstring=~/\\\[/ ||
        $$texstring=~/\\displaystyle/ ||
        $$texstring=~/eqnarray/
        ) { return 1; }
    return 0;
}
271:
# Wrap the TeX referenced by $texstring in a MathJax <script> element.
#
# The script type carries ' mode=display' when displaystyle() says so.
# The math delimiters are then stripped from the referenced string, and the
# result of MathJax_header() is placed in front of the element.
sub MathJax_converted {
    my ($texstring)=@_;
    my $tag = &displaystyle($texstring) ? 'math/tex; mode=display'
                                        : 'math/tex;';
    &clean_out_math_mode($texstring);
    my $header = &MathJax_header();
    return $header.'<script type="'.$tag.'">'.$$texstring.'</script>';
}
280:
{
    # Relies heavily on the previous jsMath installation.
    #
    # Stack of flags, one per MathJax_push() call; the top entry becomes
    # true once MathJax_header() has handed out the loader <script>.
    my @MathJax_sent_header;

    # Forget all pushed entries.
    sub MathJax_reset {
        undef(@MathJax_sent_header);
    }

    # Open a new entry for which no header has been sent yet.
    sub MathJax_push {
        push(@MathJax_sent_header,0);
    }

    # Return the MathJax loader <script> the first time it is called for
    # the current entry and '' on later calls.  Without any entry the
    # mismatch is logged and '' is returned.
    sub MathJax_header {
        unless (@MathJax_sent_header) {
            &Apache::lonnet::logthis("mismatched calls of MathJax_header and MathJax_process");
            return '';
        }
        if ($MathJax_sent_header[-1]) {
            return '';
        }
        $MathJax_sent_header[-1]=1;
        my $loader =
            '<script type="text/javascript" src="/adm/MathJax/MathJax.js?config=TeX-AMS-MML_HTMLorMML"></script>';
        return $loader."\n";
    }
    #sub MathJax_process {
    #    my $state = pop(@MathJax_sent_header);
    #    return '' if !$state;
    #    return "\n".
    #        '<script type="text/javascript">MathJax.Process()</script>'."\n";
    #}
    #sub MathJax_state {
    #    my ($level) = @_;
    #    return $MathJax_sent_header[$level];
    #}
}
311:
# Work out which TeX engine to use, taking the first setting found in %env:
#   1. form.texengine, if present and not the empty string;
#   2. the course's texengine, if a course is selected and the key exists;
#   3. environment.texengine, if the key exists.
# A value of 'jsmath' (any letter case) is reported as 'MathJax'.
# Returns 'tth' when none of the settings applies.
sub tex_engine {
    my $resolve = sub {
        my ($engine) = @_;
        return (lc($engine) eq 'jsmath') ? 'MathJax' : $engine;
    };

    if (exists($env{'form.texengine'}) && ($env{'form.texengine'} ne '')) {
        return $resolve->($env{'form.texengine'});
    }

    my $cid = $env{'request.course.id'};
    if ($cid && exists($env{'course.'.$cid.'.texengine'})) {
        return $resolve->($env{'course.'.$cid.'.texengine'});
    }

    if (exists($env{'environment.texengine'})) {
        return $resolve->($env{'environment.texengine'});
    }

    return 'tth';
}
336:
# Prepare math rendering: initialise tth/ttm and open a new MathJax header
# entry.  Returns the MathJax loader markup when the selected engine is
# MathJax, and nothing otherwise.
sub init_math_support {
    &init_tth();
    &MathJax_push();
    return unless (lc(&tex_engine()) eq 'mathjax');
    return &MathJax_header();
}
345:
# Ask the local mimetex CGI for the vertical alignment of a rendered formula.
#
# Sends a HEAD request for /cgi-bin/mimetex.cgi?$esc_texstring to localhost
# port 80 and looks for a 'Vertical-Align:' line in the response.
#
# @param esc_texstring - URI-escaped TeX to be rendered by mimetex.
#
# @return the integer found in the response (possibly negative), or 0 when
#         the connection fails or no well-formed value is present.
sub mimetex_valign {
    my ($esc_texstring)=@_;
    my $valign = 0;
    my $path = '/cgi-bin/mimetex.cgi?'.$esc_texstring;
    &Apache::lonxml::start_alarm();
    my $socket = IO::Socket::INET->new(PeerAddr => 'localhost',
                                       PeerPort => 'http(80)',
                                       Proto    => 'tcp');
    if ($socket) {
        my $headreq = "HEAD $path HTTP/1.0\r\n\r\n";
        print $socket $headreq;
        # Read into a lexical so the caller's $_ is left untouched.
        while (my $line = <$socket>) {
            # Only accept a real integer; the value is later written into
            # a CSS declaration by the caller.
            if ($line =~ /Vertical\-Align\:\s*(-?\d+)/) {
                $valign = $1;
            }
        }
        $socket->close();
    }
    &Apache::lonxml::end_alarm();
    return $valign;
}
368:
# Build the <img> markup that renders the TeX referenced by $texstring
# through /cgi-bin/mimetex.cgi.
#
# The referenced string is modified: math delimiters are stripped and, for
# display style, '\displaystyle \Large ' is prepended.  Display-style output
# is wrapped in a centred <div>.
sub mimetex_converted {
    my ($texstring)=@_;

    # alt text for screen readers: the TeX as passed in, with each double
    # quote replaced by two single quotes.
    (my $alt_string = $$texstring) =~ s/\"/\'\'/g;

    # Decide on display style before the delimiters are removed.
    my $displaystyle=&displaystyle($texstring);
    &clean_out_math_mode($texstring);
    if ($displaystyle) {
        $$texstring='\\displaystyle \\Large '.$$texstring;
    }

    my $esc_texstring = &uri_escape($$texstring);
    my $valign = &mimetex_valign($esc_texstring);
    my $img = join('',
                   '<img src="/cgi-bin/mimetex.cgi?', $esc_texstring,
                   '" style="vertical-align:', $valign,
                   'px" alt="', $alt_string, '" />');

    return $displaystyle ? '<div style="text-align:center">'.$img.'</div>'
                         : $img;
}
395:
# Convert the TeX referenced by $string with the engine named in $mode.
#
# An empty $mode means "ask tex_engine()".  The mode is matched
# case-insensitively as a substring, in this order: tth, jsmath/mathjax
# (both use MathJax), mimetex, raw (the TeX is returned untouched).
# Anything else falls back to tth.
sub converted {
    my ($string,$mode)=@_;
    $mode = &tex_engine() if ($mode eq '');

    return &tth_converted($string)     if ($mode =~ /tth/i);
    return &MathJax_converted($string) if ($mode =~ /jsmath/i
                                           || $mode =~ /mathjax/i);
    return &mimetex_converted($string) if ($mode =~ /mimetex/i);
    return $$string                    if ($mode =~ /raw/i);

    return &tth_converted($string);
}
412:
413: # ------------------------------------------------------------ Message display
414:
# Convert one TeX fragment taken from a message: initialise tth, turn
# <br> / <br /> tags into spaces, decode HTML entities, and hand the result
# to converted() with the default engine.
sub to_convert {
    my ($string) = @_;
    &init_tth();
    $string=~s/\<br\s*\/?\>/ /gs;
    # $string=~s/\s/ /gs;
    my $decoded = &HTML::Entities::decode($string);
    return &converted(\$decoded);
}
423:
# Replace text emoticons in $expression with <img> tags for the matching
# icon below $Apache::lonnet::perlvar{'lonIconsURL'} and return the result.
#
# The patterns are regular expressions and are applied in the order listed,
# so when two of them overlap (e.g. ':-()' also begins with the sad face
# ':-(') the earlier entry wins on every run.  The heart emoticon is matched
# in its HTML-escaped form '&lt;3'.
sub smiley {
    my $expression=shift;
    my @smileys=(
        [ '\:\-*\)'              => 'face-smile.png' ],
        [ '8\-\)'                => 'face-cool.png' ],
        [ '8\-(I|\|)'            => 'face-glasses.png' ],
        [ '\:\-(I|\|)'           => 'face-plain.png' ],
        [ '\:\-(o|O|\(\))'       => 'face-surprise.png' ],
        [ ':\-\('                => 'face-sad.png' ],
        [ '\;\-\)'               => 'face-wink.png' ],
        [ '\:\-(P|p)'            => 'face-raspberry.png' ],
        [ '\:\-(\\\|\\/)'        => 'face-uncertain.png' ],
        [ '\:\-D'                => 'face-smile-big.png' ],
        [ '\:\-(C|\@)'           => 'face-angry.png' ],
        [ '\:(\'|\`)\-*\('       => 'face-crying.png' ],
        [ '\:\-(X|x|\#)'         => 'face-quiet.png' ],
        [ '\:\-(s|S)'            => 'face-uncertain.png' ],
        [ '\:\-\$'               => 'face-embarrassed.png' ],
        [ '\:\-\*'               => 'face-kiss.png' ],
        [ '\+O\('                => 'face-sick.png' ],
        [ '(\&lt\;3|\(heart\))'  => 'heart.png' ],
        [ '\(rose\)'             => 'rose.png' ],
        [ '\(pizza\)'            => 'food-pizza.png' ],
        [ '\(cake\)'             => 'food-cake.png' ],
        [ '\(ninja\)'            => 'face-ninja.png' ],
        [ '\(pirate\)'           => 'face-pirate.png' ],
        [ '\((agree|yes)\)'      => 'opinion-agree.png' ],
        [ '\((disagree|nay)\)'   => 'opinion-disagree.png' ],
        [ '(o|O)\-\)'            => 'face-angel.png' ],
    );
    my $iconpath=$Apache::lonnet::perlvar{'lonIconsURL'};
    foreach my $entry (@smileys) {
        my ($pattern,$icon) = @{$entry};
        $expression=~s{$pattern}{<img src="$iconpath/$icon" />}gs;
    }
    return $expression;
}
460:
# Render the math embedded in a message.
#
# Text between m tags is converted with to_convert(); the remaining text is
# passed through smiley().  In a second pass, text between algebra tags is
# converted with algebra() for the 'web' target using tth.  Tags are
# recognised both literally (<m>, </m>) and HTML-escaped (&lt;m&gt;,
# &lt;/m&gt;), case-insensitively.
#
# @param message - message text
# @param email   - when true, each converted fragment is wrapped as
#                  </pre><tt>...</tt><pre>
#
# @return in list context (converted message, error string); in scalar
#         context the two concatenated.  The package variable $errorstring
#         is reset at the start of every call.
sub msgtexconverted {
    my ($message,$email) = @_;
    $errorstring='';

    my ($before,$after) = $email ? ('</pre><tt>','</tt><pre>') : ('','');
    my $lt = qr/(?:\&lt\;|\<)/;
    my $gt = qr/(?:\&gt\;|\>)/;

    # split() on the tags yields alternating plain and TeX fragments,
    # starting with plain text.
    my $outmessage='';
    my $tex=0;
    foreach my $fragment (split(/$lt\/*m\s*$gt/i,$message)) {
        if ($tex) {
            $outmessage.=$before.&to_convert($fragment).$after;
        } else {
            $outmessage.=&smiley($fragment);
        }
        $tex = $tex ? 0 : 1;
    }

    $message=$outmessage; $outmessage=''; $tex=0;
    foreach my $fragment (split(/$lt\/*algebra\s*$gt/i,$message)) {
        if ($tex) {
            my $algebra = &algebra($fragment, 'web', undef, undef, undef, 'tth');
            $outmessage.=$before.$algebra.$after;
        } else {
            $outmessage.=$fragment;
        }
        $tex = $tex ? 0 : 1;
    }

    if (wantarray) {
        return ($outmessage,$errorstring);
    } else {
        return $outmessage.$errorstring;
    }
}
503:
# Parse an algebra expression and return it as LaTeX or as rendered markup.
#
# @param string   - expression in algebra notation
# @param target   - 'web' or 'analyze': the LaTeX is passed to converted();
#                   any other target gets the LaTeX itself
# @param style    - 'display' wraps the LaTeX in $$...$$; anything else
#                   wraps it in \ensuremath{...}
# @param parstack - passed to Apache::lonxml::get_param() to look up the
#                   'display' parameter (web/analyze targets only)
# @param safeeval - passed to Apache::lonxml::get_param() as well
# @param tth      - 'tth' to initialise tth before converting
#
# @return the converted expression.  When the parser rejects the input the
#         parser's error is reported through Apache::lonxml::error() and a
#         bracketed "unconverted" notice is returned.
sub algebra {
    use AlgParser;
    my ($string,$target,$style,$parstack,$safeeval,$tth)=@_;
    my $parser = AlgParserWithImplicitExpand->new();
    if ($tth eq 'tth') {&init_tth();}
    $string=&prepare_algebra($string);
    my $ret = $parser->parse($string);
    my $result='['.&mt('Algebra unconverted due to previous errors').']';
    if ( ref($ret) ) {
        #$parser->tostring();
        $parser->normalize();
        my $latex=$parser->tolatex();
        $latex=&postprocess_algebra($latex);
        if ($style eq 'display') {
            $latex='$$'.$latex.'$$';
        } else {
            # style is 'inline'
            $latex='\\ensuremath{'.$latex.'}';
        }
        if ($target eq 'web' || $target eq 'analyze') {
            my $display=&Apache::lonxml::get_param('display',$parstack,$safeeval);
            $result = &converted(\$latex,$display);
        } else {
            $result = $latex;
        }
    } else {
        &Apache::lonxml::error($parser->{'htmlerror'});
    }
    # Explicit return so the fallback notice is what callers receive when
    # parsing failed.
    return $result;
}
534:
# Pre-process an algebra expression before it is parsed.
#
# Inserts ' zeroplace ' in front of a minus sign that directly follows a
# comparison operator: <>, <= or >= immediately followed by the minus, or a
# single =, > or < optionally followed by spaces.
#
# @param string - expression in algebra notation
# @return the expression with the markers inserted
sub prepare_algebra {
    my ($string)=@_;

    # makes the decision about what is a minus sign easier supposedly
    $string =~ s/(\<\>|\<\=|\>\=|[\=\>\<] *)-/$1 zeroplace -/g;

    return $string;
}
543:
# Rewrite multi-argument function calls in parser-generated LaTeX into
# conventional notation and return the rewritten string.
sub postprocess_algebra {
    my ($string)=@_;

    # moodle had these and I don't know why, ignoring them for now
    # $string =~s/\\fun/ /g;

    for ($string) {
        # sqrt(3,4) means the 4 root of 3
        s/\\sqrt\{([^,]+),([^\}]+)}/\\sqrt[$2]{$1}/gs;

        # log(3,4) means the log base 4 of 3
        s/\\log\\left\((.+?),(.+?)\\right\)/\\log_{$2}\\left($1\\right)/gs;

        # sin(3,4) means sin to the power 4 of 3 (likewise the other
        # trigonometric and hyperbolic functions)
        s/\\((?:sin|cos|tan|sec|csc|cot)(?:h)?)\\left\((.+?),(.+?)\\right\)/\\$1^{$3}\\left($2\\right)/gs;

        # int(3,a,b) integral from a to b of 3
        s/\\int\\left\((.+?),(.+?),(.+?)\\right\)/\\int_{$2}^{$3}\\left($1\\right)/gs;

        # int( ... dx) -> ...
        s/\\int\\left\((.+?)d[a-z]\\right\)/$1/gs;

        # lim(f,x,a) limit of f as x goes to a
        s/\\lim\\left\((.+?),(.+?),(.+?)\\right\)/\\lim_{$2\\to $3}$1/gs;
    }
    return $string;
}
569:
570:
571: 1;
572: __END__
573:
574:
575: =pod
576:
577: =head1 NAME
578:
Apache::lontexconvert - conversion of TeX to browser markup (tth/ttm, MathJax, mimetex)
580:
581: =head1 SYNOPSIS
582:
583: Access to tth/ttm
584:
585: This is part of the LearningOnline Network with CAPA project
586: described at http://www.lon-capa.org.
587:
588:
589: =head1 SUBROUTINES
590:
591: =over
592:
593: =item init_tth()
594:
595: Header
596:
597: =item convert_real()
598:
We need this routine because &converted can get called from inside
the safe space (through &xmlparse('<m>stuff</m>')), which doesn't
allow the opcode for alarm. It therefore has to be compiled before we
enter the safe space, since opcode checks only occur at compile time.
603:
604: =item tth_converted()
605:
606:
607: =item clean_out_math_mode()
608:
609:
610: =item displaystyle()
611:
612:
613: =item MathJax_converted()
614:
615: =item tex_engine()
616:
617: =item init_math_support()
618:
619: =item mimetex_valign()
620:
Makes a HEAD call to /cgi-bin/mimetex.cgi via IO::Socket::INET to retrieve the
622: vertical alignment, before the subsequent call to mimetex_converted()
623: which generates the <img> tag and the corresponding image.
624:
625: Input: 1. $esc_texstring (escaped TeX to be rendered by mimetex).
626: Output: 1. $valign - number of pixels: positive or negative integer
627: which will be included in <img> tag for mimetex image to
628: support vertical alignment of image within a line of text.
629:
630: If a server is running SSL, and Apache rewrite rules are in place
631: to rewrite requests for http to https, modification will most likely
632: be needed for pass through for HEAD requests for /cgi-bin/mimetex.cgi.
633:
634: Example rewrite rules which rewrite all http traffic to https,
635: except HEAD requests for /cgi-bin/mimetex.cgi are:
636:
637: <IfModule mod_rewrite.c>
638: RewriteEngine On
639: RewriteLogLevel 0
640:
641: RewriteCond %{HTTPS} off
642: RewriteCond %{HTTP:Host} (.*)
643: RewriteCond %{REQUEST_METHOD} !HEAD
644: RewriteRule ^/(.*) https://%1/$1 [R=301,L]
645:
646: RewriteCond %{HTTPS} off
647: RewriteCond %{HTTP:Host} (.*)
648: RewriteCond %{REQUEST_METHOD} HEAD
649: RewriteCond %{REQUEST_URI} !^/cgi-bin/mimetex.cgi
650: RewriteRule ^/(.*) https://%1/$1 [R=301,L]
651: </IfModule>
652:
653: =item mimetex_converted()
654:
655:
656: =item converted()
657:
658:
659: =item to_convert()
660:
661: message display
662:
663: =item smiley()
664:
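Replaces text emoticons (for example :-) or (rose)) in a string with
<img> tags for the corresponding icons under lonIconsURL.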
666:
667: =item msgtexconverted()
668:
669: =item algebra()
670:
671: =item prepare_algebra()
672:
673: =item postprocess_algebra()
674:
675: =back
676:
677: =cut
678:
679:
680:
FreeBSD-CVSweb <freebsd-cvsweb@FreeBSD.org>