--- loncom/xml/lontexconvert.pm 2002/10/28 20:40:25 1.12 +++ loncom/xml/lontexconvert.pm 2009/12/22 05:08:04 1.100 @@ -1,7 +1,7 @@ # The LearningOnline Network with CAPA # TeX Conversion Module # -# $Id: lontexconvert.pm,v 1.12 2002/10/28 20:40:25 www Exp $ +# $Id: lontexconvert.pm,v 1.100 2009/12/22 05:08:04 faziophi Exp $ # # Copyright Michigan State University Board of Trustees # @@ -36,106 +36,524 @@ # The C source of the Code may not be distributed by the Licensee # to any other parties under any circumstances. # -# 05/29/00,05/30,10/11,10/20 Gerd Kortemeyer -# 05/03/2001 Scott Harrison -# 5/4 Gerd Kortemeyer package Apache::lontexconvert; use strict; -use tth; +use tth(); use vars qw($errorstring); -use Apache::lonmsg; -use Apache::lonxml; +#use Apache::lonxml(); +use Apache::lonlocal; +use Apache::lonnet; +use lib '/home/httpd/lib/perl/'; +use LONCAPA; +use URI::Escape; +use IO::Socket::INET; +use IO::Socket::SSL; # ====================================================================== Header -sub header { - $errorstring=''; - my $time=time; - if ($ENV{'browser.mathml'}) { - &tth::ttminit(); - } else { - &tth::tthinit(); - } - return &Apache::lonxml::xmlbegin(). - &Apache::lonxml::fontsettings(). - "\n
/\
\<\/p\>/g; - $errorstring.=&tth::ttmerror(); +$Apache::lontexconvert::messedup=0; + + +sub convert_real { + my ($texstring)=@_; + my ($xmlstring,$errorstring); + local $SIG{SEGV}=sub { $Apache::lontexconvert::messedup=1; die; }; + local $SIG{ALRM}=sub { + &Apache::lonnet::logthis("ALRM"); + $xmlstring='['.&mt("TeX unconverted due to errors").']'; + $Apache::lontexconvert::messedup=1; + die &mt("TeX unconverted due to errors"); + }; + &Apache::lonxml::start_alarm(); + if ($env{'browser.mathml'}) { + $xmlstring=&tth::ttm($$texstring); + $xmlstring=~s/\/\/g; + $xmlstring=~s/\/\/g; + $xmlstring=~s/\/\\<\/p\>/g; + $errorstring.=&tth::ttmerror(); } else { - $xmlstring=&tth::tth($$texstring); - $errorstring.=&tth::ttherror(); + $xmlstring=&tth::tth($$texstring); + $errorstring.=&tth::ttherror(); + $xmlstring=~s---g; } - } + $xmlstring=~s/^\s*\child_terminate(); + } else { + my $request; + eval { $request=Apache->request; }; + if (!$request) { + eval { $request=Apache2::RequestUtil->request; }; + } + if ($request) { + $request->child_terminate(); + } else { + &Apache::lonnet::logthis("Unable to find a request to do child_terminate on"); + } + } + } + return $xmlstring; +} + +sub clean_out_math_mode { + my ($texstring)=@_; + $$texstring=~s/(?'.$errorstring.''; - } else { - &Apache::lonmsg::author_res_msg($ENV{'request.filename'},$errorstring); - } -# -------------------------------------------------------------------- End Body - $xmlstring.=&Apache::lonxml::xmlend(); - return $xmlstring; +sub jsMath_converted { + my $texstring=shift; + my $tag='span'; + if (&displaystyle($texstring)) { $tag='div'; } + &clean_out_math_mode($texstring); + return &jsMath_header(). + '<'.$tag.' class="math">'.$$texstring.''.$tag.'>'; +} + +{ + my @jsMath_sent_header; + sub jsMath_reset { + undef(@jsMath_sent_header); + } + sub jsMath_push { + push(@jsMath_sent_header,0); + } + sub jsMath_header { + if (!@jsMath_sent_header) { + &Apache::lonnet::logthis("mismatched calls of jsMath_header and jsMath_process"); + return ''; + } + return '' if $jsMath_sent_header[-1]; + $jsMath_sent_header[-1]=1; + return + ''."\n". + ''."\n"; + } + sub jsMath_process { + my $state = pop(@jsMath_sent_header); + return '' if !$state; + return "\n". + ''."\n"; + } + sub jsMath_state { + my ($level) = @_; + return $jsMath_sent_header[$level]; + } +} + +sub tex_engine { + if (exists($env{'form.texengine'})) { + if ($env{'form.texengine'} ne '') { + return $env{'form.texengine'}; + } + } + if ($env{'request.course.id'} + && exists($env{'course.'.$env{'request.course.id'}.'.texengine'})) { + return $env{'course.'.$env{'request.course.id'}.'.texengine'}; + } + if (exists($env{'environment.texengine'})) { + return $env{'environment.texengine'}; + } + return 'tth'; +} + +sub init_math_support { + my ($inherit_jsmath) = @_; + &init_tth(); + &Apache::lontexconvert::jsMath_push(); + if (lc(&tex_engine()) eq 'jsmath' || + ($inherit_jsmath && &jsMath_state(-2))) { + return &Apache::lontexconvert::jsMath_header(); + } + return; +} + +sub mimetex_valign { + my ($esc_texstring)=@_; + my $valign = 0; + my $lonhost = $Apache::lonnet::perlvar{'lonHostID'}; + my $hostname = &Apache::lonnet::hostname($lonhost); + my $protocol = $Apache::lonnet::protocol{$lonhost}; + my $path = '/cgi-bin/mimetex.cgi?'.$esc_texstring; + my $socket; + &Apache::lonxml::start_alarm(); + if ($protocol eq 'https') { + $socket = IO::Socket::SSL->new(PeerAddr => $hostname, + PeerPort => 'https(443)', + Proto => 'tcp'); + } else { + $socket = IO::Socket::INET->new(PeerAddr => $hostname, + PeerPort => 'http(80)', + Proto => 'tcp'); + } + if ($socket) { + my $headreq = "HEAD $path HTTP/1.0\r\n\r\n"; + print $socket $headreq; + while (<$socket>) { + if (/Vertical\-Align\:\s*?([\-\d]+)/) { + $valign = $1; + } + } + if ($protocol eq 'https') { + $socket->close(SSL_no_shutdown => 1, + SSL_ctx_free => 1); + } else { + $socket->close(); + } + } + &Apache::lonxml::end_alarm(); + return $valign; +} + +sub mimetex_converted { + my $texstring=shift; + +# Alt-Argument for screen readers + my $alt_string=$$texstring; + $alt_string=~s/\"/\'\'/g; + +# Is this displaystyle? + + my $displaystyle=&displaystyle($texstring); + +# Remove math environment delimiters + + &clean_out_math_mode($texstring); + + if ($displaystyle) { + $$texstring='\\displaystyle \\Large '.$$texstring; + } + my $esc_texstring = &uri_escape($$texstring); + my $valign = &mimetex_valign($esc_texstring); + my $result=''; + if ($displaystyle) { + $result=''.$result.''; + } + return $result; +} + +sub converted { + my ($string,$mode)=@_; + if ($mode eq '') { $mode = &tex_engine(); } + if ($mode =~ /tth/i) { + return &tth_converted($string); + } elsif ($mode =~ /jsmath/i) { + return &jsMath_converted($string); + } elsif ($mode =~ /mimetex/i) { + return &mimetex_converted($string); + } elsif ($mode =~ /raw/i) { + return $$string; + } + return &tth_converted($string); } # ------------------------------------------------------------ Message display sub to_convert { my ($string) = @_; - $string=~s/\/ /g; + $string=~s/\/ /gs; +# $string=~s/\s/ /gs; + $string=&HTML::Entities::decode($string); return &converted(\$string); } +sub smiley { + my $expression=shift; + if ($env{'browser.imagesuppress'} eq 'on') { return $expression; } + my %smileys=( + '\:\-*\)' => 'face-smile.png', + '8\-\)' => 'face-cool.png', + '8\-(I|\|)' => 'face-glasses.png', + ':\-*(I|\|)' => 'face-plain.png', + '\:\-(o|O|\(\))' => 'face-surprise.png', + ':\-*\(' => 'face-sad.png', + '\;\-*\)' => 'face-wink.png', + '\:\-*(P|p)' => 'face-raspberry.png', + '\:\-(\\\|\\/)' => 'face-uncertain.png', + '\:\-*D' => 'face-smile-big.png', + '\:\-*(C|\@)' => 'face-angry.png', + '\:(\'|\`)\-*\(' => 'face-crying.png', + '\:\-*(X|x|\#)' => 'face-quiet.png', + '\:\-*(s|S)' => 'face-uncertain.png', + '\:\-*\$' => 'face-embarrassed.png', + '\:\-*\*' => 'face-kiss.png', + '\+O\(' => 'face-sick.png', + '(\<\;3|\(heart\))' => 'heart.png', + '\(rose\)' => 'rose.png', + '\(pizza\)' => 'food-pizza.png', + '\(cake\)' => 'food-cake.png', + '\(ninja\)' => 'face-ninja.png', + '\(pirate\)' => 'face-pirate.png', + '\((agree|yes)\)' => 'opinion-agree.png', + '\((disagree|nay)\)' => 'opinion-disagree.png', + '(o|O)\-*\)' => 'face-angel.png', + ); + my $iconpath=$Apache::lonnet::perlvar{'lonIconsURL'}; + foreach my $smiley (keys(%smileys)) { + $expression=~s/$smiley/\/gs; + } + return $expression; +} + sub msgtexconverted { - my $message=shift; + my ($message,$email) = @_; + $errorstring=''; + &init_tth(); + my $outmessage=''; + my $tex=0; + foreach my $fragment (split(/(?:\<\;|\<)\/*m\s*(?:\>\;|\>)/i,$message)) { + if ($tex) { + if ($email) { + $outmessage.=''.&to_convert($fragment).''; + $tex=0; + } else { + $outmessage.=&to_convert($fragment); + $tex=0; + } + } else { + $outmessage.=&smiley($fragment); + $tex=1; + } + } + $message=$outmessage; $outmessage=''; $tex=0; + foreach my $fragment (split(/(?:\<\;|\<)\/*algebra\s*(?:\>\;|\>)/i, + $message)) { + if ($tex) { + if ($email) { + $outmessage.=''.&algebra($fragment,'web').''; + $tex=0; + } else { + $outmessage.=&algebra($fragment,'web'); + $tex=0; + } + } else { + $outmessage.=$fragment; + $tex=1; + } + } + if (wantarray) { + return ($outmessage,$errorstring); + } else { + return $outmessage.$errorstring; + } +} + +sub algebra { + use AlgParser; + + my ($string,$target,$style,$parstack,$safeeval)=@_; + my $parser = new AlgParserWithImplicitExpand; + $string=&prepare_algebra($string); + my $ret = $parser->parse($string); + my $result='['.&mt('Algebra unconverted due to previous errors').']'; + if ( ref($ret) ) { + #$parser->tostring(); + $parser->normalize(); + my $latex=$parser->tolatex(); + $latex=&postprocess_algebra($latex); + if ($style eq 'display') { + $latex='$$'.$latex.'$$x'; + } else { + # style is 'inline' + $latex='\\ensuremath{'.$latex.'}'; + } + if ($target eq 'web' || $target eq 'analyze') { + my $display=&Apache::lonxml::get_param('display',$parstack,$safeeval); + $result = &converted(\$latex,$display); +# $result = &converted(\$latex); + } else { + $result = $latex; + } + } else { + &Apache::lonxml::error($parser->{'htmlerror'}); + } +} + +sub prepare_algebra { + my ($string)=@_; - #FIXME this crap needs to go but right now the -L option might be - #ignored if this isn;t the first time the tth engine is used - #thus the \\document class crap, it makes sure we init the LaTeX stuff - if ($ENV{'browser.mathml'}) { - &tth::ttminit(); - &tth::ttmoptions("-L"); - } else { - &tth::tthinit(); - &tth::tthoptions("-L"); - } - $message=~s/(\$\$.+?\$\$)/&to_convert("\\documentclass{article}".$1)/ge; - $message=~s/(\$.+?\$)/&to_convert("\\documentclass{article}".$1)/ge; - $message=~s/(\\\(.+?\\\))/&to_convert("\\documentclass{article}".$1)/ge; - $message=~s/(\\\[.+?\\\])/&to_convert("\\documentclass{article}".$1)/ge; - return $message.$errorstring; + # makes the decision about what is a minus sign easier supposedly + $string =~ s/(\<\>|\<\=|\>\=[\=\>\<] *)-/$1 zeroplace -/g; + + return $string; } +sub postprocess_algebra { + my ($string)=@_; + + # moodle had these and I don't know why, ignoring them for now + # $string =~s/\\fun/ /g; + + # sqrt(3,4) means the 4 root of 3 + $string =~s/\\sqrt{([^,]+),([^\}]+)}/\\sqrt[$2]{$1}/gs; + + # log(3,4) means the log base 4 of 3 + $string =~s/\\log\\left\((.+?),(.+?)\\right\)/\\log_{$2}\\left($1\\right)/gs; + + # log(3,4) means the log base 4 of 3 + $string =~s/\\((?:sin|cos|tan|sec|csc|cot)(?:h)?)\\left\((.+?),(.+?)\\right\)/\\$1^{$3}\\left($2\\right)/gs; + + # int(3,a,b) integral from a to b of 3 + $string =~s/\\int\\left\((.+?),(.+?),(.+?)\\right\)/\\int_{$2}^{$3}\\left($1\\right)/gs; + + # int( ... dx) -> ... + $string =~s/\\int\\left\((.+?)d[a-z]\\right\)/$1/gs; + + # + $string =~s/\\lim\\left\((.+?),(.+?),(.+?)\\right\)/\\lim_{$2\\to $3}$1/gs; + return $string; +} 1; __END__ +=pod + +=head1 NAME + +Apache::lontexconvert; + +=head1 SYNOPSIS + +Access to tth/ttm + +This is part of the LearningOnline Network with CAPA project +described at http://www.lon-capa.org. + + +=head1 SUBROUTINES + +=over + +=item init_tth() + +Header + +=item convert_real() + + we need this routine because &converted can get called from inside + of the safespace (through &xmlparse('stuff') which doesn't + allow the opcode for alarm, so we need to compile this before we get + into the safe space since opcode checks only occur at compile time + +=item tth_converted() + + +=item clean_out_math_mode() + + +=item displaystyle() + + +=item jsMath_converted() + + +=item tex_engine() + + +=item init_math_support() + + +=item mimetex_converted() + + +=item converted() + + +=item to_convert() + +message display + +=item smiley() + +??? + +=item msgtexconverted() + +=item algebra() + +=item prepare_algebra() + +=item postprocess_algebra() +=back +=cut
\<\/p\>/g; + $errorstring.=&tth::ttmerror(); } else { - $xmlstring=&tth::tth($$texstring); - $errorstring.=&tth::ttherror(); + $xmlstring=&tth::tth($$texstring); + $errorstring.=&tth::ttherror(); + $xmlstring=~s---g; } - } + $xmlstring=~s/^\s*\child_terminate(); + } else { + my $request; + eval { $request=Apache->request; }; + if (!$request) { + eval { $request=Apache2::RequestUtil->request; }; + } + if ($request) { + $request->child_terminate(); + } else { + &Apache::lonnet::logthis("Unable to find a request to do child_terminate on"); + } + } + } + return $xmlstring; +} + +sub clean_out_math_mode { + my ($texstring)=@_; + $$texstring=~s/(?'.$errorstring.''; - } else { - &Apache::lonmsg::author_res_msg($ENV{'request.filename'},$errorstring); - } -# -------------------------------------------------------------------- End Body - $xmlstring.=&Apache::lonxml::xmlend(); - return $xmlstring; +sub jsMath_converted { + my $texstring=shift; + my $tag='span'; + if (&displaystyle($texstring)) { $tag='div'; } + &clean_out_math_mode($texstring); + return &jsMath_header(). + '<'.$tag.' class="math">'.$$texstring.''.$tag.'>'; +} + +{ + my @jsMath_sent_header; + sub jsMath_reset { + undef(@jsMath_sent_header); + } + sub jsMath_push { + push(@jsMath_sent_header,0); + } + sub jsMath_header { + if (!@jsMath_sent_header) { + &Apache::lonnet::logthis("mismatched calls of jsMath_header and jsMath_process"); + return ''; + } + return '' if $jsMath_sent_header[-1]; + $jsMath_sent_header[-1]=1; + return + ''."\n". + ''."\n"; + } + sub jsMath_process { + my $state = pop(@jsMath_sent_header); + return '' if !$state; + return "\n". + ''."\n"; + } + sub jsMath_state { + my ($level) = @_; + return $jsMath_sent_header[$level]; + } +} + +sub tex_engine { + if (exists($env{'form.texengine'})) { + if ($env{'form.texengine'} ne '') { + return $env{'form.texengine'}; + } + } + if ($env{'request.course.id'} + && exists($env{'course.'.$env{'request.course.id'}.'.texengine'})) { + return $env{'course.'.$env{'request.course.id'}.'.texengine'}; + } + if (exists($env{'environment.texengine'})) { + return $env{'environment.texengine'}; + } + return 'tth'; +} + +sub init_math_support { + my ($inherit_jsmath) = @_; + &init_tth(); + &Apache::lontexconvert::jsMath_push(); + if (lc(&tex_engine()) eq 'jsmath' || + ($inherit_jsmath && &jsMath_state(-2))) { + return &Apache::lontexconvert::jsMath_header(); + } + return; +} + +sub mimetex_valign { + my ($esc_texstring)=@_; + my $valign = 0; + my $lonhost = $Apache::lonnet::perlvar{'lonHostID'}; + my $hostname = &Apache::lonnet::hostname($lonhost); + my $protocol = $Apache::lonnet::protocol{$lonhost}; + my $path = '/cgi-bin/mimetex.cgi?'.$esc_texstring; + my $socket; + &Apache::lonxml::start_alarm(); + if ($protocol eq 'https') { + $socket = IO::Socket::SSL->new(PeerAddr => $hostname, + PeerPort => 'https(443)', + Proto => 'tcp'); + } else { + $socket = IO::Socket::INET->new(PeerAddr => $hostname, + PeerPort => 'http(80)', + Proto => 'tcp'); + } + if ($socket) { + my $headreq = "HEAD $path HTTP/1.0\r\n\r\n"; + print $socket $headreq; + while (<$socket>) { + if (/Vertical\-Align\:\s*?([\-\d]+)/) { + $valign = $1; + } + } + if ($protocol eq 'https') { + $socket->close(SSL_no_shutdown => 1, + SSL_ctx_free => 1); + } else { + $socket->close(); + } + } + &Apache::lonxml::end_alarm(); + return $valign; +} + +sub mimetex_converted { + my $texstring=shift; + +# Alt-Argument for screen readers + my $alt_string=$$texstring; + $alt_string=~s/\"/\'\'/g; + +# Is this displaystyle? + + my $displaystyle=&displaystyle($texstring); + +# Remove math environment delimiters + + &clean_out_math_mode($texstring); + + if ($displaystyle) { + $$texstring='\\displaystyle \\Large '.$$texstring; + } + my $esc_texstring = &uri_escape($$texstring); + my $valign = &mimetex_valign($esc_texstring); + my $result=''; + if ($displaystyle) { + $result='
'; + $tex=0; + } else { + $outmessage.=&to_convert($fragment); + $tex=0; + } + } else { + $outmessage.=&smiley($fragment); + $tex=1; + } + } + $message=$outmessage; $outmessage=''; $tex=0; + foreach my $fragment (split(/(?:\<\;|\<)\/*algebra\s*(?:\>\;|\>)/i, + $message)) { + if ($tex) { + if ($email) { + $outmessage.='
'; + $tex=0; + } else { + $outmessage.=&algebra($fragment,'web'); + $tex=0; + } + } else { + $outmessage.=$fragment; + $tex=1; + } + } + if (wantarray) { + return ($outmessage,$errorstring); + } else { + return $outmessage.$errorstring; + } +} + +sub algebra { + use AlgParser; + + my ($string,$target,$style,$parstack,$safeeval)=@_; + my $parser = new AlgParserWithImplicitExpand; + $string=&prepare_algebra($string); + my $ret = $parser->parse($string); + my $result='['.&mt('Algebra unconverted due to previous errors').']'; + if ( ref($ret) ) { + #$parser->tostring(); + $parser->normalize(); + my $latex=$parser->tolatex(); + $latex=&postprocess_algebra($latex); + if ($style eq 'display') { + $latex='$$'.$latex.'$$x'; + } else { + # style is 'inline' + $latex='\\ensuremath{'.$latex.'}'; + } + if ($target eq 'web' || $target eq 'analyze') { + my $display=&Apache::lonxml::get_param('display',$parstack,$safeeval); + $result = &converted(\$latex,$display); +# $result = &converted(\$latex); + } else { + $result = $latex; + } + } else { + &Apache::lonxml::error($parser->{'htmlerror'}); + } +} + +sub prepare_algebra { + my ($string)=@_; - #FIXME this crap needs to go but right now the -L option might be - #ignored if this isn;t the first time the tth engine is used - #thus the \\document class crap, it makes sure we init the LaTeX stuff - if ($ENV{'browser.mathml'}) { - &tth::ttminit(); - &tth::ttmoptions("-L"); - } else { - &tth::tthinit(); - &tth::tthoptions("-L"); - } - $message=~s/(\$\$.+?\$\$)/&to_convert("\\documentclass{article}".$1)/ge; - $message=~s/(\$.+?\$)/&to_convert("\\documentclass{article}".$1)/ge; - $message=~s/(\\\(.+?\\\))/&to_convert("\\documentclass{article}".$1)/ge; - $message=~s/(\\\[.+?\\\])/&to_convert("\\documentclass{article}".$1)/ge; - return $message.$errorstring; + # makes the decision about what is a minus sign easier supposedly + $string =~ s/(\<\>|\<\=|\>\=[\=\>\<] *)-/$1 zeroplace -/g; + + return $string; } +sub postprocess_algebra { + my ($string)=@_; + + # moodle had these and I don't know why, ignoring them for now + # $string =~s/\\fun/ /g; + + # sqrt(3,4) means the 4 root of 3 + $string =~s/\\sqrt{([^,]+),([^\}]+)}/\\sqrt[$2]{$1}/gs; + + # log(3,4) means the log base 4 of 3 + $string =~s/\\log\\left\((.+?),(.+?)\\right\)/\\log_{$2}\\left($1\\right)/gs; + + # log(3,4) means the log base 4 of 3 + $string =~s/\\((?:sin|cos|tan|sec|csc|cot)(?:h)?)\\left\((.+?),(.+?)\\right\)/\\$1^{$3}\\left($2\\right)/gs; + + # int(3,a,b) integral from a to b of 3 + $string =~s/\\int\\left\((.+?),(.+?),(.+?)\\right\)/\\int_{$2}^{$3}\\left($1\\right)/gs; + + # int( ... dx) -> ... + $string =~s/\\int\\left\((.+?)d[a-z]\\right\)/$1/gs; + + # + $string =~s/\\lim\\left\((.+?),(.+?),(.+?)\\right\)/\\lim_{$2\\to $3}$1/gs; + return $string; +} 1; __END__ +=pod + +=head1 NAME + +Apache::lontexconvert; + +=head1 SYNOPSIS + +Access to tth/ttm + +This is part of the LearningOnline Network with CAPA project +described at http://www.lon-capa.org. + + +=head1 SUBROUTINES + +=over + +=item init_tth() + +Header + +=item convert_real() + + we need this routine because &converted can get called from inside + of the safespace (through &xmlparse('stuff') which doesn't + allow the opcode for alarm, so we need to compile this before we get + into the safe space since opcode checks only occur at compile time + +=item tth_converted() + + +=item clean_out_math_mode() + + +=item displaystyle() + + +=item jsMath_converted() + + +=item tex_engine() + + +=item init_math_support() + + +=item mimetex_converted() + + +=item converted() + + +=item to_convert() + +message display + +=item smiley() + +??? + +=item msgtexconverted() + +=item algebra() + +=item prepare_algebra() + +=item postprocess_algebra() +=back +=cut