File:  [LON-CAPA] / loncom / xml / lontexconvert.pm
Revision 1.122: download - view: text, annotated - select for diffs
Fri Feb 15 20:56:22 2019 UTC (5 years, 10 months ago) by raeburn
Branches: MAIN
CVS tags: version_2_12_X, HEAD
- Default renderer for unconfigured domains set in a single location.

# The LearningOnline Network with CAPA
# TeX Conversion Module
#
# $Id: lontexconvert.pm,v 1.122 2019/02/15 20:56:22 raeburn Exp $
#
# Copyright Michigan State University Board of Trustees
#
# This file is part of the LearningOnline Network with CAPA (LON-CAPA).
#
# LON-CAPA is free software; you can redistribute it and/or modify
# it under the terms of the GNU General Public License as published by
# the Free Software Foundation; either version 2 of the License, or
# (at your option) any later version.
#
# LON-CAPA is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
# GNU General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with LON-CAPA; if not, write to the Free Software
# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA
#
# /home/httpd/html/adm/gpl.txt
#
# http://www.lon-capa.org/
#
# Copyright for TtHfunc and TtMfunc by Ian Hutchinson. 
# TtHfunc and TtMfunc (the "Code") may be compiled and linked into 
# binary executable programs or libraries distributed by the 
# Michigan State University (the "Licensee"), but any binaries so 
# distributed are hereby licensed only for use in the context
# of a program or computational system for which the Licensee is the 
# primary author or distributor, and which performs substantial 
# additional tasks beyond the translation of (La)TeX into HTML.
# The C source of the Code may not be distributed by the Licensee
# to any other parties under any circumstances.
#

package Apache::lontexconvert;

use strict;
use tth();
use vars qw($errorstring);
#use Apache::lonxml();
use Apache::lonlocal;
use Apache::lonnet;
use lib '/home/httpd/lib/perl/';
use LONCAPA;
use URI::Escape;
use IO::Socket::INET;


#
# Table of substitutions to unicode characters.
#

my %unicode_harpoons = (
                        '\rightleftharpoons'  => 0x21cc,
                      );

my %unicode_translations = (

# Brackets - unicode for browsers/OS which support it.

    ''             => 0x23a1,
    ''             => 0x23a2,
    ''             => 0x23a3,
    ''             => 0x23a4,
    ''             => 0x23a5,
    ''             => 0x23a6,

#  Parens - unicode for browsers/OS which support it

    ''              => 0x239b,
    ''              => 0x239c,
    ''              => 0x239d,
    ''              => 0x239e,
    ''              => 0x239f,
    ''              => 0x23a0,

);

my %ascii_8bit_translations = (

# Brackets - pure 8-bit ascii ugliness for browsers/OS which can't handle unicode

    ''              => 0x5b,
    ''              => 0x5b,    # '['
    ''              => 0x5b,
    ''              => 0x5d,    # ']'
    ''              => 0x5d,
    ''              => 0x5d,

# Parens - pure 8-bit ascii ugliness for browsers/OS which can't handle unicode

    ''              => 0x28,
    ''              => 0x28,      # '('
    ''              => 0x28,
    ''              => 0x29,
    ''              => 0x29,      # '('
    ''              => 0x29,

);

##
# Utility to convert elements of a string to unicode:
#
# @param input - Input string
# @param pattern - Pattern to convert
# @param unicode - Unicode to substitute for pattern.
#
# @return string - resulting string.
# 
sub unicode_subst {
    my ($input, $pattern, $unicode) = @_;
    
    my $char = pack('U', $unicode);

    $input =~ s/$pattern/$char/g;

    return $input;
}

# ====================================================================== Header

sub init_tth {
    my $options=$env{'course.'.$env{'request.course.id'}.'.tthoptions'};
    if ($options =~ /\S/) {
	$options = ' '.$options;
    } else {
	undef($options);
    }
    if ($env{'browser.mathml'}) {
	&tth::ttminit();
	if ($env{'browser.unicode'}) {
	    &tth::ttmoptions('-L -u1'.$options);
	} else {
	    &tth::ttmoptions('-L -u0'.$options);
	}
    } else {
	&tth::tthinit();
	if ($env{'browser.unicode'}) {
	    &tth::tthoptions('-L -u1'.$options);
	} else {
	    &tth::tthoptions('-L -u0'.$options);
	}
    }
}

# ================================================================== Conversion

$Apache::lontexconvert::messedup=0;


sub convert_real {
    my ($texstring)=@_;
    my ($xmlstring,$errorstring);
    local $SIG{SEGV}=sub { $Apache::lontexconvert::messedup=1; die; };
    local $SIG{ALRM}=sub { 
	&Apache::lonnet::logthis("ALRM");
	$xmlstring='['.&mt("TeX unconverted due to errors").']';
	$Apache::lontexconvert::messedup=1;
	die &mt("TeX unconverted due to errors");
    };
    &Apache::lonxml::start_alarm();
    if ($env{'browser.mathml'}) {
	$xmlstring=&tth::ttm($$texstring);
	$xmlstring=~s/\<math\>/\<math xmlns=\"\&mathns\;\"\>/g;
	$xmlstring=~s/\<br\>/\<br\/\>/g;
	$xmlstring=~s/\<p\>/\<p\>\<\/p\>/g;
	$errorstring.=&tth::ttmerror();
    } else {
	$xmlstring=&tth::tth($$texstring);
	$errorstring.=&tth::ttherror();
	$xmlstring=~s-</font(\s*)>-</font>-g;
    }
    $xmlstring=~s/^\s*\<br clear\=\"all\"/\<br/s;
    $xmlstring=~s/^\s*//;
    $xmlstring=~s/\s*$//;
    $xmlstring=~s/^<br \/><table/<table/;
    &Apache::lonxml::end_alarm();

    #
    # Several strings produced by tth require
    # transliteration -> unicode equivalents to render reliably
    # in browsers. %unicode_translations and %unicode_harpoons are tables of
    # string->substitution which we now apply. (%ascii_8bit_translations used
    # instead for Windows XP and mobile devices.

    my $use_ascii;
    if ($env{'browser.os'} eq 'win') {
        if (($env{'browser.osversion'}) && ($env{'browser.osversion'} < 6.0)) {
            $use_ascii = 1;
        }
    }
    if ($env{'browser.mobile'}) {
        $use_ascii = 1;
    }

    foreach my $pattern (keys(%unicode_translations)) {
	my $unicode = $unicode_translations{$pattern};
	if ($use_ascii) {
	    $unicode = $ascii_8bit_translations{$pattern};
	}
	$xmlstring = &unicode_subst($xmlstring, $pattern, $unicode);
    }

    foreach my $pattern (keys(%unicode_harpoons)) {
        $xmlstring = &unicode_subst($xmlstring, $pattern, $unicode_harpoons{$pattern});
    }

    return ($xmlstring,$errorstring);
}

sub tth_converted {
    my $texstring=shift;
    my $xmlstring='['.&mt('UNDISPLAYABLE').']';
    if ($Apache::lontexconvert::messedup) {
	return '['.&mt('TeX unconverted due to previous errors').']';
    }
    $$texstring ='\\documentstyle{article}'.$$texstring;

    eval(<<'ENDCONV');
    ($xmlstring,$errorstring)=&convert_real($texstring)
ENDCONV
    if ($@) {
	$errorstring.=&mt("Evaluation Error: ").$@;
	$Apache::lontexconvert::messedup=1;
    }
    if ($Apache::lontexconvert::messedup || &tth::tthmessedup() || 
	$errorstring) {
	&Apache::lonnet::logthis("Trying to kill myself");
	$Apache::lontexconvert::messedup=1;
	if (ref($Apache::lonxml::request)) {
	    $Apache::lonxml::request->child_terminate();
	} else {
	    my $request;
	    eval { $request=Apache->request; };
	    if (!$request) {
		eval { $request=Apache2::RequestUtil->request; };
	    }
	    if ($request) {
		$request->child_terminate();
	    } else {
		&Apache::lonnet::logthis("Unable to find a request to do child_terminate on");
	    }
	}
    }
    return $xmlstring;
}

sub clean_out_math_mode {
    my ($texstring)=@_;
    $$texstring=~s/(?<!\\)\$//g;
    $$texstring=~s/\\[\)\(\]\[]//g;
    $$texstring=~s/\\ensuremath//g;
    return '';
}

sub displaystyle {
    my ($texstring)=@_;
    #has a $$ or \[ or \displaystyle or eqnarray in it, guessinng it's display mode
    if ($$texstring=~/[^\\]\$\$/ ||
        $$texstring=~/\\\[/ ||
        $$texstring=~/\\displaystyle/ ||
        $$texstring=~/eqnarray/
       ) { return 1; }
    return 0;
}

sub MathJax_converted {
    my $texstring=shift;
    my ($tag,$startspan,$endspan);
    $tag='math/tex;';
    if (&displaystyle($texstring)) {
        $tag='math/tex; mode=display';
        $startspan='';
        $endspan='';
    } else {
        $startspan='<span style="display:inline-block;">';
        $endspan='</span>';
    }
    &clean_out_math_mode($texstring);
    return &MathJax_header().$startspan.
      '<script type="'.$tag.'">'.$$texstring.'</script>'.$endspan;
}

{
    #Relies heavily on the previous jsMath installation
    my @MathJax_sent_header;
    sub MathJax_reset {
        undef(@MathJax_sent_header);
    }
    sub MathJax_push {
        push(@MathJax_sent_header,0);
    }
    sub MathJax_header {
        if (!@MathJax_sent_header) {
            &Apache::lonnet::logthis("mismatched calls of MathJax_header and MathJax_process");
            return '';
        }
        return '' if $MathJax_sent_header[-1];
        $MathJax_sent_header[-1]=1;
        return
          '<script type="text/javascript" src="/adm/MathJax/MathJax.js?config=TeX-AMS-MML_HTMLorMML"></script>'."\n";
    }
    #sub MathJax_process {
    #    my $state = pop(@MathJax_sent_header);
    #    return '' if !$state;
    #    return "\n".
    #        '<script type="text/javascript">MathJax.Process()</script>'."\n";
    #}
    #sub MathJax_state {
    #    my ($level) = @_;
    #    return $MathJax_sent_header[$level];
    #}
}

sub tex_engine {
    if (exists($env{'form.texengine'})) {
	if ($env{'form.texengine'} ne '') {
            if (lc($env{'form.texengine'}) eq 'jsmath') {
                return 'MathJax';
            }
            return $env{'form.texengine'};
        }
    }    
    if ($env{'request.course.id'}
	&& exists($env{'course.'.$env{'request.course.id'}.'.texengine'})) {
        if (lc($env{'course.'.$env{'request.course.id'}.'.texengine'}) eq 'jsmath') {
            return 'MathJax';
        }
	return $env{'course.'.$env{'request.course.id'}.'.texengine'};
    }
    if (exists($env{'environment.texengine'})) {
        if (lc($env{'environment.texengine'}) eq 'jsmath') {
            return 'MathJax';
        }
	return $env{'environment.texengine'};
    }
    my $dom = $env{'request.role.domain'} || $env{'user.domain'};
    my %domdefaults = &Apache::lonnet::get_domain_defaults($dom);
    if ($domdefaults{'texengine'} ne '') {
        return $domdefaults{'texengine'};
    }
    return $Apache::lonnet::deftex;
}

sub init_math_support {
    &init_tth();
    &Apache::lontexconvert::MathJax_push();
    if (lc(&tex_engine()) eq 'mathjax') {
        return &Apache::lontexconvert::MathJax_header();
    }
    return;
}

sub mimetex_valign {
    my ($esc_texstring)=@_;
    my $valign = 0;
    my $path = '/cgi-bin/mimetex.cgi?'.$esc_texstring;
    my $socket;
    &Apache::lonxml::start_alarm();
    $socket = IO::Socket::INET->new(PeerAddr => 'localhost',
                                    PeerPort => 'http(80)',
                                    Proto    => 'tcp');
    if ($socket) {
        my $headreq = "HEAD $path HTTP/1.0\r\n\r\n";
        print $socket $headreq;
        while (<$socket>) {
            if (/Vertical\-Align\:\s*?([\-\d]+)/) {
                $valign = $1;
            }
        }
        $socket->close();
    }
    &Apache::lonxml::end_alarm();
    return $valign;
}

sub mimetex_converted {
    my $texstring=shift;

# Alt-Argument for screen readers
    my $alt_string=$$texstring;
    $alt_string=~s/\"/\'\'/g;

# Is this displaystyle?

    my $displaystyle=&displaystyle($texstring);

# Remove math environment delimiters

    &clean_out_math_mode($texstring);

    if ($displaystyle) {
	$$texstring='\\displaystyle \\Large '.$$texstring;
    }
    my $esc_texstring = &uri_escape($$texstring);
    my $valign = &mimetex_valign($esc_texstring);
    my $result='<img src="/cgi-bin/mimetex.cgi?'.$esc_texstring.'" style="vertical-align:'.$valign.'px" alt="'.$alt_string.'" />';
    if ($displaystyle) {
	$result='<div style="text-align:center">'.$result.'</div>';
    }
    return $result;
}

sub converted {
    my ($string,$mode)=@_;
    if ($mode eq '') { $mode = &tex_engine(); }
    if ($mode =~ /tth/i) {
	return &tth_converted($string);
    } elsif ($mode =~ /jsmath/i) {
        return &MathJax_converted($string);
    } elsif ($mode =~ /mathjax/i) {
	return &MathJax_converted($string);
    } elsif ($mode =~ /mimetex/i) {
	return &mimetex_converted($string);
    } elsif ($mode =~ /raw/i) {
        return $$string;
    }
    return &tth_converted($string);
}

# ------------------------------------------------------------ Message display

sub to_convert {
    my ($string) = @_;
    &init_tth();
    $string=~s/\<br\s*\/?\>/ /gs;
#    $string=~s/\s/ /gs;
    $string=&HTML::Entities::decode($string);
    return &converted(\$string);
}

sub smiley {
    my $expression=shift;
    my %smileys=(
    	 '\:\-*\)' => 'face-smile.png',
		 '8\-\)'  => 'face-cool.png',
		 '8\-(I|\|)'   => 'face-glasses.png',
		 '\:\-(I|\|)'   => 'face-plain.png',
		 '\:\-(o|O|\(\))' => 'face-surprise.png',
		 ':\-\('  => 'face-sad.png',
		 '\;\-\)' => 'face-wink.png',
		 '\:\-(P|p)'  => 'face-raspberry.png',
		 '\:\-(\\\|\\/)' => 'face-uncertain.png',
		 '\:\-D'  => 'face-smile-big.png',
		 '\:\-(C|\@)'  => 'face-angry.png',
		 '\:(\'|\`)\-*\(' => 'face-crying.png',
		 '\:\-(X|x|\#)' => 'face-quiet.png',
		 '\:\-(s|S)' => 'face-uncertain.png',
		 '\:\-\$' => 'face-embarrassed.png',
		 '\:\-\*' => 'face-kiss.png',
		 '\+O\(' => 'face-sick.png',
		 '(\&lt\;3|\(heart\))' => 'heart.png',
		 '\(rose\)' => 'rose.png',
		 '\(pizza\)' => 'food-pizza.png',
		 '\(cake\)' => 'food-cake.png',
		 '\(ninja\)' => 'face-ninja.png',
		 '\(pirate\)' => 'face-pirate.png',
		 '\((agree|yes)\)' => 'opinion-agree.png',
		 '\((disagree|nay)\)' => 'opinion-disagree.png',
		 '(o|O)\-\)' => 'face-angel.png',
		 );
    my $iconpath=$Apache::lonnet::perlvar{'lonIconsURL'};
    foreach my $smiley (keys(%smileys)) {
	$expression=~s/$smiley/\<img src="$iconpath\/$smileys{$smiley}" \/\>/gs; 
    }
    return $expression;
}

sub msgtexconverted {
    my ($message,$email) = @_;
    $errorstring='';
    my $outmessage='';
    my $tex=0;
    foreach my $fragment (split(/(?:\&lt\;|\<)\/*m\s*(?:\&gt\;|\>)/i,$message)) {
	if ($tex) {
	    if ($email) {
		$outmessage.='</pre><tt>'.&to_convert($fragment).'</tt><pre>';
		$tex=0;
	    } else {
		$outmessage.=&to_convert($fragment);
		$tex=0;
	    }
	} else {
            $outmessage.=&smiley($fragment);
	    $tex=1;
	}
    }
    $message=$outmessage; $outmessage=''; $tex=0;
    foreach my $fragment (split(/(?:\&lt\;|\<)\/*algebra\s*(?:\&gt\;|\>)/i,
				$message)) {
	if ($tex) {
        my $algebra = &algebra($fragment, 'web', undef, undef, undef, 'tth');
	    if ($email) {
		$outmessage.='</pre><tt>'.$algebra.'</tt><pre>';
		$tex=0;
	    } else {
		$outmessage.=$algebra;
		$tex=0;
	    }
	} else {
        $outmessage.=$fragment;
	    $tex=1;
	}
    }
    if (wantarray) {
	return ($outmessage,$errorstring);
    } else {
	return $outmessage.$errorstring;
    }
}

sub algebra {
    use AlgParser;
    my ($string,$target,$style,$parstack,$safeeval,$tth)=@_;
    my $parser = new AlgParserWithImplicitExpand;
    if ($tth eq 'tth') {&init_tth();}
    $string=&prepare_algebra($string);
    my $ret = $parser->parse($string);
    my $result='['.&mt('Algebra unconverted due to previous errors').']';
    if ( ref($ret) ) {
	#$parser->tostring();
	$parser->normalize();
	my $latex=$parser->tolatex();
	$latex=&postprocess_algebra($latex);
	if ($style eq 'display') {
	    $latex='$$'.$latex.'$$x';
	} else {
	    # style is 'inline'
	    $latex='\\ensuremath{'.$latex.'}';
	}
	if ($target eq 'web' || $target eq 'analyze') {
            my $display=&Apache::lonxml::get_param('display',$parstack,$safeeval);
            $result = &converted(\$latex,$display);
#	    $result = &converted(\$latex);
	} else {
	    $result = $latex;
	}
    } else {
	&Apache::lonxml::error($parser->{'htmlerror'});
    }
}

sub prepare_algebra {
    my ($string)=@_;

    # makes the decision about what is a minus sign easier supposedly
    $string =~ s/(\<\>|\<\=|\>\=[\=\>\<] *)-/$1 zeroplace -/g;

    return $string;
}

sub postprocess_algebra {
    my ($string)=@_;
    
    # moodle had these and I don't know why, ignoring them for now
    # $string =~s/\\fun/ /g;

    # sqrt(3,4) means the 4 root of 3
    $string =~s/\\sqrt\{([^,]+),([^\}]+)}/\\sqrt[$2]{$1}/gs;

    # log(3,4) means the log base 4 of 3
    $string =~s/\\log\\left\((.+?),(.+?)\\right\)/\\log_{$2}\\left($1\\right)/gs;

    # log(3,4) means the log base 4 of 3
    $string =~s/\\((?:sin|cos|tan|sec|csc|cot)(?:h)?)\\left\((.+?),(.+?)\\right\)/\\$1^{$3}\\left($2\\right)/gs;

    # int(3,a,b) integral from a to b of 3
    $string =~s/\\int\\left\((.+?),(.+?),(.+?)\\right\)/\\int_{$2}^{$3}\\left($1\\right)/gs;

    # int( ... dx) -> ...
    $string =~s/\\int\\left\((.+?)d[a-z]\\right\)/$1/gs;

    # 
    $string =~s/\\lim\\left\((.+?),(.+?),(.+?)\\right\)/\\lim_{$2\\to $3}$1/gs;
    return $string;
}


1;
__END__


=pod

=head1 NAME

Apache::lontexconvert;

=head1 SYNOPSIS

Access to tth/ttm

This is part of the LearningOnline Network with CAPA project
described at http://www.lon-capa.org.


=head1 SUBROUTINES

=over

=item init_tth()

Header

=item convert_real()

 we need this routine because &converted can get called from inside
 of the safespace (through &xmlparse('<m>stuff</m>') which doesn't
 allow the opcode for alarm, so we need to compile this before we get
 into the safe space since opcode checks only occur at compile time

=item tth_converted()


=item clean_out_math_mode()


=item displaystyle()


=item MathJax_converted()

=item tex_engine()

=item init_math_support()

=item mimetex_valign()

 Makes a HEAD call to /cgi-bin/mimetex.cgi via IO:: to retrieve the 
 vertical alignment, before the subsequent call to mimetex_converted()
 which generates the <img> tag and the corresponding image.

 Input: 1.  $esc_texstring (escaped TeX to be rendered by mimetex).
 Output: 1. $valign - number of pixels: positive or negative integer 
            which will be included in <img> tag for mimetex image to
            support vertical alignment of image within a line of text.

 If a server is running SSL, and Apache rewrite rules are in place 
 to rewrite requests for http to https, modification will most likely 
 be needed for pass through for HEAD requests for /cgi-bin/mimetex.cgi. 

 Example rewrite rules which rewrite all http traffic to https, 
 except HEAD requests for /cgi-bin/mimetex.cgi are:

 <IfModule mod_rewrite.c>
     RewriteEngine On
     RewriteLogLevel 0

     RewriteCond %{HTTPS} off
     RewriteCond %{HTTP:Host} (.*)
     RewriteCond %{REQUEST_METHOD} !HEAD 
     RewriteRule ^/(.*) https://%1/$1 [R=301,L]

     RewriteCond %{HTTPS} off
     RewriteCond %{HTTP:Host} (.*)
     RewriteCond %{REQUEST_METHOD} HEAD
     RewriteCond %{REQUEST_URI} !^/cgi-bin/mimetex.cgi
     RewriteRule ^/(.*) https://%1/$1 [R=301,L]
 </IfModule>

=item mimetex_converted()


=item converted()


=item to_convert()

message display

=item smiley()

???

=item msgtexconverted()

=item algebra()

=item prepare_algebra()

=item postprocess_algebra()

=back

=cut




FreeBSD-CVSweb <freebsd-cvsweb@FreeBSD.org>