<?php class Page2Tex { private $_current_page; private static $header_count = 0; private static $p_count=0; private static $hil_count=0; private $page_count=0; private $_base; private $_dir; private $_verb_find = array('\$','\%', '\{', '\}', "\t",'``','`'); private $_verb_replace = array('$', '%', '{','}', " ",'"','\''); function __construct($base, $dir, $current='') { $this->_base = $base; $this->_current_page = $current; $this->_dir = $dir; } function setCurrentPage($current) { self::$header_count = self::$header_count+1000; $this->_current_page = $current; } function escape_verbatim($matches) { return "\begin{small}\begin{verbatim}". str_replace($this->_verb_find, $this->_verb_replace, $matches[1]). '\end{verbatim}\end{small}'."\n"; } function escape_verb($matches) { $text = str_replace($this->_verb_find, $this->_verb_replace, $matches[1]); return '\begin{small}\verb<'.$text.'< \end{small}'; } function include_image($matches) { $current_path = $this->_current_page; $image = dirname($current_path).'/'.trim($matches[1]); $file = realpath($image); $info = getimagesize($file); switch($info[2]) { case 1: $im = imagecreatefromgif($file); break; case 2: $im = imagecreatefromjpeg($file); break; case 3: $im = imagecreatefrompng($file); break; } $base = $this->_base; if(isset($im)) { $prefix = strtolower(str_replace(realpath($base), '', $file)); $filename = preg_replace('/\\\|\//', '_', substr($prefix,1)); $filename = substr($filename, 0, strrpos($filename,'.')).'.png'; $newfile = $this->_dir.'/'.$filename; imagepng($im,$newfile); imagedestroy($im); return $this->include_figure($info, $filename); } } function include_figure($info, $filename) { $width = sprintf('%0.2f', $info[0]/(135/2.54)); return ' \begin{figure}[!ht] \centering \includegraphics[width='.$width.'cm]{'.$filename.'} \label{fig:'.$filename.'} \end{figure} '; } function anchor($matches) { $page = $this->get_current_path(); return '\hypertarget{'.$page.'/'.strtolower($matches[1]).'}{}'; } function texttt($matches) { $text ='\texttt{'.str_replace(array('#','_','&'),array('\#','\_','\&'), $matches[1]).'}'; //$text = preg_replace('/([^\\\\])&([^;]+)/', '$1\&$2', $text); return $text; } function get_current_path() { $current_path = $this->_current_page; $base = $this->_base; $page = strtolower(substr(str_replace($base, '', $current_path),1)); return $page; } function make_link($matches) { if(is_int(strpos($matches[1], '#'))) { if(strpos($matches[1],'?') ===false) { if(strpos($matches[1],'http://')===false) { $target = $this->get_current_path().'/'.substr($matches[1],1); return '\hyperlink{'.$target.'}{'.$matches[2].'}'; } } else { $page = strtolower(str_replace('?page=', '', $matches[1])); $page = str_replace('.','/',$page); $page = str_replace('#','.page/',$page); return '\hyperlink{'.$page.'}{'.$matches[2].'}'; } } else if(is_int(strpos($matches[1],'?'))) { $page = str_replace('?page=','',$matches[1]); return '\hyperlink{'.$page.'}{'.$matches[2].'}'; } return '\href{'.str_replace('#','\\#',$matches[1]).'}{'.$matches[2].'}'; } function parse_html($page,$html) { $html = preg_replace('/<\/?com:TContent[^>]*>/', '', $html); $html = preg_replace('/<\/?p [^>]*>/', '', $html); $html = preg_replace('/<\/?p>/', '', $html); $html = preg_replace('/(\s+|\(+|\[+)"/', '$1``', $html); $html = preg_replace('/(\s+|\(+|\[+)\'/', '$1`', $html); //escape { and } $html = preg_replace('/([^\s]+){([^}]*)}([^\s]+)/', '$1\\\{$2\\\}$3', $html); $html = preg_replace_callback('/<img\s+src="?<%~([^"]*)%>"?[^>]*\/>/', array($this, 'include_image'), $html); //escape % $html = str_replace('%', '\%', $html); //codes $html = str_replace('$', '\$', $html); $html = preg_replace_callback('/<com:TTextHighlighter[^>]*>((.|\n)*?)<\/com:TTextHighlighter\s*>/', array($this,'escape_verbatim'), $html); // $html = preg_replace('/<\/com:TTextHighlighter>/', '`2`', $html); // $html = preg_replace_callback('/(`1`)([^`]*)(`2`)/m', array($this,'escape_verbatim'), $html); $html = preg_replace_callback('/(<div class="source">)((.|\n)*?)(<\/div>)/', array($this,'escape_verbatim'), $html); $html = preg_replace_callback('/(<pre>)([^<]*)(<\/pre>)/', array($this,'escape_verbatim'), $html); //<code> $html = preg_replace_callback('/<code>([^<]*)<\/code>/', array($this,'escape_verb'), $html); //runbar $html = preg_replace('/<com:RunBar\s+PagePath="([^"]*)"\s+\/>/', '\href{http://www.pradosoft.com/demos/quickstart/index.php?page=$1}{$1 Demo}', $html); //DocLink $html = preg_replace('/<com:DocLink\s+ClassPath="([^"]*)[.]([^."]*)"\s+Text="([^"]+)"\s*\/>/', '\href{http://www.pradosoft.com/docs/manual/$1/$2.html}{$3}', $html); $html = preg_replace('/<com:DocLink\s+ClassPath="([^"]*)[.]([^.]*)"\s+\/>/', '\href{http://www.pradosoft.com/docs/manual/$1/$2.html}{$1.$2 API Reference}', $html); //text modifiers $html = preg_replace('/<(b|strong)[^>]*>([^<]*)<\/(b|strong)>/', '\textbf{$2}', $html); $html = preg_replace('/<i [^>]*>([^<]*)+?<\/i>/', '\emph{$1}', $html); $html = preg_replace_callback('/<tt>([^<]*)<\/tt>/', array($this,'texttt'), $html); //links $html = preg_replace_callback('/<a[^>]+href="([^"]*)"[^>]*>([^<]*)<\/a>/', array($this,'make_link'), $html); //anchor $html = preg_replace_callback('/<a[^>]+name="([^"]*)"[^>]*><\/a>/', array($this,'anchor'), $html); //description <dl> $html = preg_replace('/<dt>([^<]*)<\/dt>/', '\item[$1]', $html); $html = preg_replace('/<\/?dd>/', '', $html); $html = preg_replace('/<dl>/', '\begin{description}', $html); $html = preg_replace('/<\/dl>/', '\end{description}', $html); //item lists $html = preg_replace('/<ul[^>]*>/', '\begin{itemize}', $html); $html = preg_replace('/<\/ul>/', '\end{itemize}', $html); $html = preg_replace('/<ol[^>]*>/', '\begin{enumerate}', $html); $html = preg_replace('/<\/ol>/', '\end{enumerate}', $html); $html = preg_replace('/<li[^>]*>/', '\item ', $html); $html = preg_replace('/<\/li>/', '', $html); //headings $html = preg_replace('/<h1(\s+id="[^"]+")?>([^<]+)<\/h1>/', '\section{$2}', $html); $html = preg_replace('/<h2(\s+id="[^"]+")?>([^<]+)<\/h2>/', '\subsection{$2}', $html); $html = preg_replace('/<h3(\s+id="[^"]+")?>([^<]+)<\/h3>/', '\subsubsection{$2}', $html); //div box $html = preg_replace_callback('/<div class="[tipnofe]*?">((.|\n)*?)<\/div>/', array($this, 'mbox'), $html); //tabular $html = preg_replace_callback('/<!--\s*tabular:([^-]*)-->\s*<table[^>]*>((.|\n)*?)<\/table>/', array($this, 'tabular'), $html); $html = preg_replace('/<!--((.|\n)*?)-->/', '', $html); $html = preg_replace('/<div class="last-modified">((.|\n)*?)<\/div>/', '', $html); //useless divs $html = preg_replace('/<div [^>]*">((.|\n)*?)<\/div>/', '$1', $html); //since $html = preg_replace('/<com:SinceVersion[^>]+>/', '', $html); //requiresversion $html = preg_replace('/<com:RequiresVersion[^>]+>/', '', $html); $html = html_entity_decode($html); return $html; } function tabular($matches) { $options = array(); foreach(explode(',', $matches[1]) as $string) { $sub = explode('=', trim($string)); $options[trim($sub[0])] = trim($sub[1]); } $widths = explode(' ',preg_replace('/\(|\)/', '', $options['width'])); $this->_tabular_widths = $widths; $this->_tabular_total = count($widths); $this->_tabular_col = 0; $begin = '\begin{table}[!hpt]\centering '."\n".' \begin{tabular}{'.$options['align'].'}\hline'; $end = '\end{tabular} '."\n".'\end{table}'."\n"; $table = preg_replace('/<\/tr>/', '\\\\\\\\ \hline', $matches[2]); $table = preg_replace('/<tr>/', '', $table); $table = preg_replace('/<th>([^<]+)<\/th>/', '\textbf{$1} &', $table); $table = preg_replace_callback('/<td>((.|\n)*?)<\/td>/', array($this, 'table_column'), $table); $table = preg_replace('/<br \/>/', ' \\\\\\\\', $table); $table = preg_replace('/&\s*\\\\\\\\/', '\\\\\\\\', $table); return $begin.$table.$end; } function table_column($matches) { $width = $this->_tabular_widths[$this->_tabular_col]; if($this->_tabular_col >= $this->_tabular_total-1) $this->_tabular_col = 0; else $this->_tabular_col++; return '\begin{minipage}{'.$width.'\textwidth}\vspace{3mm}'. $matches[1].'\vspace{3mm}\end{minipage} & '; } function mbox($matches) { return "\n\begin{mybox}\n".$matches[1]."\n".'\end{mybox}'."\n"; } function get_chapter_label($chapter) { return '\hypertarget{'.str_replace(' ', '', $chapter).'}{}'; } function get_section_label($section) { $section = str_replace('.page', '', $section); return '\hypertarget{'.str_replace('/', '.', $section).'}{}'; } function set_header_id($content, $j) { $this->page_count=$j; $content = preg_replace_callback('/<h1>/', array($this,"h1"), $content); $content = preg_replace_callback('/<h2>/', array($this,"h2"), $content); $content = preg_replace_callback('/<h3>/', array($this,"h3"), $content); $content = $this->set_block_content_id($content); return $content; } function h1($matches) { $page = $this->page_count*1000; return "<h1 id=\"".($page + (++self::$header_count))."\">"; } function h2($matches) { $page = $this->page_count*1000; return "<h2 id=\"".($page + (++self::$header_count))."\">"; } function h3($matches) { $page = $this->page_count*1000; return "<h3 id=\"".($page + (++self::$header_count))."\">"; } function set_block_content_id($content) { $content = preg_replace_callback('/<p>/', array($this, 'add_p'), $content); $content = preg_replace_callback('/<com:TTextHighlighter([^>]+)>/', array($this, 'hil'), $content); return $content; } function hil($matches) { $id = ($this->page_count*10000) + (++self::$hil_count); if(preg_match('/id="code-\d+"/i', $matches[1])) { $code = preg_replace('/id="code-(\d+)"/', 'id="code_$1"', $matches[0]); //var_dump($code); return $code; } else if(preg_match('/id="[^"]+"/i', $matches[1])) { return $matches[0]; } else { $changes = str_replace('"source"', '"source block-content" id="code-'.$id.'"', $matches[0]); return $changes; } } function add_p($matches) { $page = $this->page_count*10000; return "<p id=\"".($page + (++self::$p_count))."\" class=\"block-content\">"; } }