getnikola · Jan 14, 2017
diff --git a/‎v7/latex/README.md
+42 b/‎v7/latex/README.md
+42
diff --git a/‎v7/latex/conf.py.sample
+16 b/‎v7/latex/conf.py.sample
+16
diff --git a/‎v7/latex/latex.plugin
+12 b/‎v7/latex/latex.plugin
+12
diff --git a/‎v7/latex/latex/__init__.py
+351 b/‎v7/latex/latex/__init__.py
+351
diff --git a/‎v7/latex/latex/htmlify.py
+577 b/‎v7/latex/latex/htmlify.py
+577
diff --git a/‎v7/latex/latex/parser.py
+1,074 b/‎v7/latex/latex/parser.py
+1,074
diff --git a/‎v7/latex/latex/plugins/latex_formula_image_renderer.plugin
+12 b/‎v7/latex/latex/plugins/latex_formula_image_renderer.plugin
+12
diff --git a/‎v7/latex/latex/plugins/latex_formula_image_renderer.py
+191 b/‎v7/latex/latex/plugins/latex_formula_image_renderer.py
+191
diff --git a/‎v7/latex/latex/plugins/latex_formula_mathjax.plugin
+12 b/‎v7/latex/latex/plugins/latex_formula_mathjax.plugin
+12
diff --git a/‎v7/latex/latex/plugins/latex_formula_mathjax.py
+112 b/‎v7/latex/latex/plugins/latex_formula_mathjax.py
+112
diff --git a/‎v7/latex/latex/tokenizer.py
+378 b/‎v7/latex/latex/tokenizer.py
+378
diff --git a/‎v7/latex/latex/tree.py
+876 b/‎v7/latex/latex/tree.py
+876
diff --git a/‎v7/latex/requirements-plugins.txt
+1 b/‎v7/latex/requirements-plugins.txt
+1
@@ -0,0 +1,42 @@
+This plugin allows you to write posts and pages in a LaTeX-like syntax.
+
+For Python before 3.4, you need to install the [`enum34` library](https://pypi.python.org/pypi/enum34). From Python 3.4 on, it is part of the language.
+
+
+Formulae
+--------
+
+There are two available formulae backends:
+
+ * one based on the [`latex_formula_renderer` plugin](https://plugins.getnikola.com/v7/latex_formula_renderer/);
+ * one based on [MathJax](https://www.mathjax.org/).
+
+The first backend supports some features that the second one does not:
+
+ * `align` environments (see the [AMSMath documentation](ftp://ftp.ams.org/ams/doc/amsmath/amsldoc.pdf));
+ * XY-pic diagrams (see the [XY-Pic user guide](http://texdoc.net/texmf-dist/doc/generic/xypic/xyguide.pdf));
+ * PSTricks graphics (see [here](https://en.wikipedia.org/wiki/PSTricks) for more information);
+ * TikZ pictures (see [here](https://en.wikibooks.org/wiki/LaTeX/PGF/TikZ) for more information).
+
+The first backend requires an installed LaTeX distribution, together with some extra tools. See the `latex_formula_renderer` plugin for details.
+
+
+Required Translations
+---------------------
+
+You need to add the following translations to your theme if you use theorem environments:
+``` .py
+MESSAGES = {
+    'math_thm_name': 'Theorem',
+    'math_prop_name': 'Proposition',
+    'math_cor_name': 'Corollary',
+    'math_lemma_name': 'Lemma',
+    'math_def_name': 'Definition',
+    'math_defs_name': 'Definitions',
+    'math_proof_name': 'Proof',
+    'math_example_name': 'Example',
+    'math_examples_name': 'Examples',
+    'math_remark_name': 'Remark',
+    'math_remarks_name': 'Remarks',
+}
+```
@@ -0,0 +1,16 @@
+# Determines how the formulae are rendered. Possibilities:
+#  - "latex_formula_image_renderer": renders formulae as graphics and includes them.
+#  - "latex_formula_mathjax": inserts MathJax code.
+#    (The URL of the MathJax script can be overridden with the
+#    LATEX_MATHJAX_SCRIPT_ORIGIN setting.)
+LATEX_FORMULA_RENDERER = "latex_formula_image_renderer"
+
+# When "latex_formula_image_renderer" is selected as the formula renderer,
+# the color and the scale of the formulae can be set here. The values shown
+# below are the ones the renderer falls back to when a setting is missing.
+#
+# The color must be given as an RGB triple with components in range [0, 1].
+# Here, (0, 0, 0) is black and (1, 1, 1) is white.
+LATEX_FORMULA_COLOR = (0., 0., 0.)
+#
+# The formula scale determines the effective size of the formulae.
+# Check what looks good with your theme's main font.
+LATEX_FORMULA_SCALE = 1.25
+
@@ -0,0 +1,12 @@
+[Core]
+Name = latex
+Module = latex
+
+[Nikola]
+PluginCategory = PageCompiler
+
+[Documentation]
+Author = Felix Fontein
+Version = 0.1
+Website = https://felix.fontein.de
+Description = Compile LaTeX-similar text to HTML
@@ -0,0 +1,12 @@
+[Core]
+Name = latex_formula_image_renderer
+Module = latex_formula_image_renderer
+
+[Nikola]
+Compiler = latex
+PluginCategory = CompilerExtension
+
+[Documentation]
+Author = Felix Fontein
+Version = 0.1
+Description = Provides LaTeX image formula rendering
@@ -0,0 +1,191 @@
+# -*- coding: utf-8 -*-
+
+# Copyright © 2014-2017 Felix Fontein
+#
+# Permission is hereby granted, free of charge, to any
+# person obtaining a copy of this software and associated
+# documentation files (the "Software"), to deal in the
+# Software without restriction, including without limitation
+# the rights to use, copy, modify, merge, publish,
+# distribute, sublicense, and/or sell copies of the
+# Software, and to permit persons to whom the Software is
+# furnished to do so, subject to the following conditions:
+#
+# The above copyright notice and this permission notice
+# shall be included in all copies or substantial portions of
+# the Software.
+#
+# THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY
+# KIND, EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE
+# WARRANTIES OF MERCHANTABILITY, FITNESS FOR A PARTICULAR
+# PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS
+# OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR
+# OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
+# OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
+# SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
+
+"""Render formulas for LaTeX post compiler as images using the latex_formula_renderer plugin."""
+
+from __future__ import unicode_literals
+
+import nikola.plugin_categories
+import nikola.utils
+
+import json
+import os.path
+import sys
+
+# Module-level logger for the image formula renderer, obtained from Nikola
+# with its STDERR_HANDLER.
+LOGGER = nikola.utils.get_logger('compile_latex.formula.image', nikola.utils.STDERR_HANDLER)
+
+
+class FormulaContext(object):
+    """Stores information about the formula renderer.
+
+    For the formula image renderer, scale and color are stored in the context.
+    """
+
+    def __init__(self, scale, color):
+        """Create formula context with given scale and color."""
+        self.scale = scale
+        self.color = color
+
+    def clone(self):
+        """Clone this FormulaContext object."""
+        return FormulaContext(self.scale, self.color)
+
+
+def _escape_html_argument(text):
+    """Escape a string to be usable as an HTML tag argument."""
+    result = ""
+    for c in text:
+        if c == "<":
+            result += "&lt;"
+        elif c == ">":
+            result += "&gt;"
+        elif c == "&":
+            result += "&amp;"
+        elif c == '"':
+            result += "&quot;"
+        elif c == "'":
+            result += "&#39;"
+        elif c == " ":
+            result += " "
+        elif '0' <= c <= '9' or 'A' <= c <= 'Z' or 'a' <= c <= 'z' or c in {'/', ':', '.', '@', '-', '_'}:
+            result += c
+        else:
+            result += '&#x{0};'.format(hex(ord(c))[2:])
+    return result
+
+
+class LatexImageFormulaRenderer(nikola.plugin_categories.CompilerExtension):
+    """Render LaTeX formulae as image files using the latex_formula_renderer plugin."""
+
+    name = 'latex_formula_image_renderer'
+    compiler_name = 'latex'
+    latex_plugin_type = 'formula_renderer'
+
+    def __init__(self):
+        """Initialize plugin."""
+        super(LatexImageFormulaRenderer, self).__init__()
+        self.__formula_scale = 1.25
+        self.__formula_color = (0., 0., 0.)
+
+    def _get_formulae_filename(self, post, lang):
+        """Get filename for post and language to store LaTeX formulae in."""
+        return post.translated_base_path(lang) + '.ltxfor'
+
+    def _collect_formulas(self):
+        """Collect LaTeX formulae used in posts."""
+        # Look for candidates from posts
+        candidates = set()
+        for post in self.site.timeline:
+            if post.compiler.name != 'latex':
+                continue
+            for lang in self.site.config['TRANSLATIONS']:
+                candidates.add(self._get_formulae_filename(post, lang))
+        # Look for candidates from extra formula sources
+        for dirpath, _, filenames in os.walk(self.__extra_formula_sources, followlinks=True):
+            for filename in filenames:
+                if filename.endswith('.texfor'):
+                    candidates.add(os.path.join(dirpath, filename))
+        # Check the candidates
+        formulae = []
+        for fn in candidates:
+            if os.path.isfile(fn):
+                with open(fn, "rb") as f:
+                    fs = json.loads(f.read().decode('utf-8'))
+                for f in fs:
+                    formulae.append(tuple(f))
+        return formulae
+
+    def set_site(self, site):
+        """Set Nikola site object."""
+        super(LatexImageFormulaRenderer, self).set_site(site)
+        self.__formula_color = site.config.get('LATEX_FORMULA_COLOR', self.__formula_color)
+        self.__formula_scale = site.config.get('LATEX_FORMULA_SCALE', self.__formula_scale)
+        self.__extra_formula_sources = os.path.join(site.config['CACHE_FOLDER'], 'extra-formula-sources')
+
+        if not hasattr(site, 'latex_formula_collectors'):
+            site.latex_formula_collectors = []
+        site.latex_formula_collectors.append(self._collect_formulas)
+
+    def create_context(self):
+        """Create a FormulaContext object."""
+        return FormulaContext(self.__formula_scale, self.__formula_color)
+
+    def get_extra_targets(self, post, lang, dest):
+        """Return a list of extra formula-related targets."""
+        return [self._get_formulae_filename(post, lang)]
+
+    def add_extra_deps(self, post, lang, what, where):
+        """Return a list of extra dependencies for given post and language."""
+        if what == 'uptodate' and where == 'fragment':
+            return [nikola.utils.config_changed({
+                'scale': self.__formula_scale,
+                'color': list(self.__formula_color),
+            }, 'latex_formula_image_renderer:config')]
+        return []
+
+    def _write_formulae(self, latex_context, filename):
+        """Write used LaTeX formulae into JSON-encoded file."""
+        formulae = sorted(latex_context.get_plugin_data(self.name, 'formulae', []))
+        with open(filename, "wb") as f:
+            f.write(json.dumps(formulae, sort_keys=True).encode('utf-8'))
+
+    def write_extra_targets(self, post, lang, dest, latex_context):
+        """Write extra formula-related targets."""
+        self._write_formulae(latex_context, self._get_formulae_filename(post, lang))
+
+    def before_processing(self, latex_context, source_path=None, post=None):
+        """Add information to context before post is processed."""
+        latex_context.store_plugin_data(self.name, 'formulae', [])
+
+    def after_processing(self, latex_context, source_path=None, post=None):
+        """Retrieve information from context after post is processed."""
+        if post is None and source_path is not None:
+            fn = os.path.join(self.__extra_formula_sources, source_path, '.texfor')
+            nikola.utils.makedirs(os.path.split(fn)[0])
+            self._write_formulae(latex_context, fn)
+
+    def modify_result(self, output, latex_context):
+        """Modify generated HTML output."""
+        return output
+
+    def render(self, formula, formula_context, formula_type, latex_context):
+        """Produce HTML code which displays the formula.
+
+        formula: LaTeX code for the formula (excluding environment/delimiters)
+        formula_context: a FormulaContext object created by this object (or a clone of it)
+        formula_type: one of 'inline', 'display', 'align', 'pstricks', 'tikzpicture'
+        latex_context: the LaTeX context object
+        """
+        try:
+            lfr = self.site.latex_formula_renderer
+        except:
+            LOGGER.error("Cannot find latex formula rendering plugin!")
+            sys.exit(1)
+        src, width, height = lfr.compile(formula, formula_context.color, formula_context.scale, formula_type)
+        latex_context.get_plugin_data(self.name, 'formulae', []).append((formula, formula_context.color, formula_context.scale, formula_type))
+        alt_text = _escape_html_argument(formula).strip()
+        css_type = formula_type
+        return "<img class='img-{0}-formula img-formula' width='{1}' height='{2}' src='{3}' alt='{4}' title='{4}' />".format(css_type, width, height, src, alt_text)
@@ -0,0 +1,12 @@
+[Core]
+Name = latex_formula_mathjax
+Module = latex_formula_mathjax
+
+[Nikola]
+Compiler = latex
+PluginCategory = CompilerExtension
+
+[Documentation]
+Author = Felix Fontein
+Version = 0.1
+Description = Provides mathjax-based formula rendering
@@ -0,0 +1,112 @@
+# -*- coding: utf-8 -*-
+
+# Copyright © 2014-2017 Felix Fontein
+#
+# Permission is hereby granted, free of charge, to any
+# person obtaining a copy of this software and associated
+# documentation files (the "Software"), to deal in the
+# Software without restriction, including without limitation
+# the rights to use, copy, modify, merge, publish,
+# distribute, sublicense, and/or sell copies of the
+# Software, and to permit persons to whom the Software is
+# furnished to do so, subject to the following conditions:
+#
+# The above copyright notice and this permission notice
+# shall be included in all copies or substantial portions of
+# the Software.
+#
+# THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY
+# KIND, EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE
+# WARRANTIES OF MERCHANTABILITY, FITNESS FOR A PARTICULAR
+# PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS
+# OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR
+# OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
+# OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
+# SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
+
+"""Display formulas for LaTeX post compiler via MathJax."""
+
+from __future__ import unicode_literals
+
+import nikola.plugin_categories
+import nikola.utils
+
+# Module-level logger for the MathJax formula renderer, obtained from Nikola
+# with its STDERR_HANDLER.
+LOGGER = nikola.utils.get_logger('compile_latex.formula.mathjax', nikola.utils.STDERR_HANDLER)
+
+
+class FormulaContext(object):
+    """Stores information about the formula renderer."""
+
+    def clone(self):
+        """Clone this FormulaContext object."""
+        return FormulaContext()
+
+
+class MathJaxFormulaRenderer(nikola.plugin_categories.CompilerExtension):
+    """Show LaTeX formulae via MathJax. Supports only inline and display-style formulae."""
+
+    name = 'latex_formula_mathjax'
+    compiler_name = 'latex'
+    latex_plugin_type = 'formula_renderer'
+
+    def __init__(self):
+        """Initialize plugin."""
+        super(MathJaxFormulaRenderer, self).__init__()
+        self.__script_origin = '//cdn.mathjax.org/mathjax/latest/MathJax.js'
+        self.__delimiters = {
+            'inline': r'\({0}\)',
+            'display': r'$${0}$$'
+        }
+
+    def set_site(self, site):
+        """Set Nikola site object."""
+        super(MathJaxFormulaRenderer, self).set_site(site)
+        self.__script_origin = site.config.get('LATEX_MATHJAX_SCRIPT_ORIGIN', self.__script_origin)
+
+    def create_context(self):
+        """Create a FormulaContext object."""
+        return FormulaContext()
+
+    def get_extra_targets(self, post, lang, dest):
+        """Return a list of extra formula-related targets."""
+        return []
+
+    def add_extra_deps(self, post, lang, what, where):
+        """Return a list of extra dependencies for given post and language."""
+        if what == 'uptodate' and where == 'fragment':
+            return [nikola.utils.config_changed({
+                'script_origin': self.__script_origin,
+                'delimiters': self.__delimiters,
+            }, 'latex_formula_mathjax:config')]
+        return []
+
+    def write_extra_targets(self, post, lang, dest, latex_context):
+        """Write extra formula-related targets."""
+        pass
+
+    def before_processing(self, latex_context, source_path=None, post=None):
+        """Add information to context before post is processed."""
+        pass
+
+    def after_processing(self, latex_context, source_path=None, post=None):
+        """Retrieve information from context after post is processed."""
+        pass
+
+    def modify_result(self, output, latex_context):
+        """Modify generated HTML output."""
+        prefix = '''<script type="text/x-mathjax-config">MathJax.Hub.Config({tex2jax: {inlineMath: [['\\\\(','\\\\)']]}});</script>'''
+        prefix += '''<script type="application/javascript" src="''' + self.__script_origin + '''?config=TeX-AMS_HTML-full"></script>'''
+        return prefix + output
+
+    def render(self, formula, formula_context, formula_type, latex_context):
+        """Produce HTML code which displays the formula.
+
+        formula: LaTeX code for the formula (excluding environment/delimiters)
+        formula_context: a FormulaContext object created by this object (or a clone of it)
+        formula_type: one of 'inline', 'display', 'align', 'pstricks', 'tikzpicture'
+        latex_context: the LaTeX context object
+        """
+        if formula_type not in self.__delimiters:
+            raise NotImplementedError("Formula type '{}' is not supported by MathJax formula rendering backend!".format(formula_type))
+
+        return self.__delimiters[formula_type].format(formula)
@@ -0,0 +1,378 @@
+# -*- coding: utf-8 -*-
+
+# Copyright © 2014-2017 Felix Fontein
+#
+# Permission is hereby granted, free of charge, to any
+# person obtaining a copy of this software and associated
+# documentation files (the "Software"), to deal in the
+# Software without restriction, including without limitation
+# the rights to use, copy, modify, merge, publish,
+# distribute, sublicense, and/or sell copies of the
+# Software, and to permit persons to whom the Software is
+# furnished to do so, subject to the following conditions:
+#
+# The above copyright notice and this permission notice
+# shall be included in all copies or substantial portions of
+# the Software.
+#
+# THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY
+# KIND, EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE
+# WARRANTIES OF MERCHANTABILITY, FITNESS FOR A PARTICULAR
+# PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS
+# OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR
+# OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
+# OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
+# SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
+
+"""A basic LaTeX tokenizer."""
+
+from __future__ import unicode_literals
+
+import nikola.utils
+
+from enum import Enum
+
+# Module-level logger for the tokenizer, obtained from Nikola with its
+# STDERR_HANDLER.
+LOGGER = nikola.utils.get_logger('compile_latex.tokenizer', nikola.utils.STDERR_HANDLER)
+
+
+class Token(Enum):
+    """Represents a single token.
+
+    The members are the token types emitted by the tokenizer. Some tokens
+    carry a value (for example the text of a Text token or the name of a
+    Command token); the others are fully described by their type.
+    """
+
+    Whitespace = 1  # run of whitespace containing at most one line break
+    NonbreakableWhitespace = 2  # '~'
+    Text = 3  # run of ordinary characters
+    EscapedText = 4  # '\' followed by a single character which is not a command
+    Command = 5  # '\' followed by text
+    InlineFormulaDelimiter = 6  # just '$' (the alternative, '\(', is a Command)
+    DisplayFormulaDelimiter = 7  # just '$$' (the alternative, '\[', is a Command)
+    CurlyBraketOpen = 8  # '{'
+    CurlyBraketClose = 9  # '}'
+    SquareBraketOpen = 10  # '['
+    SquareBraketClose = 11  # ']'
+    DoubleNewLine = 12  # run of whitespace containing more than one line break
+    Comment = 13  # '%'
+    ForcedLineBreak = 14  # '\\'
+    TableColumnDelimiter = 15  # '&'
+
+
+def _compute_position(input, index):
+    """Compute line/column position given an index in a string."""
+    line = 1
+    col = 1
+    eol = None  # last end of line character
+    for c in input[:index]:
+        if c == '\n' or c == '\r':
+            if eol is None or eol == c:
+                eol = c
+                line += 1
+                col = 1
+            else:
+                # ignore second of '\n\r' and '\r\n' sequences
+                eol = None
+        else:
+            col += 1
+    return (line, col)
+
+
+class Tokenizer:
+    """A simple tokenizer."""
+
+    def _is_whitespace(self, char):
+        """Check for whitespace."""
+        return ord(char) <= 32
+
+    def _is_line_break(self, char):
+        """Check for line breaks."""
+        return ord(char) == 10 or ord(char) == 13
+
+    def _is_command_char(self, char):
+        """Check for a command character."""
+        return (char >= 'A' and char <= 'Z') or (char >= 'a' and char <= 'z') or (char == '@')
+
+    def _eat_whitespace(self):
+        """Skip whitespace and return number of contained line breaks."""
+        number_of_line_breaks = 0
+        last_line_break = None
+        while self._position < len(self._input):
+            if not self._is_whitespace(self._input[self._position]):
+                break
+            if self._is_line_break(self._input[self._position]):
+                if last_line_break is None or last_line_break == self._input[self._position]:
+                    number_of_line_breaks += 1
+                last_line_break = self._input[self._position]
+            else:
+                last_line_break = None
+            self._position += 1
+        return number_of_line_breaks
+
+    def _eat_comment(self):
+        """Skip comment's content."""
+        start = self._position
+        last_line_break = None
+        had_line_break = False
+        while self._position < len(self._input):
+            if had_line_break and not self._is_whitespace(self._input[self._position]):
+                break
+            if self._is_line_break(self._input[self._position]):
+                if last_line_break is None or last_line_break == self._input[self._position]:
+                    if had_line_break:
+                        break
+                last_line_break = self._input[self._position]
+                had_line_break = True
+            else:
+                last_line_break = None
+            self._position += 1
+        return self._input[start:self._position]
+
+    def _read_text(self, strict):
+        """Read text."""
+        start = self._position
+        while self._position < len(self._input):
+            char = self._input[self._position]
+            if self._is_whitespace(char):
+                break
+            if char == "~" or char == "{" or char == "}" or char == "$" or char == "[" or char == "]" or char == "$" or char == "\\" or char == "&":
+                break
+            if strict and not self._is_command_char(char):
+                break
+            self._position += 1
+        return self._input[start:self._position]
+
+    def _find_next(self):
+        """Find next token."""
+        self._token = None
+        self._token_value = None
+        self._token_begin_index = None
+        self._token_end_index = None
+        if (self._position >= len(self._input)):
+            return
+        self._token_begin_index = self._position
+        char = self._input[self._position]
+        if self._is_whitespace(char):
+            number_of_line_breaks = self._eat_whitespace()
+            if number_of_line_breaks > 1:
+                self._token = Token.DoubleNewLine
+            else:
+                self._token = Token.Whitespace
+        elif char == "~":
+            self._token = Token.NonbreakableWhitespace
+            self._position += 1
+        elif char == '&':
+            self._token = Token.TableColumnDelimiter
+            self._position += 1
+        elif char == "{":
+            self._token = Token.CurlyBraketOpen
+            self._position += 1
+        elif char == "}":
+            self._token = Token.CurlyBraketClose
+            self._position += 1
+        elif char == "[":
+            self._token = Token.SquareBraketOpen
+            self._position += 1
+        elif char == "]":
+            self._token = Token.SquareBraketClose
+            self._position += 1
+        elif char == "$":
+            self._token = Token.InlineFormulaDelimiter
+            self._position += 1
+            if self._position < len(self._input) and self._input[self._position] == "$":
+                self._token = Token.DisplayFormulaDelimiter
+                self._position += 1
+        elif char == "\\":
+            self._position += 1
+            if self._position == len(self._input):
+                raise "Reached end of text after '\\'"
+            self._token = Token.Command
+            cmd = self._read_text(True)
+            if len(cmd) == 0:
+                ch = self._input[self._position]
+                if ch == '(' or ch == ')' or ch == '[' or ch == ']':
+                    self._token_value = ch
+                elif ch == '\\':
+                    self._token = Token.ForcedLineBreak
+                else:
+                    self._token = Token.EscapedText
+                    self._token_value = ch
+                self._position += 1
+            else:
+                self._token_value = cmd
+        elif char == '%':
+            self._token = Token.Comment
+            self._position += 1
+            self._token_value = self._eat_comment()
+        else:
+            self._token = Token.Text
+            self._token_value = self._read_text(False)
+        self._token_end_index = self._position
+
+    def __init__(self, input):
+        """Initialize tokenizer with input unicode string ``input``."""
+        self._input = input
+        self._position = 0
+        self._find_next()
+
+    def has_token(self):
+        """Whether a token is available."""
+        return self._token is not None
+
+    def token_type(self):
+        """Return type of current token."""
+        return self._token
+
+    def token_value(self):
+        """Return value of current token."""
+        # only if token_type() returns Token.Text or Token.Command
+        return self._token_value
+
+    def token_begin_index(self):
+        """Return beginning of token in input string."""
+        return self._token_begin_index
+
+    def token_end_index(self):
+        """Return end of token in input string."""
+        return self._token_end_index
+
+    def next(self):
+        """Proceed to next token."""
+        if self._token is not None:
+            self._find_next()
+
+    def get_substring(self, start_index, end_index):
+        """Return substring of input string."""
+        return self._input[start_index:end_index]
+
+    def get_position(self, index):
+        """Retrieve position as (line, column) pair in input string."""
+        return _compute_position(self._input, index)
+
+
+class TokenStream:
+    """Represent the output of a Tokenizer as a stream of tokens, allowing to peek ahead."""
+
+    def _fill_ahead(self, count):
+        """Fill ahead buffer."""
+        if len(self.__ahead) < count:
+            for i in range(len(self.__ahead), count):
+                if self.__tokenizer.has_token():
+                    self.__ahead.append((self.__tokenizer.token_type(), self.__tokenizer.token_value()))
+                    self.__ahead_indices.append((self.__tokenizer.token_begin_index(), self.__tokenizer.token_end_index()))
+                    self.__tokenizer.next()
+                else:
+                    self.__ahead.append((None, None))
+                    self.__ahead_indices.append((None, None))
+
+    def __init__(self, input):
+        """Create TokenStream from input unicode string. Creates Tokenizer."""
+        self.__tokenizer = Tokenizer(input)
+        self.__ahead = list()
+        self.__ahead_indices = list()
+
+    def current(self):
+        """Get current token. Return pair (type, value)."""
+        self._fill_ahead(1)
+        return self.__ahead[0]
+
+    def current_indices(self):
+        """Get current token indices in input string."""
+        self._fill_ahead(1)
+        return self.__ahead_indices[0]
+
+    def current_type(self):
+        """Get current token type."""
+        self._fill_ahead(1)
+        return self.__ahead[0][0]
+
+    def current_value(self):
+        """Get current token value."""
+        self._fill_ahead(1)
+        return self.__ahead[0][1]
+
+    def has_current(self):
+        """Return True if current token is available."""
+        self._fill_ahead(1)
+        return self.__ahead[0][0] is not None
+
+    def skip_current(self, count=1):
+        """Skip number of tokens."""
+        assert count >= 0
+        self._fill_ahead(count)
+        self.__ahead = self.__ahead[count:]
+        self.__ahead_indices = self.__ahead_indices[count:]
+
+    def peek(self, index):
+        """Peek ahead in token stream. Return pair (type, value)."""
+        assert index >= 0
+        self._fill_ahead(index + 1)
+        return self.__ahead[index]
+
+    def peek_indices(self, index):
+        """Peek ahead in token stream. Return indices of token in input string."""
+        assert index >= 0
+        self._fill_ahead(index + 1)
+        return self.__ahead_indices[index]
+
+    def peek_type(self, index):
+        """Peek ahead in token stream. Return token's type."""
+        assert index >= 0
+        self._fill_ahead(index + 1)
+        return self.__ahead[index][0]
+
+    def peek_value(self, index):
+        """Peek ahead in token stream. Return token's value."""
+        assert index >= 0
+        self._fill_ahead(index + 1)
+        return self.__ahead[index][1]
+
+    def can_peek(self, index):
+        """Check whether token at current index + ``index`` can be peeked at, i.e. whether it exists."""
+        assert index >= 0
+        self._fill_ahead(index + 1)
+        return self.__ahead[index][0] is not None
+
+    def get_substring(self, start_index, end_index):
+        """Return substring of input string."""
+        return self.__tokenizer.get_substring(start_index, end_index)
+
+    def get_position(self, index):
+        """Retrieve position as (line, column) pair in input string."""
+        return self.__tokenizer.get_position(index)
+
+    def set_value(self, index, new_value):
+        """Set value of token at current index + ``index`` to ``new_value``.
+
+        Use with care!
+        """
+        assert index >= 0
+        self._fill_ahead(index + 1)
+        self.__ahead[index] = (self.__ahead[index][0], new_value)
+
+
+def recombine_tokens(tokens):
+    """Recombine list of tokens as string."""
+    result = ""
+    for type, value in tokens:
+        if type == Token.Whitespace:
+            result += " "
+        if type == Token.NonbreakableWhitespace:
+            result += "~"
+        elif type == Token.Text:
+            result += value
+        elif type == Token.EscapedText:
+            result += "\\{}".format(value)
+        elif type == Token.Command:
+            result += "\\{}".format(value)
+        elif type == Token.InlineFormulaDelimiter:
+            result += "$"
+        elif type == Token.DisplayFormulaDelimiter:
+            result += "$$"
+        elif type == Token.CurlyBraketOpen:
+            result += "{"
+        elif type == Token.CurlyBraketClose:
+            result += "}"
+        elif type == Token.SquareBraketOpen:
+            result += "["
+        elif type == Token.SquareBraketClose:
+            result += "]"
+        elif type == Token.DoubleNewLine:
+            result += "\n\n"
+    return result
@@ -0,0 +1 @@
+latex_formula_renderer