Source code for autotest.client.shared.jsontemplate

# Copyright (C) 2009 Andy Chu
#
# Andy Chu agreed with double licensing this file for the purposes of
# usage inside autotest with both the Apache license, Version 2.0, and
# the GPL Version 2.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#      http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

"""Python implementation of json-template.

JSON Template is a minimal and powerful templating language for transforming a
JSON dictionary to arbitrary text.

To use this module, you will typically use the Template constructor, and catch
various exceptions thrown.  You may also want to use the FromFile/FromString
methods, which allow Template constructor options to be embedded in the template
string itself.

Other functions are exposed for tools which may want to process templates.
"""

__author__ = 'Andy Chu'

__all__ = [
    'Error', 'CompilationError', 'EvaluationError', 'BadFormatter',
    'BadPredicate', 'MissingFormatter', 'ConfigurationError',
    'TemplateSyntaxError', 'UndefinedVariable', 'CompileTemplate', 'FromString',
    'FromFile', 'Template', 'expand']

import StringIO
import pprint
import re

# For formatters
import cgi  # cgi.escape
import urllib  # for urllib.encode
import urlparse  # for urljoin


[docs]class Error(Exception):

    """Base class for all exceptions in this module.

    Thus you can "except jsontemplate.Error: to catch all exceptions thrown by
    this module.
    """

    def __str__(self):
        """This helps people debug their templates.

        If a variable isn't defined, then some context is shown in the traceback.
        TODO: Attach context for other errors.
        """
        if hasattr(self, 'near'):
            return '%s\n\nNear: %s' % (self.args[0], pprint.pformat(self.near))
        else:
            return self.args[0]


[docs]class CompilationError(Error):

    """Base class for errors that happen during the compilation stage."""


[docs]class EvaluationError(Error):

    """Base class for errors that happen when expanding the template.

    This class of errors generally involve the data dictionary or the execution of
    the formatters.
    """

    def __init__(self, msg, original_exception=None):
        Error.__init__(self, msg)
        self.original_exception = original_exception


[docs]class BadFormatter(CompilationError):

    """A bad formatter was specified, e.g. {variable|BAD}"""


[docs]class BadPredicate(CompilationError):

    """A bad predicate was specified, e.g. {.BAD?}"""


[docs]class MissingFormatter(CompilationError):

    """
    Raised when formatters are required, and a variable is missing a formatter.
    """


[docs]class ConfigurationError(CompilationError):

    """
    Raised when the Template options are invalid and it can't even be compiled.
    """


[docs]class TemplateSyntaxError(CompilationError):

    """Syntax error in the template text."""


[docs]class UndefinedVariable(EvaluationError):

    """The template contains a variable not defined by the data dictionary."""


_SECTION_RE = re.compile(r'(repeated)?\s*section\s+(\S+)')

# Some formatters and predicates need to look up values in the whole context,
# rather than just the current node.  'Node functions' start with a lowercase
# letter; 'Context functions' start with any other character.
SIMPLE_FUNC, ENHANCED_FUNC = 0, 1


class FunctionRegistry(object):

    """Abstract class for looking up formatters or predicates at compile time."""

    def Lookup(self, user_str):
        """Lookup a function.

        Args:
          user_str: A raw string from the user, which may include uninterpreted
            arguments.  For example, 'pluralize person people' or 'test? admin'

        Returns:
          A 2-tuple of (function, args)
            function: Callable that formats data as a string
            args: Extra arguments to be passed to the function at expansion time
              Should be None to pass NO arguments, since it can pass a 0-tuple too.
        """
        raise NotImplementedError

    def LookupWithType(self, user_str):
        func, args = self.Lookup(user_str)
        # If users need the complexity of FunctionRegistry, then they get the
        # 3-arguments formatter signature (value, context, args)
        return func, args, ENHANCED_FUNC


def _DecideFuncType(user_str):
    """
    By default, formatters/predicates which start with a non-lowercase letter take
    contexts rather than just the cursor.
    """
    if user_str[0].islower():
        return SIMPLE_FUNC
    else:
        return ENHANCED_FUNC


class DictRegistry(FunctionRegistry):

    """Look up functions in a simple dictionary."""

    def __init__(self, func_dict):
        self.func_dict = func_dict

    def LookupWithType(self, user_str):
        return self.func_dict.get(user_str), None, _DecideFuncType(user_str)


class CallableRegistry(FunctionRegistry):

    """Look up functions in a (higher-order) function."""

    def __init__(self, func):
        self.func = func

    def LookupWithType(self, user_str):
        return self.func(user_str), None, _DecideFuncType(user_str)


class PrefixRegistry(FunctionRegistry):

    """Lookup functions with arguments.

    The function name is identified by a prefix.  The character after the prefix,
    usually a space, is considered the argument delimiter (similar to sed/perl's
    s/foo/bar s|foo|bar syntax).
    """

    def __init__(self, functions):
        """
        Args:
          functions: List of 2-tuples (prefix, function), e.g.
          [('pluralize', _Pluralize), ('cycle', _Cycle)]
        """
        self.functions = functions

    def Lookup(self, user_str):
        for prefix, func in self.functions:
            if user_str.startswith(prefix):
                i = len(prefix)

                # Usually a space, but could be something else
                try:
                    splitchar = user_str[i]
                except IndexError:
                    args = ()  # No arguments
                else:
                    args = user_str.split(splitchar)[1:]

                return func, args
        return None, ()


class ChainedRegistry(FunctionRegistry):

    """Look up functions in chain of other FunctionRegistry instances."""

    def __init__(self, registries):
        self.registries = registries

    def LookupWithType(self, user_str):
        for registry in self.registries:
            func, args, func_type = registry.LookupWithType(user_str)
            if func:
                return func, args, func_type

        # Nothing found
        return None, None, SIMPLE_FUNC


class _ProgramBuilder(object):

    """
    Receives method calls from the parser, and constructs a tree of _Section()
    instances.
    """

    def __init__(self, formatters, predicates):
        """
        Args:
          formatters: See docstring for CompileTemplate
          predicates: See docstring for CompileTemplate
        """
        self.current_block = _Section()
        self.stack = [self.current_block]

        # Passing a dictionary or a function is often more convenient than making a
        # FunctionRegistry
        if isinstance(formatters, dict):
            formatters = DictRegistry(formatters)
        elif callable(formatters):
            formatters = CallableRegistry(formatters)

        # default formatters with arguments
        default_formatters = PrefixRegistry([
            ('pluralize', _Pluralize), ('cycle', _Cycle)
        ])

        # First consult user formatters, then the default formatters
        self.formatters = ChainedRegistry(
            [formatters, DictRegistry(_DEFAULT_FORMATTERS), default_formatters])

        # Same for predicates
        if isinstance(predicates, dict):
            predicates = DictRegistry(predicates)
        elif callable(predicates):
            predicates = CallableRegistry(predicates)

        self.predicates = ChainedRegistry(
            [predicates, DictRegistry(_DEFAULT_PREDICATES)])

    def Append(self, statement):
        """
        Args:
          statement: Append a literal
        """
        self.current_block.Append(statement)

    def _GetFormatter(self, format_str):
        """
        The user's formatters are consulted first, then the default formatters.
        """
        formatter, args, func_type = self.formatters.LookupWithType(format_str)
        if formatter:
            return formatter, args, func_type
        else:
            raise BadFormatter('%r is not a valid formatter' % format_str)

    def _GetPredicate(self, pred_str):
        """
        The user's predicates are consulted first, then the default predicates.
        """
        predicate, args, func_type = self.predicates.LookupWithType(pred_str)
        if predicate:
            return predicate, args, func_type
        else:
            raise BadPredicate('%r is not a valid predicate' % pred_str)

    def AppendSubstitution(self, name, formatters):
        formatters = [self._GetFormatter(f) for f in formatters]
        self.current_block.Append((_DoSubstitute, (name, formatters)))

    def _NewSection(self, func, new_block):
        self.current_block.Append((func, new_block))
        self.stack.append(new_block)
        self.current_block = new_block

    def NewSection(self, token_type, section_name):
        """For sections or repeated sections."""

        # TODO: Consider getting rid of this dispatching, and turn _Do* into methods
        if token_type == REPEATED_SECTION_TOKEN:
            new_block = _RepeatedSection(section_name)
            func = _DoRepeatedSection
        elif token_type == SECTION_TOKEN:
            new_block = _Section(section_name)
            func = _DoSection
        else:
            raise AssertionError('Invalid token type %s' % token_type)

        self._NewSection(func, new_block)

    def NewOrClause(self, pred_str):
        """
        {.or ...} Can appear inside predicate blocks or section blocks, with
        slightly different meaning.
        """
        if pred_str:
            pred = self._GetPredicate(pred_str)
        else:
            pred = None
        self.current_block.NewOrClause(pred)

    def AlternatesWith(self):
        self.current_block.AlternatesWith()

    def NewPredicateSection(self, pred_str):
        """For chains of predicate clauses."""
        pred = self._GetPredicate(pred_str)
        block = _PredicateSection()
        block.NewOrClause(pred)

        self._NewSection(_DoPredicates, block)

    def EndSection(self):
        self.stack.pop()
        self.current_block = self.stack[-1]

    def Root(self):
        # It's assumed that we call this at the end of the program
        return self.current_block


class _AbstractSection(object):

    def __init__(self):
        # Pairs of func, args, or a literal string
        self.current_clause = []

    def Append(self, statement):
        """Append a statement to this block."""
        self.current_clause.append(statement)

    def AlternatesWith(self):
        raise TemplateSyntaxError(
            '{.alternates with} can only appear with in {.repeated section ...}')

    def NewOrClause(self):
        raise NotImplementedError


class _Section(_AbstractSection):

    """Represents a (repeated) section."""

    def __init__(self, section_name=None):
        """
        Args:
          section_name: name given as an argument to the section
          token_type: The token type that created this section (e.g.
              PREDICATE_TOKEN)
        """
        _AbstractSection.__init__(self)
        self.section_name = section_name

        # Clauses is just a string and a list of statements.
        self.statements = {'default': self.current_clause}

    def __repr__(self):
        return '<Section %s>' % self.section_name

    def Statements(self, clause='default'):
        return self.statements.get(clause, [])

    def NewOrClause(self, pred):
        if pred:
            raise TemplateSyntaxError(
                '{.or} clause only takes a predicate inside predicate blocks')
        self.current_clause = []
        self.statements['or'] = self.current_clause


class _RepeatedSection(_Section):

    """Repeated section is like section, but it supports {.alternates with}"""

    def AlternatesWith(self):
        self.current_clause = []
        self.statements['alternates with'] = self.current_clause


class _PredicateSection(_AbstractSection):

    """Represents a sequence of predicate clauses."""

    def __init__(self):
        _AbstractSection.__init__(self)
        # List of func, statements
        self.clauses = []

    def NewOrClause(self, pred):
        # {.or} always executes if reached
        pred = pred or (lambda x: True, None, SIMPLE_FUNC)  # 3-tuple
        self.current_clause = []
        self.clauses.append((pred, self.current_clause))


class _Frame(object):

    """A stack frame."""

    def __init__(self, context, index=-1):
        # Public attributes
        self.context = context
        self.index = index   # An iteration index.  -1 means we're NOT iterating.

    def __str__(self):
        return 'Frame %s (%s)' % (self.context, self.index)


class _ScopedContext(object):

    """Allows scoped lookup of variables.

    If the variable isn't in the current context, then we search up the stack.
    """

    def __init__(self, context, undefined_str):
        """
        Args:
          context: The root context
          undefined_str: See Template() constructor.
        """
        self.stack = [_Frame(context)]
        self.undefined_str = undefined_str

    def PushSection(self, name):
        """Given a section name, push it on the top of the stack.

        Returns:
          The new section, or None if there is no such section.
        """
        if name == '@':
            new_context = self.stack[-1].context
        else:
            new_context = self.stack[-1].context.get(name)
        self.stack.append(_Frame(new_context))
        return new_context

    def Pop(self):
        self.stack.pop()

    def Next(self):
        """Advance to the next item in a repeated section.

        Raises:
          StopIteration if there are no more elements
        """
        stacktop = self.stack[-1]

        # Now we're iterating -- push a new mutable object onto the stack
        if stacktop.index == -1:
            stacktop = _Frame(None, index=0)
            self.stack.append(stacktop)

        context_array = self.stack[-2].context

        if stacktop.index == len(context_array):
            self.stack.pop()
            raise StopIteration

        stacktop.context = context_array[stacktop.index]
        stacktop.index += 1

        return True  # OK, we mutated the stack

    def _Undefined(self, name):
        if self.undefined_str is None:
            raise UndefinedVariable('%r is not defined' % name)
        else:
            return self.undefined_str

    def _LookUpStack(self, name):
        """Look up the stack for the given name."""
        i = len(self.stack) - 1
        while 1:
            frame = self.stack[i]
            if name == '@index':
                if frame.index != -1:  # -1 is undefined
                    return frame.index  # @index is 1-based
            else:
                context = frame.context
                if hasattr(context, 'get'):  # Can't look up names in a list or atom
                    try:
                        return context[name]
                    except KeyError:
                        pass

            i -= 1  # Next frame
            if i <= -1:  # Couldn't find it anywhere
                return self._Undefined(name)

    def Lookup(self, name):
        """Get the value associated with a name in the current context.

        The current context could be an dictionary in a list, or a dictionary
        outside a list.

        Args:
          name: name to lookup, e.g. 'foo' or 'foo.bar.baz'

        Returns:
          The value, or self.undefined_str

        Raises:
          UndefinedVariable if self.undefined_str is not set
        """
        if name == '@':
            return self.stack[-1].context

        parts = name.split('.')
        value = self._LookUpStack(parts[0])

        # Now do simple lookups of the rest of the parts
        for part in parts[1:]:
            try:
                value = value[part]
            except (KeyError, TypeError):  # TypeError for non-dictionaries
                return self._Undefined(part)

        return value


def _ToString(x):
    # Some cross-language values for primitives
    if x is None:
        return 'null'
    if isinstance(x, basestring):
        return x
    return pprint.pformat(x)


def _HtmlAttrValue(x):
    return cgi.escape(x, quote=True)


def _AbsUrl(relative_url, context, unused_args):
    """Returns an absolute URL, given the current node as a relative URL.

    Assumes that the context has a value named 'base-url'.  This is a little like
    the HTML <base> tag, but implemented with HTML generation.

    Raises:
      UndefinedVariable if 'base-url' doesn't exist
    """
    # urljoin is flexible about trailing/leading slashes -- it will add or de-dupe
    # them
    return urlparse.urljoin(context.Lookup('base-url'), relative_url)


# See http://google-ctemplate.googlecode.com/svn/trunk/doc/howto.html for more
# escape types.
#
# Also, we might want to take a look at Django filters.
#
# This is a *public* constant, so that callers can use it construct their own
# formatter lookup dictionaries, and pass them in to Template.
_DEFAULT_FORMATTERS = {
    'html': cgi.escape,

    # The 'htmltag' name is deprecated.  The html-attr-value name is preferred
    # because it can be read with "as":
    #   {url|html-attr-value} means:
    #   "substitute 'url' as an HTML attribute value"
    'html-attr-value': _HtmlAttrValue,
    'htmltag': _HtmlAttrValue,

    'raw': lambda x: x,
    # Used for the length of a list.  Can be used for the size of a dictionary
    # too, though I haven't run into that use case.
    'size': lambda value: str(len(value)),

    # The argument is a dictionary, and we get a a=1&b=2 string back.
    'url-params': urllib.urlencode,

    # The argument is an atom, and it takes 'Search query?' -> 'Search+query%3F'
    'url-param-value': urllib.quote_plus,  # param is an atom

    # The default formatter, when no other default is specifier.  For debugging,
    # this could be lambda x: json.dumps(x, indent=2), but here we want to be
    # compatible to Python 2.4.
    'str': _ToString,

    # Just show a plain URL on an HTML page (without anchor text).
    'plain-url': lambda x: '<a href="%s">%s</a>' % (
        cgi.escape(x, quote=True), cgi.escape(x)),

    # A context formatter
    'AbsUrl': _AbsUrl,

    # Placeholders for "standard names".  We're not including them by default
    # since they require additional dependencies.  We can provide a part of the
    # "lookup chain" in formatters.py for people people want the dependency.

    # 'json' formats arbitrary data dictionary nodes as JSON strings.  'json'
    # and 'js-string' are identical (since a JavaScript string *is* JSON).  The
    # latter is meant to be serve as extra documentation when you want a string
    # argument only, which is a common case.
    'json': None,
    'js-string': None,
}


def _Pluralize(value, unused_context, args):
    """Formatter to pluralize words."""

    if len(args) == 0:
        s, p = '', 's'
    elif len(args) == 1:
        s, p = '', args[0]
    elif len(args) == 2:
        s, p = args
    else:
        # Should have been checked at compile time
        raise AssertionError

    if value > 1:
        return p
    else:
        return s


def _Cycle(value, unused_context, args):
    """Cycle between various values on consecutive integers."""
    # @index starts from 1, so used 1-based indexing
    return args[(value - 1) % len(args)]


def _IsDebugMode(unused_value, context, unused_args):
    try:
        return bool(context.Lookup('debug'))
    except UndefinedVariable:
        return False


_DEFAULT_PREDICATES = {
    'singular?': lambda x: x == 1,
    'plural?': lambda x: x > 1,
    'Debug?': _IsDebugMode,
}


def SplitMeta(meta):
    """Split and validate metacharacters.

    Example: '{}' -> ('{', '}')

    This is public so the syntax highlighter and other tools can use it.
    """
    n = len(meta)
    if n % 2 == 1:
        raise ConfigurationError(
            '%r has an odd number of metacharacters' % meta)
    return meta[:n / 2], meta[n / 2:]


_token_re_cache = {}


def MakeTokenRegex(meta_left, meta_right):
    """Return a (compiled) regular expression for tokenization.

    Args:
      meta_left, meta_right: e.g. '{' and '}'

    - The regular expressions are memoized.
    - This function is public so the syntax highlighter can use it.
    """
    key = meta_left, meta_right
    if key not in _token_re_cache:
        # - Need () grouping for re.split
        # - For simplicity, we allow all characters except newlines inside
        #   metacharacters ({} / [])
        _token_re_cache[key] = re.compile(
            r'(' +
            re.escape(meta_left) +
            r'.+?' +
            re.escape(meta_right) +
            r')')
    return _token_re_cache[key]


# Examples:

(LITERAL_TOKEN,  # "Hi"
 SUBSTITUTION_TOKEN,  # {var|html}
 SECTION_TOKEN,  # {.section name}
 REPEATED_SECTION_TOKEN,  # {.repeated section name}
 PREDICATE_TOKEN,  # {.predicate?}
 ALTERNATES_TOKEN,  # {.or}
 OR_TOKEN,  # {.or}
 END_TOKEN,  # {.end}
 ) = range(8)


def _MatchDirective(token):
    """Helper function for matching certain directives."""

    if token.startswith('.'):
        token = token[1:]
    else:
        return None, None  # Must start with .

    if token == 'alternates with':
        return ALTERNATES_TOKEN, token

    if token.startswith('or'):
        if token.strip() == 'or':
            return OR_TOKEN, None
        else:
            pred_str = token[2:].strip()
            return OR_TOKEN, pred_str

    if token == 'end':
        return END_TOKEN, None

    match = _SECTION_RE.match(token)
    if match:
        repeated, section_name = match.groups()
        if repeated:
            return REPEATED_SECTION_TOKEN, section_name
        else:
            return SECTION_TOKEN, section_name

    # {.if plural?} and {.plural?} are synonyms.  The ".if" will read better for
    # expressions, for people who like that kind of dirty thing...
    if token.startswith('if '):
        return PREDICATE_TOKEN, token[3:].strip()
    if token.endswith('?'):
        return PREDICATE_TOKEN, token

    return None, None  # no match


def _Tokenize(template_str, meta_left, meta_right):
    """Yields tokens, which are 2-tuples (TOKEN_TYPE, token_string)."""

    trimlen = len(meta_left)

    token_re = MakeTokenRegex(meta_left, meta_right)

    for line in template_str.splitlines(True):  # retain newlines
        tokens = token_re.split(line)

        # Check for a special case first.  If a comment or "block" directive is on a
        # line by itself (with only space surrounding it), then the space is
        # omitted.  For simplicity, we don't handle the case where we have 2
        # directives, say '{.end} # {#comment}' on a line.

        if len(tokens) == 3:
            # ''.isspace() is False, so work around that
            if (tokens[0].isspace() or not tokens[0]) and \
               (tokens[2].isspace() or not tokens[2]):
                token = tokens[1][trimlen: -trimlen]

                if token.startswith('#'):
                    continue  # The whole line is omitted

                token_type, token = _MatchDirective(token)
                if token_type is not None:
                    yield token_type, token  # Only yield the token, not space
                    continue

        # The line isn't special; process it normally.

        for i, token in enumerate(tokens):
            if i % 2 == 0:
                yield LITERAL_TOKEN, token

            else:  # It's a "directive" in metachracters

                assert token.startswith(meta_left), repr(token)
                assert token.endswith(meta_right), repr(token)
                token = token[trimlen: -trimlen]

                # It's a comment
                if token.startswith('#'):
                    continue

                if token.startswith('.'):

                    literal = {
                        '.meta-left': meta_left,
                        '.meta-right': meta_right,
                        '.space': ' ',
                        '.tab': '\t',
                        '.newline': '\n',
                    }.get(token)

                    if literal is not None:
                        yield LITERAL_TOKEN, literal
                        continue

                    token_type, token = _MatchDirective(token)
                    if token_type is not None:
                        yield token_type, token

                else:  # Now we know the directive is a substitution.
                    yield SUBSTITUTION_TOKEN, token


[docs]def CompileTemplate(
    template_str, builder=None, meta='{}', format_char='|',
    more_formatters=lambda x: None, more_predicates=lambda x: None,
        default_formatter='str'):
    """Compile the template string, calling methods on the 'program builder'.

    Args:
      template_str: The template string.  It should not have any compilation
          options in the header -- those are parsed by FromString/FromFile

      builder: The interface of _ProgramBuilder isn't fixed.  Use at your own
          risk.

      meta: The metacharacters to use, e.g. '{}', '[]'.

      more_formatters:
          Something that can map format strings to formatter functions.  One of:
            - A plain dictionary of names -> functions  e.g. {'html': cgi.escape}
            - A higher-order function which takes format strings and returns
              formatter functions.  Useful for when formatters have parsed
              arguments.
            - A FunctionRegistry instance for the most control.  This allows
              formatters which takes contexts as well.

      more_predicates:
          Like more_formatters, but for predicates.

      default_formatter: The formatter to use for substitutions that are missing a
          formatter.  The 'str' formatter the "default default" -- it just tries
          to convert the context value to a string in some unspecified manner.

    Returns:
      The compiled program (obtained from the builder)

    Raises:
      The various subclasses of CompilationError.  For example, if
      default_formatter=None, and a variable is missing a formatter, then
      MissingFormatter is raised.

    This function is public so it can be used by other tools, e.g. a syntax
    checking tool run before submitting a template to source control.
    """
    builder = builder or _ProgramBuilder(more_formatters, more_predicates)
    meta_left, meta_right = SplitMeta(meta)

    # : is meant to look like Python 3000 formatting {foo:.3f}.  According to
    # PEP 3101, that's also what .NET uses.
    # | is more readable, but, more importantly, reminiscent of pipes, which is
    # useful for multiple formatters, e.g. {name|js-string|html}
    if format_char not in (':', '|'):
        raise ConfigurationError(
            'Only format characters : and | are accepted (got %r)' % format_char)

    # If we go to -1, then we got too many {end}.  If end at 1, then we're missing
    # an {end}.
    balance_counter = 0

    for token_type, token in _Tokenize(template_str, meta_left, meta_right):

        if token_type == LITERAL_TOKEN:
            if token:
                builder.Append(token)
            continue

        if token_type in (SECTION_TOKEN, REPEATED_SECTION_TOKEN):
            builder.NewSection(token_type, token)
            balance_counter += 1
            continue

        if token_type == PREDICATE_TOKEN:
            # Everything of the form {.predicate?} starts a new predicate section
            block_made = builder.NewPredicateSection(token)
            balance_counter += 1
            continue

        if token_type == OR_TOKEN:
            builder.NewOrClause(token)
            continue

        if token_type == ALTERNATES_TOKEN:
            builder.AlternatesWith()
            continue

        if token_type == END_TOKEN:
            balance_counter -= 1
            if balance_counter < 0:
                # TODO: Show some context for errors
                raise TemplateSyntaxError(
                    'Got too many %send%s statements.  You may have mistyped an '
                    "earlier 'section' or 'repeated section' directive."
                    % (meta_left, meta_right))
            builder.EndSection()
            continue

        if token_type == SUBSTITUTION_TOKEN:
            parts = token.split(format_char)
            if len(parts) == 1:
                if default_formatter is None:
                    raise MissingFormatter('This template requires explicit formatters.')
                # If no formatter is specified, the default is the 'str' formatter,
                # which the user can define however they desire.
                name = token
                formatters = [default_formatter]
            else:
                name = parts[0]
                formatters = parts[1:]

            builder.AppendSubstitution(name, formatters)

    if balance_counter != 0:
        raise TemplateSyntaxError('Got too few %send%s statements' %
                                  (meta_left, meta_right))

    return builder.Root()


_OPTION_RE = re.compile(r'^([a-zA-Z\-]+):\s*(.*)')
# TODO: whitespace mode, etc.
_OPTION_NAMES = ['meta', 'format-char', 'default-formatter', 'undefined-str']


[docs]def FromString(s, more_formatters=lambda x: None, _constructor=None):
    """Like FromFile, but takes a string."""

    f = StringIO.StringIO(s)
    return FromFile(f, more_formatters=more_formatters, _constructor=_constructor)


[docs]def FromFile(f, more_formatters=lambda x: None, _constructor=None):
    """Parse a template from a file, using a simple file format.

    This is useful when you want to include template options in a data file,
    rather than in the source code.

    The format is similar to HTTP or E-mail headers.  The first lines of the file
    can specify template options, such as the metacharacters to use.  One blank
    line must separate the options from the template body.

    Example:

      default-formatter: none
      meta: {{}}
      format-char: :
      <blank line required>
      Template goes here: {{variable:html}}

    Args:
      f: A file handle to read from.  Caller is responsible for opening and
      closing it.
    """
    _constructor = _constructor or Template

    options = {}

    # Parse lines until the first one that doesn't look like an option
    while 1:
        line = f.readline()
        match = _OPTION_RE.match(line)
        if match:
            name, value = match.group(1), match.group(2)

            # Accept something like 'Default-Formatter: raw'.  This syntax is like
            # HTTP/E-mail headers.
            name = name.lower()

            if name in _OPTION_NAMES:
                name = name.replace('-', '_')
                value = value.strip()
                if name == 'default_formatter' and value.lower() == 'none':
                    value = None
                options[name] = value
            else:
                break
        else:
            break

    if options:
        if line.strip():
            raise CompilationError(
                'Must be one blank line between template options and body (got %r)'
                % line)
        body = f.read()
    else:
        # There were no options, so no blank line is necessary.
        body = line + f.read()

    return _constructor(body, more_formatters=more_formatters, **options)


[docs]class Template(object):

    """Represents a compiled template.

    Like many template systems, the template string is compiled into a program,
    and then it can be expanded any number of times.  For example, in a web app,
    you can compile the templates once at server startup, and use the expand()
    method at request handling time.  expand() uses the compiled representation.

    There are various options for controlling parsing -- see CompileTemplate.
    Don't go crazy with metacharacters.  {}, [], {{}} or <> should cover nearly
    any circumstance, e.g. generating HTML, CSS XML, JavaScript, C programs, text
    files, etc.
    """

    def __init__(self, template_str, builder=None, undefined_str=None,
                 **compile_options):
        """
        Args:
          template_str: The template string.
          undefined_str: A string to appear in the output when a variable to be
              substituted is missing.  If None, UndefinedVariable is raised.
              (Note: This is not really a compilation option, because affects
              template expansion rather than compilation.  Nonetheless we make it a
              constructor argument rather than an .expand() argument for
              simplicity.)

        It also accepts all the compile options that CompileTemplate does.
        """
        self._program = CompileTemplate(
            template_str, builder=builder, **compile_options)
        self.undefined_str = undefined_str

    #
    # Public API
    #

[docs]    def render(self, data_dict, callback):
        """Low level method to expands the template piece by piece.

        Args:
          data_dict: The JSON data dictionary.
          callback: A callback which should be called with each expanded token.

        Example: You can pass 'f.write' as the callback to write directly to a file
        handle.
        """
        context = _ScopedContext(data_dict, self.undefined_str)
        _Execute(self._program.Statements(), context, callback)

[docs]    def expand(self, *args, **kwargs):
        """Expands the template with the given data dictionary, returning a string.

        This is a small wrapper around render(), and is the most convenient
        interface.

        Args:
          The JSON data dictionary.  Like the builtin dict() constructor, it can
          take a single dictionary as a positional argument, or arbitrary keyword
          arguments.

        Returns:
          The return value could be a str() or unicode() instance, depending on the
          the type of the template string passed in, and what the types the strings
          in the dictionary are.
        """
        if args:
            if len(args) == 1:
                data_dict = args[0]
            else:
                raise TypeError(
                    'expand() only takes 1 positional argument (got %s)' % args)
        else:
            data_dict = kwargs

        tokens = []
        self.render(data_dict, tokens.append)
        return ''.join(tokens)

[docs]    def tokenstream(self, data_dict):
        """Yields a list of tokens resulting from expansion.

        This may be useful for WSGI apps.  NOTE: In the current implementation, the
        entire expanded template must be stored memory.

        NOTE: This is a generator, but JavaScript doesn't have generators.
        """
        tokens = []
        self.render(data_dict, tokens.append)
        for token in tokens:
            yield token


def _DoRepeatedSection(args, context, callback):
    """{repeated section foo}"""

    block = args

    items = context.PushSection(block.section_name)
    # TODO: if 'items' is a dictionary, allow @name and @value.

    if items:
        if not isinstance(items, list):
            raise EvaluationError('Expected a list; got %s' % type(items))

        last_index = len(items) - 1
        statements = block.Statements()
        alt_statements = block.Statements('alternates with')
        try:
            i = 0
            while True:
                context.Next()
                # Execute the statements in the block for every item in the list.
                # Execute the alternate block on every iteration except the last.  Each
                # item could be an atom (string, integer, etc.) or a dictionary.
                _Execute(statements, context, callback)
                if i != last_index:
                    _Execute(alt_statements, context, callback)
                i += 1
        except StopIteration:
            pass

    else:
        _Execute(block.Statements('or'), context, callback)

    context.Pop()


def _DoSection(args, context, callback):
    """{section foo}"""

    block = args
    # If a section present and "true", push the dictionary onto the stack as the
    # new context, and show it
    if context.PushSection(block.section_name):
        _Execute(block.Statements(), context, callback)
        context.Pop()
    else:  # missing or "false" -- show the {.or} section
        context.Pop()
        _Execute(block.Statements('or'), context, callback)


def _DoPredicates(args, context, callback):
    """{.predicate?}

    Here we execute the first clause that evaluates to true, and then stop.
    """
    block = args
    value = context.Lookup('@')
    for (predicate, args, func_type), statements in block.clauses:
        if func_type == ENHANCED_FUNC:
            do_clause = predicate(value, context, args)
        else:
            do_clause = predicate(value)

        if do_clause:
            _Execute(statements, context, callback)
            break


def _DoSubstitute(args, context, callback):
    """Variable substitution, e.g. {foo}"""

    name, formatters = args

    # So we can have {.section is_new}new since {@}{.end}.  Hopefully this idiom
    # is OK.
    if name == '@':
        value = context.Lookup('@')
    else:
        try:
            value = context.Lookup(name)
        except TypeError, e:
            raise EvaluationError(
                'Error evaluating %r in context %r: %r' % (name, context, e))

    for func, args, func_type in formatters:
        try:
            if func_type == ENHANCED_FUNC:
                value = func(value, context, args)
            else:
                value = func(value)
        except KeyboardInterrupt:
            raise
        except Exception, e:
            raise EvaluationError(
                'Formatting value %r with formatter %s raised exception: %r' %
                (value, formatters, e), original_exception=e)

    # TODO: Require a string/unicode instance here?
    if value is None:
        raise EvaluationError('Evaluating %r gave None value' % name)
    callback(value)


def _Execute(statements, context, callback):
    """Execute a bunch of template statements in a ScopedContext.

    Args:
      callback: Strings are "written" to this callback function.

    This is called in a mutually recursive fashion.
    """

    for i, statement in enumerate(statements):
        if isinstance(statement, basestring):
            callback(statement)
        else:
            # In the case of a substitution, args is a pair (name, formatters).
            # In the case of a section, it's a _Section instance.
            try:
                func, args = statement
                func(args, context, callback)
            except UndefinedVariable, e:
                # Show context for statements
                start = max(0, i - 3)
                end = i + 3
                e.near = statements[start:end]
                raise


[docs]def expand(template_str, dictionary, **kwargs):
    """Free function to expands a template string with a data dictionary.

    This is useful for cases where you don't care about saving the result of
    compilation (similar to re.match('.*', s) vs DOT_STAR.match(s))
    """
    t = Template(template_str, **kwargs)
    return t.expand(dictionary)