| # -*- coding: utf-8 -*- |
| """ |
| jinja2.utils |
| ~~~~~~~~~~~~ |
| |
| Utility functions. |
| |
| :copyright: 2008 by Armin Ronacher. |
| :license: BSD, see LICENSE for more details. |
| """ |
| import re |
| import string |
| from collections import deque |
| from copy import deepcopy |
| from functools import update_wrapper |
| from itertools import imap |
| |
| |
# Splits text on runs of whitespace; the capturing group keeps the
# whitespace runs in the result so the text can be re-joined unchanged.
_word_split_re = re.compile(r'(\s+)')

# Splits a single word into leading punctuation, the middle part and
# trailing punctuation.  Both the raw angle brackets and their HTML
# entity forms (``&lt;`` / ``&gt;``) count as punctuation.
_punctuation_re = re.compile(
    '^(?P<lead>(?:%s)*)(?P<middle>.*?)(?P<trail>(?:%s)*)$' % (
        '|'.join([re.escape(x) for x in ('(', '<', '&lt;')]),
        '|'.join([re.escape(x) for x in ('.', ',', ')', '>', '\n', '&gt;')])
    )
)

# Very loose check for something that looks like an e-mail address:
# no whitespace before the ``@`` and at least one dot in the host part.
_simple_email_re = re.compile(r'^\S+@[a-zA-Z0-9._-]+\.[a-zA-Z0-9._-]+$')
| |
| |
def import_string(import_name, silent=False):
    """Import an object based on a string.  This is useful if you want to
    use import paths as endpoints or something similar.  An import path can
    be specified either in dotted notation (``xml.sax.saxutils.escape``)
    or with a colon as object delimiter (``xml.sax.saxutils:escape``).
    A name without a dot or colon is imported as a plain module.

    If `silent` is True the return value will be `None` if the import
    fails with an `ImportError` or `AttributeError`; otherwise that
    exception is re-raised.

    :return: imported object
    """
    try:
        if ':' in import_name:
            module_name, attr = import_name.split(':', 1)
        elif '.' in import_name:
            # everything before the last dot is the module path
            module_name, attr = import_name.rsplit('.', 1)
        else:
            return __import__(import_name)
        # a non-empty fromlist makes __import__ return the leaf module
        # instead of the top-level package
        module = __import__(module_name, None, None, [attr])
        return getattr(module, attr)
    except (ImportError, AttributeError):
        if silent:
            return None
        raise
| |
| |
def pformat(obj, verbose=False):
    """Pretty-print an object and return the result as a string.

    The `pretty` library is used when it can be imported (`verbose` is
    passed on to it); otherwise the builtin `pprint` module is used and
    `verbose` is ignored.
    """
    try:
        from pretty import pretty as pretty_format
        # the call stays inside the ``try`` so an ImportError raised while
        # formatting also falls back to pprint
        result = pretty_format(obj, verbose=verbose)
    except ImportError:
        import pprint
        result = pprint.pformat(obj)
    return result
| |
| |
def urlize(text, trim_url_limit=None, nofollow=False):
    """Converts any URLs in text into clickable links.  Works on http://,
    https:// and www. links as well as bare ``.org``/``.net``/``.com``
    names and simple e-mail addresses.  Links can have trailing
    punctuation (periods, commas, close-parens) and leading punctuation
    (opening parens) and it'll still do the right thing.

    If trim_url_limit is not None, the URLs in link text will be limited
    to trim_url_limit characters; ``...`` is appended only when the URL
    was actually shortened.

    If nofollow is True, the generated http/https links will get a
    rel="nofollow" attribute (``mailto:`` links never do).

    The words are inserted into the generated markup as they are; this
    function does not escape them.

    :return: the text with links inserted, as unicode string
    """
    def trim_url(url, limit=trim_url_limit):
        # only shorten (and mark with an ellipsis) when something is cut
        if limit is None or len(url) <= limit:
            return url
        return url[:limit] + '...'

    if nofollow:
        nofollow_attr = ' rel="nofollow"'
    else:
        nofollow_attr = ''
    # characters a bare domain name may start with
    domain_start_chars = string.letters + string.digits

    # the split keeps the whitespace runs, so joining gives back the text
    words = _word_split_re.split(text)
    for i, word in enumerate(words):
        match = _punctuation_re.match(word)
        if not match:
            continue
        lead, middle, trail = match.groups()

        # "www.example.com" or a bare "example.com" style name.  Words
        # that already carry a scheme are excluded here, otherwise
        # "https://example.com" would end up as "http://https://...".
        if middle.startswith('www.') or (
            '@' not in middle and
            not middle.startswith('http://') and
            not middle.startswith('https://') and
            len(middle) > 0 and
            middle[0] in domain_start_chars and (
                middle.endswith('.org') or
                middle.endswith('.net') or
                middle.endswith('.com')
            )):
            middle = '<a href="http://%s"%s>%s</a>' % (
                middle, nofollow_attr, trim_url(middle))

        # words with an explicit scheme are linked as they are
        if middle.startswith('http://') or \
           middle.startswith('https://'):
            middle = '<a href="%s"%s>%s</a>' % (
                middle, nofollow_attr, trim_url(middle))

        # e-mail addresses; the ':' test skips already generated links
        if '@' in middle and not middle.startswith('www.') and \
           ':' not in middle and _simple_email_re.match(middle):
            middle = '<a href="mailto:%s">%s</a>' % (middle, middle)

        if lead + middle + trail != word:
            words[i] = lead + middle + trail
    return u''.join(words)
| |
| |
class Markup(unicode):
    """Marks a string as being safe for inclusion in HTML/XML output without
    needing to be escaped.  This implements the `__html__` interface a couple
    of frameworks and web applications use.

    The `escape` function returns markup objects so that double escaping can't
    happen.  If you want to use autoescaping in Jinja just set the finalizer
    of the environment to `escape`.

    Operations that combine a markup object with other strings (``+``,
    ``%``, `join`, `replace`, ...) escape the other operands and return
    markup objects again.
    """
    __slots__ = ()

    def __html__(self):
        return self

    def __add__(self, other):
        # strings and objects with an `__html__` method are escaped before
        # they are concatenated; everything else is left to the other operand
        if hasattr(other, '__html__') or isinstance(other, basestring):
            return self.__class__(unicode(self) + unicode(escape(other)))
        return NotImplemented

    def __radd__(self, other):
        if hasattr(other, '__html__') or isinstance(other, basestring):
            return self.__class__(unicode(escape(other)) + unicode(self))
        return NotImplemented

    def __mul__(self, num):
        if not isinstance(num, (int, long)):
            return NotImplemented
        return self.__class__(unicode.__mul__(self, num))
    __rmul__ = __mul__

    def __mod__(self, arg):
        # wrap the arguments so that they are escaped when the format
        # operation converts them into strings
        if isinstance(arg, tuple):
            arg = tuple(imap(_MarkupEscapeHelper, arg))
        else:
            arg = _MarkupEscapeHelper(arg)
        return self.__class__(unicode.__mod__(self, arg))

    def __repr__(self):
        return '%s(%s)' % (
            self.__class__.__name__,
            unicode.__repr__(self)
        )

    def join(self, seq):
        return self.__class__(unicode.join(self, imap(escape, seq)))
    join.__doc__ = unicode.join.__doc__

    def split(self, *args, **kwargs):
        return map(self.__class__, unicode.split(self, *args, **kwargs))
    split.__doc__ = unicode.split.__doc__

    def rsplit(self, *args, **kwargs):
        return map(self.__class__, unicode.rsplit(self, *args, **kwargs))
    rsplit.__doc__ = unicode.rsplit.__doc__

    def splitlines(self, *args, **kwargs):
        return map(self.__class__, unicode.splitlines(self, *args, **kwargs))
    splitlines.__doc__ = unicode.splitlines.__doc__

    def make_wrapper(name):
        """Create a method that calls the `unicode` method `name` with
        escaped string arguments and converts the result back into the
        markup class.
        """
        orig = getattr(unicode, name)
        def func(self, *args, **kwargs):
            args = list(args)
            for idx, arg in enumerate(args):
                if hasattr(arg, '__html__') or isinstance(arg, basestring):
                    args[idx] = escape(arg)
            # iterate over a copy of the items, the dict is updated in place
            for key, arg in kwargs.items():
                if hasattr(arg, '__html__') or isinstance(arg, basestring):
                    kwargs[key] = escape(arg)
            rv = orig(self, *args, **kwargs)
            # `partition` and `rpartition` return a tuple of strings; wrap
            # every part instead of turning the tuple itself into a string
            if isinstance(rv, tuple):
                return tuple(map(self.__class__, rv))
            return self.__class__(rv)
        return update_wrapper(func, orig, ('__name__', '__doc__'))

    # the class body namespace is filled with the generated wrappers
    for method in '__getitem__', '__getslice__', 'capitalize', \
                  'title', 'lower', 'upper', 'replace', 'ljust', \
                  'rjust', 'lstrip', 'rstrip', 'partition', 'center', \
                  'strip', 'translate', 'expandtabs', 'rpartition', \
                  'swapcase', 'zfill':
        locals()[method] = make_wrapper(method)
    # the helpers must not end up as class attributes
    del method, make_wrapper
| |
| |
class _MarkupEscapeHelper(object):
    """Helper for Markup.__mod__

    Wraps a format argument so that its string conversions go through
    `escape`, while the numeric conversions use the wrapped object
    directly.
    """

    def __init__(self, obj):
        self.obj = obj

    def __getitem__(self, item):
        # looked up items are wrapped again so they are escaped as well
        return _MarkupEscapeHelper(self.obj[item])

    def __unicode__(self):
        return unicode(escape(self.obj))

    def __str__(self):
        return str(escape(self.obj))

    def __repr__(self):
        return str(repr(escape(self.obj)))

    def __int__(self):
        return int(self.obj)

    def __float__(self):
        return float(self.obj)
| |
| |
class LRUCache(object):
    """A simple LRU Cache implementation.

    The values are stored in a dict and the keys additionally in a deque
    ordered by usage: the least recently used key is on the left, the
    most recently used one on the right.
    """
    # this is fast for small capacities (something around 200) but doesn't
    # scale.  But as long as it's only used for the database connections in
    # a non request fallback it's fine.

    def __init__(self, capacity):
        self.capacity = capacity
        self._mapping = {}
        self._queue = deque()

        # alias all queue methods for faster lookup.  The aliases are bound
        # to this very deque object, so `_queue` must never be rebound.
        self._popleft = self._queue.popleft
        self._pop = self._queue.pop
        if hasattr(self._queue, 'remove'):
            self._remove = self._queue.remove
        self._append = self._queue.append

    def _remove(self, obj):
        """Python 2.4 compatibility."""
        for idx, item in enumerate(self._queue):
            if item == obj:
                del self._queue[idx]
                break

    def copy(self):
        """Return a shallow copy of the instance."""
        rv = self.__class__(self.capacity)
        rv._mapping.update(self._mapping)
        # fill the deque of the copy in place; assigning a new deque would
        # leave the method aliases bound to the old, empty one
        rv._queue.extend(self._queue)
        return rv

    def get(self, key, default=None):
        """Return an item from the cache dict or `default`"""
        try:
            return self[key]
        except KeyError:
            return default

    def setdefault(self, key, default=None):
        """Set `default` if the key is not in the cache otherwise
        leave unchanged.  Return the value of this key.
        """
        try:
            return self[key]
        except KeyError:
            self[key] = default
            return default

    def clear(self):
        """Clear the cache."""
        self._mapping.clear()
        self._queue.clear()

    def __contains__(self, key):
        """Check if a key exists in this cache."""
        return key in self._mapping

    def __len__(self):
        """Return the current size of the cache."""
        return len(self._mapping)

    def __repr__(self):
        return '<%s %r>' % (
            self.__class__.__name__,
            self._mapping
        )

    def __getitem__(self, key):
        """Get an item from the cache.  Moves the item up so that it has the
        highest priority then.

        Raise a `KeyError` if it does not exist.
        """
        rv = self._mapping[key]
        # nothing to reorder if the key is already the most recent one
        if self._queue[-1] != key:
            self._remove(key)
            self._append(key)
        return rv

    def __setitem__(self, key, value):
        """Sets the value for an item.  Moves the item up so that it
        has the highest priority then.  If the cache is full the least
        recently used item is dropped.
        """
        if key in self._mapping:
            self._remove(key)
        elif len(self._mapping) == self.capacity:
            del self._mapping[self._popleft()]
        self._append(key)
        self._mapping[key] = value

    def __delitem__(self, key):
        """Remove an item from the cache dict.
        Raise a `KeyError` if it does not exist.
        """
        del self._mapping[key]
        self._remove(key)

    def __iter__(self):
        """Iterate over all keys in the cache dict, ordered by
        the most recent usage.
        """
        return reversed(self._queue)

    def __reversed__(self):
        """Iterate over the keys in the cache dict, oldest items
        coming first.
        """
        return iter(self._queue)

    __copy__ = copy
| |
| |
# we have to import it down here as the speedups module imports the
# markup type which is defined above.
try:
    from jinja2._speedups import escape, soft_unicode
except ImportError:
    def escape(obj):
        """Convert the characters &, <, >, and " in string s to HTML-safe
        sequences.  Use this if you need to display text that might contain
        such characters in HTML.

        Objects with an `__html__` method are not escaped, the return
        value of that method is returned instead.  Everything else is
        converted to unicode first.

        :return: the escaped string as `Markup` object
        """
        if hasattr(obj, '__html__'):
            return obj.__html__()
        # the ampersand has to be replaced first, otherwise the ampersands
        # of the entities inserted below would be escaped again
        return Markup(unicode(obj)
            .replace('&', '&amp;')
            .replace('>', '&gt;')
            .replace('<', '&lt;')
            .replace('"', '&quot;')
        )

    def soft_unicode(s):
        """Make a string unicode if it isn't already.  That way a markup
        string is not converted back to unicode.
        """
        if not isinstance(s, unicode):
            s = unicode(s)
        return s