blob: 1d888a2ab20a1ab6eefcd0aaa53138d82adaee85 [file] [log] [blame]
# -*- coding: utf-8 -*-
"""
    jinja2.ext
    ~~~~~~~~~~

    Jinja extensions allow adding custom tags, similar to the way Django
    custom tags work.  By default two example extensions exist: an i18n and
    a cache extension.

    :copyright: (c) 2010 by the Jinja Team.
    :license: BSD.
"""
Armin Ronacherb5124e62008-04-25 00:36:14 +020013from collections import deque
Armin Ronacher05530932008-04-20 13:27:49 +020014from jinja2 import nodes
Armin Ronacher4f5008f2008-05-23 23:36:07 +020015from jinja2.defaults import *
Armin Ronacher4f77a302010-07-01 12:15:39 +020016from jinja2.environment import Environment
Armin Ronacher2feed1d2008-04-26 16:26:52 +020017from jinja2.runtime import Undefined, concat
Benjamin Wieganda3152742008-04-28 18:07:52 +020018from jinja2.exceptions import TemplateAssertionError, TemplateSyntaxError
Armin Ronacherbd357722009-08-05 20:25:06 +020019from jinja2.utils import contextfunction, import_string, Markup, next
Armin Ronacherb5124e62008-04-25 00:36:14 +020020
21
# The only really useful gettext functions for a Jinja template.  Note
# that ugettext must be assigned to gettext, as Jinja doesn't support
# non-unicode strings.  This tuple is the default set of function names
# that the extraction helpers in this module look for.
GETTEXT_FUNCTIONS = ('_', 'gettext', 'ngettext')
Armin Ronacher05530932008-04-20 13:27:49 +020026
27
class ExtensionRegistry(type):
    """Metaclass that gives every extension class a unique identifier.

    The identifier is the module name and the class name joined by a dot
    and is stored on the freshly created class as ``identifier``.
    """

    def __new__(cls, name, bases, d):
        new_class = type.__new__(cls, name, bases, d)
        # the dotted import name doubles as the unique id of the class
        new_class.identifier = '%s.%s' % (new_class.__module__,
                                          new_class.__name__)
        return new_class
35
36
class Extension(object):
    """Base class for extensions that add functionality to the Jinja
    template system at the parser level.

    An extension is bound to one environment but must not keep environment
    specific data on `self`: for overlays an extension gets rebound by
    copying it and reassigning its `environment` attribute (see
    :meth:`bind`).

    Because the environment instantiates extensions itself, they cannot
    take configuration arguments.  A factory function is not a way around
    that because extensions are identified by their import name.  Store
    configuration values on the environment instead.  As the environment
    then acts as the central configuration storage, attribute names may
    clash, so pick names that are not too generic.  ``prefix`` for example
    is a terrible name, ``fragment_cache_prefix`` on the other hand is a
    good name as it includes the name of the extension (fragment cache).
    """
    __metaclass__ = ExtensionRegistry

    #: the set of tag names this extension wants to parse (if it parses
    #: anything at all).
    tags = set()

    #: the priority of the extension.  Mostly interesting for extensions
    #: that preprocess values.  A lower value means higher priority.
    #:
    #: .. versionadded:: 2.4
    priority = 100

    def __init__(self, environment):
        self.environment = environment

    def bind(self, environment):
        """Return a copy of this extension that is bound to `environment`.

        The copy is made without running ``__init__`` again; the instance
        dictionary is copied over and only `environment` is replaced.
        """
        clone = object.__new__(self.__class__)
        clone.__dict__.update(self.__dict__)
        clone.environment = environment
        return clone

    def preprocess(self, source, name, filename=None):
        """Hook that runs before the actual lexing and may rewrite the
        template source.  `filename` is optional.  Whatever is returned is
        used as the preprocessed source; the default implementation hands
        `source` back untouched.
        """
        return source

    def filter_stream(self, stream):
        """Hook that receives a :class:`~jinja2.lexer.TokenStream` and may
        filter the tokens in it.  The return value has to be an iterable of
        :class:`~jinja2.lexer.Token` objects, but it does not have to be a
        :class:`~jinja2.lexer.TokenStream`.  The default implementation
        returns `stream` unchanged.

        In the `ext` folder of the Jinja2 source distribution there is a
        file called `inlinegettext.py` which implements a filter that
        utilizes this method.
        """
        return stream

    def parse(self, parser):
        """Called with the parser as first argument whenever one of the
        :attr:`tags` matched.  The token the parser stream points at is the
        name token that matched.  Implementations have to return one node
        or a list of multiple nodes; the base class raises
        :exc:`NotImplementedError`.
        """
        raise NotImplementedError()

    def attr(self, name, lineno=None):
        """Return an attribute node for the current extension.  This is
        useful to pass constants on extensions to generated template code.

        ::

            self.attr('_my_attribute', lineno=lineno)
        """
        return nodes.ExtensionAttribute(self.identifier, name, lineno=lineno)

    def call_method(self, name, args=None, kwargs=None, dyn_args=None,
                    dyn_kwargs=None, lineno=None):
        """Build a node that calls a method of the extension.  This is a
        shortcut for :meth:`attr` + :class:`jinja2.nodes.Call`.  `args` and
        `kwargs` default to empty lists when left out.
        """
        method = self.attr(name, lineno=lineno)
        if kwargs is None:
            kwargs = []
        if args is None:
            args = []
        return nodes.Call(method, args, kwargs, dyn_args, dyn_kwargs,
                          lineno=lineno)
125
Armin Ronacher05530932008-04-20 13:27:49 +0200126
@contextfunction
def _gettext_alias(__context, *args, **kwargs):
    """Context function installed as ``_``: look up whatever ``gettext``
    resolves to in the context and call it with the given arguments.
    """
    target = __context.resolve('gettext')
    return __context.call(target, *args, **kwargs)
Armin Ronacher4da90342010-05-29 17:35:10 +0200130
131
def _make_new_gettext(func):
    """Wrap the gettext callable `func` into a newstyle gettext context
    function.

    The returned function translates the string through the context,
    wraps the result in :class:`Markup` if the evaluation context has
    autoescaping enabled and finally expands the keyword arguments into
    the translated string with the ``%`` operator.
    """
    @contextfunction
    def gettext(__context, __string, **variables):
        translated = __context.call(func, __string)
        if __context.eval_ctx.autoescape:
            translated = Markup(translated)
        return translated % variables
    return gettext
140
141
def _make_new_ngettext(func):
    """Wrap the ngettext callable `func` into a newstyle ngettext context
    function.

    The returned function translates through the context, wraps the
    result in :class:`Markup` if the evaluation context has autoescaping
    enabled and then expands the keyword arguments with the ``%``
    operator.  The count is made available to the format string as
    ``num`` unless the caller passed a ``num`` keyword explicitly.
    """
    @contextfunction
    def ngettext(__context, __singular, __plural, __num, **variables):
        translated = __context.call(func, __singular, __plural, __num)
        if __context.eval_ctx.autoescape:
            translated = Markup(translated)
        # an explicitly passed ``num`` wins over the plural count
        variables.setdefault('num', __num)
        return translated % variables
    return ngettext
Armin Ronacher5c047ea2008-05-23 22:26:45 +0200151
152
class InternationalizationExtension(Extension):
    """This extension adds gettext support to Jinja2."""
    tags = set(['trans'])

    # TODO: the i18n extension is currently reevaluating values in a few
    # situations.  Take this example:
    #   {% trans count=something() %}{{ count }} foo{% pluralize
    #     %}{{ count }} fooss{% endtrans %}
    # something is called twice here.  One time for the gettext value and
    # the other time for the n-parameter of the ngettext function.

    def __init__(self, environment):
        """Register the ``_`` alias and the i18n helper methods on the
        environment.
        """
        Extension.__init__(self, environment)
        environment.globals['_'] = _gettext_alias
        hooks = dict(
            install_gettext_translations=self._install,
            install_null_translations=self._install_null,
            install_gettext_callables=self._install_callables,
            uninstall_gettext_translations=self._uninstall,
            extract_translations=self._extract,
            newstyle_gettext=False
        )
        environment.extend(**hooks)

    def _install(self, translations, newstyle=None):
        """Install the callables of a translations object, preferring its
        ``ugettext``/``ungettext`` methods over ``gettext``/``ngettext``
        when they exist.
        """
        def pick(preferred, fallback):
            func = getattr(translations, preferred, None)
            if func is None:
                func = getattr(translations, fallback)
            return func

        gettext = pick('ugettext', 'gettext')
        ngettext = pick('ungettext', 'ngettext')
        self._install_callables(gettext, ngettext, newstyle)

    def _install_null(self, newstyle=None):
        """Install callables that do not translate: gettext returns its
        argument and ngettext returns the plural form whenever the number
        is not 1.
        """
        def null_gettext(x):
            return x

        def null_ngettext(s, p, n):
            if n != 1:
                return p
            return s

        self._install_callables(null_gettext, null_ngettext, newstyle)

    def _install_callables(self, gettext, ngettext, newstyle=None):
        """Store `gettext` and `ngettext` in the environment globals.  If
        `newstyle` is not `None` it first updates the environment's
        ``newstyle_gettext`` flag; when that flag is set the callables are
        wrapped into their newstyle versions before being installed.
        """
        env = self.environment
        if newstyle is not None:
            env.newstyle_gettext = newstyle
        if env.newstyle_gettext:
            gettext = _make_new_gettext(gettext)
            ngettext = _make_new_ngettext(ngettext)
        env.globals.update(gettext=gettext, ngettext=ngettext)

    def _uninstall(self, translations):
        """Remove ``gettext`` and ``ngettext`` from the environment
        globals.  The `translations` argument is not used.
        """
        installed = self.environment.globals
        for key in ('gettext', 'ngettext'):
            installed.pop(key, None)

    def _extract(self, source, gettext_functions=GETTEXT_FUNCTIONS):
        """Extract translatable strings from `source`, which is either a
        string (parsed with the environment first) or an already parsed
        node.
        """
        tree = source
        if isinstance(tree, basestring):
            tree = self.environment.parse(tree)
        return extract_from_ast(tree, gettext_functions)

    def parse(self, parser):
        """Parse a translatable tag."""
        stream = parser.stream
        lineno = next(stream).lineno
        num_called_num = False

        # collect all the variables listed in the tag itself.  A variable
        # can also be introduced by the body of the trans block, but that
        # is handled further down.
        plural_expr = None
        variables = {}
        while stream.current.type != 'block_end':
            if variables:
                stream.expect('comma')

            # skip colon for python compatibility
            if stream.skip_if('colon'):
                break

            token = stream.expect('name')
            key = token.value
            if key in variables:
                parser.fail('translatable variable %r defined twice.' %
                            key, token.lineno,
                            exc=TemplateAssertionError)

            # either ``name=expression`` or just a plain name
            if stream.current.type == 'assign':
                next(stream)
                expr = parser.parse_expression()
            else:
                expr = nodes.Name(key, 'load')
            variables[key] = expr

            # the first variable is the default pluralization expression
            if plural_expr is None:
                num_called_num = key == 'num'
                if isinstance(expr, nodes.Call):
                    plural_expr = nodes.Name(key, 'load')
                else:
                    plural_expr = expr

        stream.expect('block_end')

        plural = plural_names = None
        have_plural = False
        referenced = set()

        # now parse until endtrans or pluralize
        singular_names, singular = self._parse_block(parser, True)
        if singular_names:
            referenced.update(singular_names)
            if plural_expr is None:
                first_name = singular_names[0]
                plural_expr = nodes.Name(first_name, 'load')
                num_called_num = first_name == 'num'

        # if we have a pluralize block, we parse that too
        if stream.current.test('name:pluralize'):
            have_plural = True
            next(stream)
            if stream.current.type != 'block_end':
                token = stream.expect('name')
                key = token.value
                if key not in variables:
                    parser.fail('unknown variable %r for pluralization' %
                                key, token.lineno,
                                exc=TemplateAssertionError)
                plural_expr = variables[key]
                num_called_num = key == 'num'
            stream.expect('block_end')
            plural_names, plural = self._parse_block(parser, False)
            referenced.update(plural_names)

        # in both cases the stream now points at the ``endtrans`` name
        # token that ended the last block; step over it.
        next(stream)

        # register free names as simple name expressions
        for var in referenced:
            if var not in variables:
                variables[var] = nodes.Name(var, 'load')

        if not have_plural:
            plural_expr = None
        elif plural_expr is None:
            parser.fail('pluralize without variables', lineno)

        node = self._make_node(singular, plural, variables, plural_expr,
                               bool(referenced),
                               num_called_num and have_plural)
        node.set_lineno(lineno)
        return node

    def _parse_block(self, parser, allow_pluralize):
        """Parse until the next block tag with a given name.

        Returns a tuple of the list of variable names referenced in the
        block and the block contents as a ``%``-style format string.
        Parsing stops at ``endtrans``, or at ``pluralize`` if
        `allow_pluralize` is true; the stream is left pointing at that
        name token.
        """
        stream = parser.stream
        names = []
        pieces = []
        while True:
            kind = stream.current.type
            if kind == 'data':
                # literal percent signs must survive string formatting
                pieces.append(stream.current.value.replace('%', '%%'))
                next(stream)
            elif kind == 'variable_begin':
                next(stream)
                name = stream.expect('name').value
                names.append(name)
                pieces.append('%%(%s)s' % name)
                stream.expect('variable_end')
            elif kind == 'block_begin':
                next(stream)
                if stream.current.test('name:endtrans'):
                    break
                elif stream.current.test('name:pluralize'):
                    if allow_pluralize:
                        break
                    parser.fail('a translatable section can have only one '
                                'pluralize section')
                parser.fail('control structures in translatable sections are '
                            'not allowed')
            elif stream.eos:
                parser.fail('unclosed translation block')
            else:
                assert False, 'internal parser error'

        return names, concat(pieces)

    def _make_node(self, singular, plural, variables, plural_expr,
                   vars_referenced, num_called_num):
        """Generates a useful node from the data provided."""
        newstyle = self.environment.newstyle_gettext

        # the block parser doubled every percent sign.  Old style gettext
        # invocations only run string formatting if there are variables,
        # so undo the escaping when no variable is referenced.
        if not (vars_referenced or newstyle):
            singular = singular.replace('%%', '%')
            if plural:
                plural = plural.replace('%%', '%')

        if plural_expr is None:
            # singular only
            func_name = 'gettext'
            call_args = [nodes.Const(singular)]
        else:
            # singular and plural
            func_name = 'ngettext'
            call_args = [
                nodes.Const(singular),
                nodes.Const(plural),
                plural_expr
            ]
        node = nodes.Call(nodes.Name(func_name, 'load'), call_args,
                          [], None, None)

        if newstyle:
            # newstyle gettext functions take care of the variable
            # expansion and the autoescape handling themselves, so the
            # variables are simply passed as keyword arguments.
            for key, value in variables.items():
                # the function adds that later anyways in case num was
                # called num, so just skip it.
                if not (num_called_num and key == 'num'):
                    node.kwargs.append(nodes.Keyword(key, value))
        else:
            # mark the return value as safe if we are in an
            # environment with autoescaping turned on, then expand the
            # variables with the ``%`` operator.
            node = nodes.MarkSafeIfAutoescape(node)
            if variables:
                pairs = [
                    nodes.Pair(nodes.Const(key), value)
                    for key, value in variables.items()
                ]
                node = nodes.Mod(node, nodes.Dict(pairs))
        return nodes.Output([node])
378
379
class ExprStmtExtension(Extension):
    """Adds a `do` tag to Jinja2 that works like the print statement just
    that it doesn't print the return value.
    """
    tags = set(['do'])

    def parse(self, parser):
        """Consume the ``do`` token and wrap the tuple expression that
        follows it into an expression statement node.
        """
        tag = next(parser.stream)
        stmt = nodes.ExprStmt(lineno=tag.lineno)
        stmt.node = parser.parse_tuple()
        return stmt
390
391
class LoopControlExtension(Extension):
    """Adds break and continue to the template engine."""
    tags = set(['break', 'continue'])

    def parse(self, parser):
        """Turn the matched tag into a break node if its value is
        ``break`` and into a continue node otherwise.
        """
        tag = next(parser.stream)
        node_class = nodes.Continue
        if tag.value == 'break':
            node_class = nodes.Break
        return node_class(lineno=tag.lineno)
401
402
class WithExtension(Extension):
    """Adds support for a django-like with block."""
    tags = set(['with'])

    def parse(self, parser):
        """Parse ``with target = expr, ...`` up to ``endwith`` into a
        scope node whose body starts with the assignments, followed by
        the statements of the block.
        """
        stream = parser.stream
        scope = nodes.Scope(lineno=next(stream).lineno)
        assignments = []
        while stream.current.type != 'block_end':
            lineno = stream.current.lineno
            # every assignment but the first is preceded by a comma
            if assignments:
                stream.expect('comma')
            target = parser.parse_assign_target()
            stream.expect('assign')
            expr = parser.parse_expression()
            assignments.append(nodes.Assign(target, expr, lineno=lineno))
        statements = parser.parse_statements(('name:endwith',),
                                             drop_needle=True)
        scope.body = assignments + list(statements)
        return scope
422
423
class AutoEscapeExtension(Extension):
    """Changes auto escape rules for a scope."""
    tags = set(['autoescape'])

    def parse(self, parser):
        """Parse ``autoescape <expression>`` up to ``endautoescape`` into
        a scoped eval context modifier that sets the ``autoescape`` option
        to the parsed expression, wrapped in its own scope.
        """
        tag = next(parser.stream)
        modifier = nodes.ScopedEvalContextModifier(lineno=tag.lineno)
        setting = parser.parse_expression()
        modifier.options = [nodes.Keyword('autoescape', setting)]
        modifier.body = parser.parse_statements(('name:endautoescape',),
                                                drop_needle=True)
        return nodes.Scope([modifier])
436
437
def extract_from_ast(node, gettext_functions=GETTEXT_FUNCTIONS,
                     babel_style=True):
    """Extract localizable strings from the given template node.

    Every call to a plain name listed in `gettext_functions` is
    inspected.  Per default matches are returned in babel style: constant
    string arguments are returned as they are, every other positional
    argument, every keyword argument and the dynamic ``*args`` /
    ``**kwargs`` are returned as `None`.  This allows Babel to figure out
    what you really meant if you are using gettext functions that allow
    keyword arguments for placeholder expansion.  A call with exactly one
    argument yields the bare value, anything else yields a tuple.

    If you don't want that behavior set the `babel_style` parameter to
    `False`.  Then only the strings are returned, always stored in a
    tuple, and calls that are left without any string are skipped.

    This example explains the behavior:

    >>> from jinja2 import Environment
    >>> env = Environment()
    >>> node = env.parse('{{ (_("foo"), _(), ngettext("foo", "bar", 42)) }}')
    >>> list(extract_from_ast(node))
    [(1, '_', 'foo'), (1, '_', ()), (1, 'ngettext', ('foo', 'bar', None))]
    >>> list(extract_from_ast(node, babel_style=False))
    [(1, '_', ('foo',)), (1, 'ngettext', ('foo', 'bar'))]

    For every match this function yields a ``(lineno, function,
    message)`` tuple, where:

    * ``lineno`` is the line number of the call node,
    * ``function`` is the name of the gettext function that was called,
      and
    * ``message`` is the string itself or a tuple as described above.

    This extraction function operates on the AST and is because of that
    unable to extract any comments.  For comment support you have to use
    the babel extraction interface or extract comments yourself.
    """
    for call in node.find_all(nodes.Call):
        func = call.node
        # only direct calls to one of the known function names count
        if not (isinstance(func, nodes.Name) and
                func.name in gettext_functions):
            continue

        found = []
        for arg in call.args:
            if isinstance(arg, nodes.Const) and \
               isinstance(arg.value, basestring):
                found.append(arg.value)
            else:
                found.append(None)

        # keyword and dynamic arguments only show up as placeholders
        found.extend(None for _ in call.kwargs)
        if call.dyn_args is not None:
            found.append(None)
        if call.dyn_kwargs is not None:
            found.append(None)

        if babel_style:
            if len(found) == 1:
                message = found[0]
            else:
                message = tuple(found)
        else:
            message = tuple([x for x in found if x is not None])
            if not message:
                continue
        yield call.lineno, func.name, message
504
505
Armin Ronacher531578d2010-02-06 16:34:54 +0100506class _CommentFinder(object):
507 """Helper class to find comments in a token stream. Can only
508 find comments for gettext calls forwards. Once the comment
509 from line 4 is found, a comment for line 1 will not return a
510 usable value.
511 """
512
513 def __init__(self, tokens, comment_tags):
514 self.tokens = tokens
515 self.comment_tags = comment_tags
516 self.offset = 0
517 self.last_lineno = 0
518
519 def find_backwards(self, offset):
520 try:
521 for _, token_type, token_value in \
522 reversed(self.tokens[self.offset:offset]):
523 if token_type in ('comment', 'linecomment'):
524 try:
525 prefix, comment = token_value.split(None, 1)
526 except ValueError:
527 continue
528 if prefix in self.comment_tags:
529 return [comment.rstrip()]
530 return []
531 finally:
532 self.offset = offset
533
534 def find_comments(self, lineno):
535 if not self.comment_tags or self.last_lineno > lineno:
536 return []
537 for idx, (token_lineno, _, _) in enumerate(self.tokens[self.offset:]):
538 if token_lineno > lineno:
539 return self.find_backwards(self.offset + idx)
540 return self.find_backwards(len(self.tokens))
541
542
def babel_extract(fileobj, keywords, comment_tags, options):
    """Babel extraction method for Jinja templates.

    .. versionchanged:: 2.3
       Basic support for translation comments was added.  If `comment_tags`
       is now set to a list of keywords for extraction, the extractor will
       try to find the best preceding comment that begins with one of the
       keywords.  For best results, make sure to not have more than one
       gettext call in one line of code and the matching comment in the
       same line or the line before.

    .. versionchanged:: 2.5.1
       The `newstyle_gettext` flag can be set to `True` to enable newstyle
       gettext calls.

    .. versionchanged:: 2.7
       A `silent` option can now be provided.  If set to `False` template
       syntax errors are propagated instead of being ignored.

    :param fileobj: the file-like object the messages should be extracted
                    from.  Its content is read completely and decoded
                    with the ``encoding`` option (``utf-8`` by default).
    :param keywords: a list of keywords (i.e. function names) that should be
                     recognized as translation functions
    :param comment_tags: a list of translator tags to search for and include
                         in the results.
    :param options: a dictionary of additional options.  Besides the
                    options mentioned above, ``extensions`` (a comma
                    separated list of import names), the delimiter and
                    prefix settings of the environment and ``trim_blocks``
                    are read from it.
    :return: an iterator over ``(lineno, funcname, message, comments)``
             tuples.  ``comments`` is a list holding at most one comment.
    """
    extensions = set()
    for extension in options.get('extensions', '').split(','):
        extension = extension.strip()
        if not extension:
            continue
        extensions.add(import_string(extension))
    # the i18n extension is always needed; adding to a set is idempotent
    extensions.add(InternationalizationExtension)

    def getbool(options, key, default=False):
        # option values are strings, so the default is turned into one
        # too before it is compared against the accepted spellings.
        return options.get(key, str(default)).lower() in \
            ('1', 'on', 'yes', 'true')

    silent = getbool(options, 'silent', True)
    environment = Environment(
        options.get('block_start_string', BLOCK_START_STRING),
        options.get('block_end_string', BLOCK_END_STRING),
        options.get('variable_start_string', VARIABLE_START_STRING),
        options.get('variable_end_string', VARIABLE_END_STRING),
        options.get('comment_start_string', COMMENT_START_STRING),
        options.get('comment_end_string', COMMENT_END_STRING),
        options.get('line_statement_prefix') or LINE_STATEMENT_PREFIX,
        options.get('line_comment_prefix') or LINE_COMMENT_PREFIX,
        getbool(options, 'trim_blocks', TRIM_BLOCKS),
        NEWLINE_SEQUENCE, frozenset(extensions),
        cache_size=0,
        auto_reload=False
    )

    if getbool(options, 'newstyle_gettext'):
        environment.newstyle_gettext = True

    source = fileobj.read().decode(options.get('encoding', 'utf-8'))
    try:
        node = environment.parse(source)
        tokens = list(environment.lex(environment.preprocess(source)))
    except TemplateSyntaxError:
        if not silent:
            raise
        # skip templates with syntax errors
        return

    finder = _CommentFinder(tokens, comment_tags)
    for lineno, func, message in extract_from_ast(node, keywords):
        yield lineno, func, message, finder.find_comments(lineno)
Armin Ronachered98cac2008-05-07 08:42:11 +0200616
617
#: nicer import names: short module-level aliases for the extension
#: classes defined above.
i18n = InternationalizationExtension
do = ExprStmtExtension
loopcontrols = LoopControlExtension
with_ = WithExtension
autoescape = AutoEscapeExtension