jinja2.ext

Extension API for adding custom tags and behavior.

  1"""Extension API for adding custom tags and behavior."""
  2import pprint
  3import re
  4import typing as t
  5
  6from markupsafe import Markup
  7
  8from . import defaults
  9from . import nodes
 10from .environment import Environment
 11from .exceptions import TemplateAssertionError
 12from .exceptions import TemplateSyntaxError
 13from .runtime import concat  # type: ignore
 14from .runtime import Context
 15from .runtime import Undefined
 16from .utils import import_string
 17from .utils import pass_context
 18
 19if t.TYPE_CHECKING:
 20    import typing_extensions as te
 21    from .lexer import Token
 22    from .lexer import TokenStream
 23    from .parser import Parser
 24
 25    class _TranslationsBasic(te.Protocol):
 26        def gettext(self, message: str) -> str:
 27            ...
 28
 29        def ngettext(self, singular: str, plural: str, n: int) -> str:
 30            pass
 31
 32    class _TranslationsContext(_TranslationsBasic):
 33        def pgettext(self, context: str, message: str) -> str:
 34            ...
 35
 36        def npgettext(self, context: str, singular: str, plural: str, n: int) -> str:
 37            ...
 38
 39    _SupportedTranslations = t.Union[_TranslationsBasic, _TranslationsContext]
 40
 41
 42# I18N functions available in Jinja templates. If the I18N library
 43# provides ugettext, it will be assigned to gettext.
 44GETTEXT_FUNCTIONS: t.Tuple[str, ...] = (
 45    "_",
 46    "gettext",
 47    "ngettext",
 48    "pgettext",
 49    "npgettext",
 50)
 51_ws_re = re.compile(r"\s*\n\s*")
 52
 53
 54class Extension:
 55    """Extensions can be used to add extra functionality to the Jinja template
 56    system at the parser level.  Custom extensions are bound to an environment
 57    but may not store environment specific data on `self`.  The reason for
 58    this is that an extension can be bound to another environment (for
 59    overlays) by creating a copy and reassigning the `environment` attribute.
 60
 61    As extensions are created by the environment they cannot accept any
 62    arguments for configuration.  One may want to work around that by using
 63    a factory function, but that is not possible as extensions are identified
 64    by their import name.  The correct way to configure the extension is
 65    storing the configuration values on the environment.  Because this way the
 66    environment ends up acting as central configuration storage the
 67    attributes may clash which is why extensions have to ensure that the names
 68    they choose for configuration are not too generic.  ``prefix`` for example
 69    is a terrible name, ``fragment_cache_prefix`` on the other hand is a good
 70    name as includes the name of the extension (fragment cache).
 71    """
 72
 73    identifier: t.ClassVar[str]
 74
 75    def __init_subclass__(cls) -> None:
 76        cls.identifier = f"{cls.__module__}.{cls.__name__}"
 77
 78    #: if this extension parses this is the list of tags it's listening to.
 79    tags: t.Set[str] = set()
 80
 81    #: the priority of that extension.  This is especially useful for
 82    #: extensions that preprocess values.  A lower value means higher
 83    #: priority.
 84    #:
 85    #: .. versionadded:: 2.4
 86    priority = 100
 87
 88    def __init__(self, environment: Environment) -> None:
 89        self.environment = environment
 90
 91    def bind(self, environment: Environment) -> "Extension":
 92        """Create a copy of this extension bound to another environment."""
 93        rv = object.__new__(self.__class__)
 94        rv.__dict__.update(self.__dict__)
 95        rv.environment = environment
 96        return rv
 97
 98    def preprocess(
 99        self, source: str, name: t.Optional[str], filename: t.Optional[str] = None
100    ) -> str:
101        """This method is called before the actual lexing and can be used to
102        preprocess the source.  The `filename` is optional.  The return value
103        must be the preprocessed source.
104        """
105        return source
106
107    def filter_stream(
108        self, stream: "TokenStream"
109    ) -> t.Union["TokenStream", t.Iterable["Token"]]:
110        """It's passed a :class:`~jinja2.lexer.TokenStream` that can be used
111        to filter tokens returned.  This method has to return an iterable of
112        :class:`~jinja2.lexer.Token`\\s, but it doesn't have to return a
113        :class:`~jinja2.lexer.TokenStream`.
114        """
115        return stream
116
117    def parse(self, parser: "Parser") -> t.Union[nodes.Node, t.List[nodes.Node]]:
118        """If any of the :attr:`tags` matched this method is called with the
119        parser as first argument.  The token the parser stream is pointing at
120        is the name token that matched.  This method has to return one or a
121        list of multiple nodes.
122        """
123        raise NotImplementedError()
124
125    def attr(
126        self, name: str, lineno: t.Optional[int] = None
127    ) -> nodes.ExtensionAttribute:
128        """Return an attribute node for the current extension.  This is useful
129        to pass constants on extensions to generated template code.
130
131        ::
132
133            self.attr('_my_attribute', lineno=lineno)
134        """
135        return nodes.ExtensionAttribute(self.identifier, name, lineno=lineno)
136
137    def call_method(
138        self,
139        name: str,
140        args: t.Optional[t.List[nodes.Expr]] = None,
141        kwargs: t.Optional[t.List[nodes.Keyword]] = None,
142        dyn_args: t.Optional[nodes.Expr] = None,
143        dyn_kwargs: t.Optional[nodes.Expr] = None,
144        lineno: t.Optional[int] = None,
145    ) -> nodes.Call:
146        """Call a method of the extension.  This is a shortcut for
147        :meth:`attr` + :class:`jinja2.nodes.Call`.
148        """
149        if args is None:
150            args = []
151        if kwargs is None:
152            kwargs = []
153        return nodes.Call(
154            self.attr(name, lineno=lineno),
155            args,
156            kwargs,
157            dyn_args,
158            dyn_kwargs,
159            lineno=lineno,
160        )
161
162
163@pass_context
164def _gettext_alias(
165    __context: Context, *args: t.Any, **kwargs: t.Any
166) -> t.Union[t.Any, Undefined]:
167    return __context.call(__context.resolve("gettext"), *args, **kwargs)
168
169
170def _make_new_gettext(func: t.Callable[[str], str]) -> t.Callable[..., str]:
171    @pass_context
172    def gettext(__context: Context, __string: str, **variables: t.Any) -> str:
173        rv = __context.call(func, __string)
174        if __context.eval_ctx.autoescape:
175            rv = Markup(rv)
176        # Always treat as a format string, even if there are no
177        # variables. This makes translation strings more consistent
178        # and predictable. This requires escaping
179        return rv % variables  # type: ignore
180
181    return gettext
182
183
184def _make_new_ngettext(func: t.Callable[[str, str, int], str]) -> t.Callable[..., str]:
185    @pass_context
186    def ngettext(
187        __context: Context,
188        __singular: str,
189        __plural: str,
190        __num: int,
191        **variables: t.Any,
192    ) -> str:
193        variables.setdefault("num", __num)
194        rv = __context.call(func, __singular, __plural, __num)
195        if __context.eval_ctx.autoescape:
196            rv = Markup(rv)
197        # Always treat as a format string, see gettext comment above.
198        return rv % variables  # type: ignore
199
200    return ngettext
201
202
203def _make_new_pgettext(func: t.Callable[[str, str], str]) -> t.Callable[..., str]:
204    @pass_context
205    def pgettext(
206        __context: Context, __string_ctx: str, __string: str, **variables: t.Any
207    ) -> str:
208        variables.setdefault("context", __string_ctx)
209        rv = __context.call(func, __string_ctx, __string)
210
211        if __context.eval_ctx.autoescape:
212            rv = Markup(rv)
213
214        # Always treat as a format string, see gettext comment above.
215        return rv % variables  # type: ignore
216
217    return pgettext
218
219
220def _make_new_npgettext(
221    func: t.Callable[[str, str, str, int], str]
222) -> t.Callable[..., str]:
223    @pass_context
224    def npgettext(
225        __context: Context,
226        __string_ctx: str,
227        __singular: str,
228        __plural: str,
229        __num: int,
230        **variables: t.Any,
231    ) -> str:
232        variables.setdefault("context", __string_ctx)
233        variables.setdefault("num", __num)
234        rv = __context.call(func, __string_ctx, __singular, __plural, __num)
235
236        if __context.eval_ctx.autoescape:
237            rv = Markup(rv)
238
239        # Always treat as a format string, see gettext comment above.
240        return rv % variables  # type: ignore
241
242    return npgettext
243
244
245class InternationalizationExtension(Extension):
246    """This extension adds gettext support to Jinja."""
247
248    tags = {"trans"}
249
250    # TODO: the i18n extension is currently reevaluating values in a few
251    # situations.  Take this example:
252    #   {% trans count=something() %}{{ count }} foo{% pluralize
253    #     %}{{ count }} fooss{% endtrans %}
254    # something is called twice here.  One time for the gettext value and
255    # the other time for the n-parameter of the ngettext function.
256
257    def __init__(self, environment: Environment) -> None:
258        super().__init__(environment)
259        environment.globals["_"] = _gettext_alias
260        environment.extend(
261            install_gettext_translations=self._install,
262            install_null_translations=self._install_null,
263            install_gettext_callables=self._install_callables,
264            uninstall_gettext_translations=self._uninstall,
265            extract_translations=self._extract,
266            newstyle_gettext=False,
267        )
268
269    def _install(
270        self, translations: "_SupportedTranslations", newstyle: t.Optional[bool] = None
271    ) -> None:
272        # ugettext and ungettext are preferred in case the I18N library
273        # is providing compatibility with older Python versions.
274        gettext = getattr(translations, "ugettext", None)
275        if gettext is None:
276            gettext = translations.gettext
277        ngettext = getattr(translations, "ungettext", None)
278        if ngettext is None:
279            ngettext = translations.ngettext
280
281        pgettext = getattr(translations, "pgettext", None)
282        npgettext = getattr(translations, "npgettext", None)
283        self._install_callables(
284            gettext, ngettext, newstyle=newstyle, pgettext=pgettext, npgettext=npgettext
285        )
286
287    def _install_null(self, newstyle: t.Optional[bool] = None) -> None:
288        import gettext
289
290        translations = gettext.NullTranslations()
291
292        if hasattr(translations, "pgettext"):
293            # Python < 3.8
294            pgettext = translations.pgettext
295        else:
296
297            def pgettext(c: str, s: str) -> str:
298                return s
299
300        if hasattr(translations, "npgettext"):
301            npgettext = translations.npgettext
302        else:
303
304            def npgettext(c: str, s: str, p: str, n: int) -> str:
305                return s if n == 1 else p
306
307        self._install_callables(
308            gettext=translations.gettext,
309            ngettext=translations.ngettext,
310            newstyle=newstyle,
311            pgettext=pgettext,
312            npgettext=npgettext,
313        )
314
315    def _install_callables(
316        self,
317        gettext: t.Callable[[str], str],
318        ngettext: t.Callable[[str, str, int], str],
319        newstyle: t.Optional[bool] = None,
320        pgettext: t.Optional[t.Callable[[str, str], str]] = None,
321        npgettext: t.Optional[t.Callable[[str, str, str, int], str]] = None,
322    ) -> None:
323        if newstyle is not None:
324            self.environment.newstyle_gettext = newstyle  # type: ignore
325        if self.environment.newstyle_gettext:  # type: ignore
326            gettext = _make_new_gettext(gettext)
327            ngettext = _make_new_ngettext(ngettext)
328
329            if pgettext is not None:
330                pgettext = _make_new_pgettext(pgettext)
331
332            if npgettext is not None:
333                npgettext = _make_new_npgettext(npgettext)
334
335        self.environment.globals.update(
336            gettext=gettext, ngettext=ngettext, pgettext=pgettext, npgettext=npgettext
337        )
338
339    def _uninstall(self, translations: "_SupportedTranslations") -> None:
340        for key in ("gettext", "ngettext", "pgettext", "npgettext"):
341            self.environment.globals.pop(key, None)
342
343    def _extract(
344        self,
345        source: t.Union[str, nodes.Template],
346        gettext_functions: t.Sequence[str] = GETTEXT_FUNCTIONS,
347    ) -> t.Iterator[
348        t.Tuple[int, str, t.Union[t.Optional[str], t.Tuple[t.Optional[str], ...]]]
349    ]:
350        if isinstance(source, str):
351            source = self.environment.parse(source)
352        return extract_from_ast(source, gettext_functions)
353
354    def parse(self, parser: "Parser") -> t.Union[nodes.Node, t.List[nodes.Node]]:
355        """Parse a translatable tag."""
356        lineno = next(parser.stream).lineno
357
358        context = None
359        context_token = parser.stream.next_if("string")
360
361        if context_token is not None:
362            context = context_token.value
363
364        # find all the variables referenced.  Additionally a variable can be
365        # defined in the body of the trans block too, but this is checked at
366        # a later state.
367        plural_expr: t.Optional[nodes.Expr] = None
368        plural_expr_assignment: t.Optional[nodes.Assign] = None
369        num_called_num = False
370        variables: t.Dict[str, nodes.Expr] = {}
371        trimmed = None
372        while parser.stream.current.type != "block_end":
373            if variables:
374                parser.stream.expect("comma")
375
376            # skip colon for python compatibility
377            if parser.stream.skip_if("colon"):
378                break
379
380            token = parser.stream.expect("name")
381            if token.value in variables:
382                parser.fail(
383                    f"translatable variable {token.value!r} defined twice.",
384                    token.lineno,
385                    exc=TemplateAssertionError,
386                )
387
388            # expressions
389            if parser.stream.current.type == "assign":
390                next(parser.stream)
391                variables[token.value] = var = parser.parse_expression()
392            elif trimmed is None and token.value in ("trimmed", "notrimmed"):
393                trimmed = token.value == "trimmed"
394                continue
395            else:
396                variables[token.value] = var = nodes.Name(token.value, "load")
397
398            if plural_expr is None:
399                if isinstance(var, nodes.Call):
400                    plural_expr = nodes.Name("_trans", "load")
401                    variables[token.value] = plural_expr
402                    plural_expr_assignment = nodes.Assign(
403                        nodes.Name("_trans", "store"), var
404                    )
405                else:
406                    plural_expr = var
407                num_called_num = token.value == "num"
408
409        parser.stream.expect("block_end")
410
411        plural = None
412        have_plural = False
413        referenced = set()
414
415        # now parse until endtrans or pluralize
416        singular_names, singular = self._parse_block(parser, True)
417        if singular_names:
418            referenced.update(singular_names)
419            if plural_expr is None:
420                plural_expr = nodes.Name(singular_names[0], "load")
421                num_called_num = singular_names[0] == "num"
422
423        # if we have a pluralize block, we parse that too
424        if parser.stream.current.test("name:pluralize"):
425            have_plural = True
426            next(parser.stream)
427            if parser.stream.current.type != "block_end":
428                token = parser.stream.expect("name")
429                if token.value not in variables:
430                    parser.fail(
431                        f"unknown variable {token.value!r} for pluralization",
432                        token.lineno,
433                        exc=TemplateAssertionError,
434                    )
435                plural_expr = variables[token.value]
436                num_called_num = token.value == "num"
437            parser.stream.expect("block_end")
438            plural_names, plural = self._parse_block(parser, False)
439            next(parser.stream)
440            referenced.update(plural_names)
441        else:
442            next(parser.stream)
443
444        # register free names as simple name expressions
445        for name in referenced:
446            if name not in variables:
447                variables[name] = nodes.Name(name, "load")
448
449        if not have_plural:
450            plural_expr = None
451        elif plural_expr is None:
452            parser.fail("pluralize without variables", lineno)
453
454        if trimmed is None:
455            trimmed = self.environment.policies["ext.i18n.trimmed"]
456        if trimmed:
457            singular = self._trim_whitespace(singular)
458            if plural:
459                plural = self._trim_whitespace(plural)
460
461        node = self._make_node(
462            singular,
463            plural,
464            context,
465            variables,
466            plural_expr,
467            bool(referenced),
468            num_called_num and have_plural,
469        )
470        node.set_lineno(lineno)
471        if plural_expr_assignment is not None:
472            return [plural_expr_assignment, node]
473        else:
474            return node
475
476    def _trim_whitespace(self, string: str, _ws_re: t.Pattern[str] = _ws_re) -> str:
477        return _ws_re.sub(" ", string.strip())
478
479    def _parse_block(
480        self, parser: "Parser", allow_pluralize: bool
481    ) -> t.Tuple[t.List[str], str]:
482        """Parse until the next block tag with a given name."""
483        referenced = []
484        buf = []
485
486        while True:
487            if parser.stream.current.type == "data":
488                buf.append(parser.stream.current.value.replace("%", "%%"))
489                next(parser.stream)
490            elif parser.stream.current.type == "variable_begin":
491                next(parser.stream)
492                name = parser.stream.expect("name").value
493                referenced.append(name)
494                buf.append(f"%({name})s")
495                parser.stream.expect("variable_end")
496            elif parser.stream.current.type == "block_begin":
497                next(parser.stream)
498                block_name = (
499                    parser.stream.current.value
500                    if parser.stream.current.type == "name"
501                    else None
502                )
503                if block_name == "endtrans":
504                    break
505                elif block_name == "pluralize":
506                    if allow_pluralize:
507                        break
508                    parser.fail(
509                        "a translatable section can have only one pluralize section"
510                    )
511                elif block_name == "trans":
512                    parser.fail(
513                        "trans blocks can't be nested; did you mean `endtrans`?"
514                    )
515                parser.fail(
516                    f"control structures in translatable sections are not allowed; "
517                    f"saw `{block_name}`"
518                )
519            elif parser.stream.eos:
520                parser.fail("unclosed translation block")
521            else:
522                raise RuntimeError("internal parser error")
523
524        return referenced, concat(buf)
525
526    def _make_node(
527        self,
528        singular: str,
529        plural: t.Optional[str],
530        context: t.Optional[str],
531        variables: t.Dict[str, nodes.Expr],
532        plural_expr: t.Optional[nodes.Expr],
533        vars_referenced: bool,
534        num_called_num: bool,
535    ) -> nodes.Output:
536        """Generates a useful node from the data provided."""
537        newstyle = self.environment.newstyle_gettext  # type: ignore
538        node: nodes.Expr
539
540        # no variables referenced?  no need to escape for old style
541        # gettext invocations only if there are vars.
542        if not vars_referenced and not newstyle:
543            singular = singular.replace("%%", "%")
544            if plural:
545                plural = plural.replace("%%", "%")
546
547        func_name = "gettext"
548        func_args: t.List[nodes.Expr] = [nodes.Const(singular)]
549
550        if context is not None:
551            func_args.insert(0, nodes.Const(context))
552            func_name = f"p{func_name}"
553
554        if plural_expr is not None:
555            func_name = f"n{func_name}"
556            func_args.extend((nodes.Const(plural), plural_expr))
557
558        node = nodes.Call(nodes.Name(func_name, "load"), func_args, [], None, None)
559
560        # in case newstyle gettext is used, the method is powerful
561        # enough to handle the variable expansion and autoescape
562        # handling itself
563        if newstyle:
564            for key, value in variables.items():
565                # the function adds that later anyways in case num was
566                # called num, so just skip it.
567                if num_called_num and key == "num":
568                    continue
569                node.kwargs.append(nodes.Keyword(key, value))
570
571        # otherwise do that here
572        else:
573            # mark the return value as safe if we are in an
574            # environment with autoescaping turned on
575            node = nodes.MarkSafeIfAutoescape(node)
576            if variables:
577                node = nodes.Mod(
578                    node,
579                    nodes.Dict(
580                        [
581                            nodes.Pair(nodes.Const(key), value)
582                            for key, value in variables.items()
583                        ]
584                    ),
585                )
586        return nodes.Output([node])
587
588
589class ExprStmtExtension(Extension):
590    """Adds a `do` tag to Jinja that works like the print statement just
591    that it doesn't print the return value.
592    """
593
594    tags = {"do"}
595
596    def parse(self, parser: "Parser") -> nodes.ExprStmt:
597        node = nodes.ExprStmt(lineno=next(parser.stream).lineno)
598        node.node = parser.parse_tuple()
599        return node
600
601
602class LoopControlExtension(Extension):
603    """Adds break and continue to the template engine."""
604
605    tags = {"break", "continue"}
606
607    def parse(self, parser: "Parser") -> t.Union[nodes.Break, nodes.Continue]:
608        token = next(parser.stream)
609        if token.value == "break":
610            return nodes.Break(lineno=token.lineno)
611        return nodes.Continue(lineno=token.lineno)
612
613
614class DebugExtension(Extension):
615    """A ``{% debug %}`` tag that dumps the available variables,
616    filters, and tests.
617
618    .. code-block:: html+jinja
619
620        <pre>{% debug %}</pre>
621
622    .. code-block:: text
623
624        {'context': {'cycler': <class 'jinja2.utils.Cycler'>,
625                     ...,
626                     'namespace': <class 'jinja2.utils.Namespace'>},
627         'filters': ['abs', 'attr', 'batch', 'capitalize', 'center', 'count', 'd',
628                     ..., 'urlencode', 'urlize', 'wordcount', 'wordwrap', 'xmlattr'],
629         'tests': ['!=', '<', '<=', '==', '>', '>=', 'callable', 'defined',
630                   ..., 'odd', 'sameas', 'sequence', 'string', 'undefined', 'upper']}
631
632    .. versionadded:: 2.11.0
633    """
634
635    tags = {"debug"}
636
637    def parse(self, parser: "Parser") -> nodes.Output:
638        lineno = parser.stream.expect("name:debug").lineno
639        context = nodes.ContextReference()
640        result = self.call_method("_render", [context], lineno=lineno)
641        return nodes.Output([result], lineno=lineno)
642
643    def _render(self, context: Context) -> str:
644        result = {
645            "context": context.get_all(),
646            "filters": sorted(self.environment.filters.keys()),
647            "tests": sorted(self.environment.tests.keys()),
648        }
649
650        # Set the depth since the intent is to show the top few names.
651        return pprint.pformat(result, depth=3, compact=True)
652
653
654def extract_from_ast(
655    ast: nodes.Template,
656    gettext_functions: t.Sequence[str] = GETTEXT_FUNCTIONS,
657    babel_style: bool = True,
658) -> t.Iterator[
659    t.Tuple[int, str, t.Union[t.Optional[str], t.Tuple[t.Optional[str], ...]]]
660]:
661    """Extract localizable strings from the given template node.  Per
662    default this function returns matches in babel style that means non string
663    parameters as well as keyword arguments are returned as `None`.  This
664    allows Babel to figure out what you really meant if you are using
665    gettext functions that allow keyword arguments for placeholder expansion.
666    If you don't want that behavior set the `babel_style` parameter to `False`
667    which causes only strings to be returned and parameters are always stored
668    in tuples.  As a consequence invalid gettext calls (calls without a single
669    string parameter or string parameters after non-string parameters) are
670    skipped.
671
672    This example explains the behavior:
673
674    >>> from jinja2 import Environment
675    >>> env = Environment()
676    >>> node = env.parse('{{ (_("foo"), _(), ngettext("foo", "bar", 42)) }}')
677    >>> list(extract_from_ast(node))
678    [(1, '_', 'foo'), (1, '_', ()), (1, 'ngettext', ('foo', 'bar', None))]
679    >>> list(extract_from_ast(node, babel_style=False))
680    [(1, '_', ('foo',)), (1, 'ngettext', ('foo', 'bar'))]
681
682    For every string found this function yields a ``(lineno, function,
683    message)`` tuple, where:
684
685    * ``lineno`` is the number of the line on which the string was found,
686    * ``function`` is the name of the ``gettext`` function used (if the
687      string was extracted from embedded Python code), and
688    *   ``message`` is the string, or a tuple of strings for functions
689         with multiple string arguments.
690
691    This extraction function operates on the AST and is because of that unable
692    to extract any comments.  For comment support you have to use the babel
693    extraction interface or extract comments yourself.
694    """
695    out: t.Union[t.Optional[str], t.Tuple[t.Optional[str], ...]]
696
697    for node in ast.find_all(nodes.Call):
698        if (
699            not isinstance(node.node, nodes.Name)
700            or node.node.name not in gettext_functions
701        ):
702            continue
703
704        strings: t.List[t.Optional[str]] = []
705
706        for arg in node.args:
707            if isinstance(arg, nodes.Const) and isinstance(arg.value, str):
708                strings.append(arg.value)
709            else:
710                strings.append(None)
711
712        for _ in node.kwargs:
713            strings.append(None)
714        if node.dyn_args is not None:
715            strings.append(None)
716        if node.dyn_kwargs is not None:
717            strings.append(None)
718
719        if not babel_style:
720            out = tuple(x for x in strings if x is not None)
721
722            if not out:
723                continue
724        else:
725            if len(strings) == 1:
726                out = strings[0]
727            else:
728                out = tuple(strings)
729
730        yield node.lineno, node.node.name, out
731
732
733class _CommentFinder:
734    """Helper class to find comments in a token stream.  Can only
735    find comments for gettext calls forwards.  Once the comment
736    from line 4 is found, a comment for line 1 will not return a
737    usable value.
738    """
739
740    def __init__(
741        self, tokens: t.Sequence[t.Tuple[int, str, str]], comment_tags: t.Sequence[str]
742    ) -> None:
743        self.tokens = tokens
744        self.comment_tags = comment_tags
745        self.offset = 0
746        self.last_lineno = 0
747
748    def find_backwards(self, offset: int) -> t.List[str]:
749        try:
750            for _, token_type, token_value in reversed(
751                self.tokens[self.offset : offset]
752            ):
753                if token_type in ("comment", "linecomment"):
754                    try:
755                        prefix, comment = token_value.split(None, 1)
756                    except ValueError:
757                        continue
758                    if prefix in self.comment_tags:
759                        return [comment.rstrip()]
760            return []
761        finally:
762            self.offset = offset
763
764    def find_comments(self, lineno: int) -> t.List[str]:
765        if not self.comment_tags or self.last_lineno > lineno:
766            return []
767        for idx, (token_lineno, _, _) in enumerate(self.tokens[self.offset :]):
768            if token_lineno > lineno:
769                return self.find_backwards(self.offset + idx)
770        return self.find_backwards(len(self.tokens))
771
772
773def babel_extract(
774    fileobj: t.BinaryIO,
775    keywords: t.Sequence[str],
776    comment_tags: t.Sequence[str],
777    options: t.Dict[str, t.Any],
778) -> t.Iterator[
779    t.Tuple[
780        int, str, t.Union[t.Optional[str], t.Tuple[t.Optional[str], ...]], t.List[str]
781    ]
782]:
783    """Babel extraction method for Jinja templates.
784
785    .. versionchanged:: 2.3
786       Basic support for translation comments was added.  If `comment_tags`
787       is now set to a list of keywords for extraction, the extractor will
788       try to find the best preceding comment that begins with one of the
789       keywords.  For best results, make sure to not have more than one
790       gettext call in one line of code and the matching comment in the
791       same line or the line before.
792
793    .. versionchanged:: 2.5.1
794       The `newstyle_gettext` flag can be set to `True` to enable newstyle
795       gettext calls.
796
797    .. versionchanged:: 2.7
798       A `silent` option can now be provided.  If set to `False` template
799       syntax errors are propagated instead of being ignored.
800
801    :param fileobj: the file-like object the messages should be extracted from
802    :param keywords: a list of keywords (i.e. function names) that should be
803                     recognized as translation functions
804    :param comment_tags: a list of translator tags to search for and include
805                         in the results.
806    :param options: a dictionary of additional options (optional)
807    :return: an iterator over ``(lineno, funcname, message, comments)`` tuples.
808             (comments will be empty currently)
809    """
810    extensions: t.Dict[t.Type[Extension], None] = {}
811
812    for extension_name in options.get("extensions", "").split(","):
813        extension_name = extension_name.strip()
814
815        if not extension_name:
816            continue
817
818        extensions[import_string(extension_name)] = None
819
820    if InternationalizationExtension not in extensions:
821        extensions[InternationalizationExtension] = None
822
823    def getbool(options: t.Mapping[str, str], key: str, default: bool = False) -> bool:
824        return options.get(key, str(default)).lower() in {"1", "on", "yes", "true"}
825
826    silent = getbool(options, "silent", True)
827    environment = Environment(
828        options.get("block_start_string", defaults.BLOCK_START_STRING),
829        options.get("block_end_string", defaults.BLOCK_END_STRING),
830        options.get("variable_start_string", defaults.VARIABLE_START_STRING),
831        options.get("variable_end_string", defaults.VARIABLE_END_STRING),
832        options.get("comment_start_string", defaults.COMMENT_START_STRING),
833        options.get("comment_end_string", defaults.COMMENT_END_STRING),
834        options.get("line_statement_prefix") or defaults.LINE_STATEMENT_PREFIX,
835        options.get("line_comment_prefix") or defaults.LINE_COMMENT_PREFIX,
836        getbool(options, "trim_blocks", defaults.TRIM_BLOCKS),
837        getbool(options, "lstrip_blocks", defaults.LSTRIP_BLOCKS),
838        defaults.NEWLINE_SEQUENCE,
839        getbool(options, "keep_trailing_newline", defaults.KEEP_TRAILING_NEWLINE),
840        tuple(extensions),
841        cache_size=0,
842        auto_reload=False,
843    )
844
845    if getbool(options, "trimmed"):
846        environment.policies["ext.i18n.trimmed"] = True
847    if getbool(options, "newstyle_gettext"):
848        environment.newstyle_gettext = True  # type: ignore
849
850    source = fileobj.read().decode(options.get("encoding", "utf-8"))
851    try:
852        node = environment.parse(source)
853        tokens = list(environment.lex(environment.preprocess(source)))
854    except TemplateSyntaxError:
855        if not silent:
856            raise
857        # skip templates with syntax errors
858        return
859
860    finder = _CommentFinder(tokens, comment_tags)
861    for lineno, func, message in extract_from_ast(node, keywords):
862        yield lineno, func, message, finder.find_comments(lineno)
863
864
865#: nicer import names
866i18n = InternationalizationExtension
867do = ExprStmtExtension
868loopcontrols = LoopControlExtension
869debug = DebugExtension
GETTEXT_FUNCTIONS: Tuple[str, ...] = ('_', 'gettext', 'ngettext', 'pgettext', 'npgettext')
class Extension:
 55class Extension:
 56    """Extensions can be used to add extra functionality to the Jinja template
 57    system at the parser level.  Custom extensions are bound to an environment
 58    but may not store environment specific data on `self`.  The reason for
 59    this is that an extension can be bound to another environment (for
 60    overlays) by creating a copy and reassigning the `environment` attribute.
 61
 62    As extensions are created by the environment they cannot accept any
 63    arguments for configuration.  One may want to work around that by using
 64    a factory function, but that is not possible as extensions are identified
 65    by their import name.  The correct way to configure the extension is
 66    storing the configuration values on the environment.  Because this way the
 67    environment ends up acting as central configuration storage the
 68    attributes may clash which is why extensions have to ensure that the names
 69    they choose for configuration are not too generic.  ``prefix`` for example
 70    is a terrible name, ``fragment_cache_prefix`` on the other hand is a good
 71    name as includes the name of the extension (fragment cache).
 72    """
 73
 74    identifier: t.ClassVar[str]
 75
 76    def __init_subclass__(cls) -> None:
 77        cls.identifier = f"{cls.__module__}.{cls.__name__}"
 78
 79    #: if this extension parses this is the list of tags it's listening to.
 80    tags: t.Set[str] = set()
 81
 82    #: the priority of that extension.  This is especially useful for
 83    #: extensions that preprocess values.  A lower value means higher
 84    #: priority.
 85    #:
 86    #: .. versionadded:: 2.4
 87    priority = 100
 88
 89    def __init__(self, environment: Environment) -> None:
 90        self.environment = environment
 91
 92    def bind(self, environment: Environment) -> "Extension":
 93        """Create a copy of this extension bound to another environment."""
 94        rv = object.__new__(self.__class__)
 95        rv.__dict__.update(self.__dict__)
 96        rv.environment = environment
 97        return rv
 98
 99    def preprocess(
100        self, source: str, name: t.Optional[str], filename: t.Optional[str] = None
101    ) -> str:
102        """This method is called before the actual lexing and can be used to
103        preprocess the source.  The `filename` is optional.  The return value
104        must be the preprocessed source.
105        """
106        return source
107
108    def filter_stream(
109        self, stream: "TokenStream"
110    ) -> t.Union["TokenStream", t.Iterable["Token"]]:
111        """It's passed a :class:`~jinja2.lexer.TokenStream` that can be used
112        to filter tokens returned.  This method has to return an iterable of
113        :class:`~jinja2.lexer.Token`\\s, but it doesn't have to return a
114        :class:`~jinja2.lexer.TokenStream`.
115        """
116        return stream
117
118    def parse(self, parser: "Parser") -> t.Union[nodes.Node, t.List[nodes.Node]]:
119        """If any of the :attr:`tags` matched this method is called with the
120        parser as first argument.  The token the parser stream is pointing at
121        is the name token that matched.  This method has to return one or a
122        list of multiple nodes.
123        """
124        raise NotImplementedError()
125
126    def attr(
127        self, name: str, lineno: t.Optional[int] = None
128    ) -> nodes.ExtensionAttribute:
129        """Return an attribute node for the current extension.  This is useful
130        to pass constants on extensions to generated template code.
131
132        ::
133
134            self.attr('_my_attribute', lineno=lineno)
135        """
136        return nodes.ExtensionAttribute(self.identifier, name, lineno=lineno)
137
138    def call_method(
139        self,
140        name: str,
141        args: t.Optional[t.List[nodes.Expr]] = None,
142        kwargs: t.Optional[t.List[nodes.Keyword]] = None,
143        dyn_args: t.Optional[nodes.Expr] = None,
144        dyn_kwargs: t.Optional[nodes.Expr] = None,
145        lineno: t.Optional[int] = None,
146    ) -> nodes.Call:
147        """Call a method of the extension.  This is a shortcut for
148        :meth:`attr` + :class:`jinja2.nodes.Call`.
149        """
150        if args is None:
151            args = []
152        if kwargs is None:
153            kwargs = []
154        return nodes.Call(
155            self.attr(name, lineno=lineno),
156            args,
157            kwargs,
158            dyn_args,
159            dyn_kwargs,
160            lineno=lineno,
161        )

Extensions can be used to add extra functionality to the Jinja template system at the parser level. Custom extensions are bound to an environment but may not store environment specific data on self. The reason for this is that an extension can be bound to another environment (for overlays) by creating a copy and reassigning the environment attribute.

As extensions are created by the environment they cannot accept any arguments for configuration. One may want to work around that by using a factory function, but that is not possible as extensions are identified by their import name. The correct way to configure the extension is storing the configuration values on the environment. Because this way the environment ends up acting as central configuration storage the attributes may clash which is why extensions have to ensure that the names they choose for configuration are not too generic. prefix for example is a terrible name, fragment_cache_prefix on the other hand is a good name as includes the name of the extension (fragment cache).

Extension(environment: jinja2.environment.Environment)
89    def __init__(self, environment: Environment) -> None:
90        self.environment = environment
identifier: ClassVar[str]
tags: Set[str] = set()
priority = 100
environment
def bind( self, environment: jinja2.environment.Environment) -> Extension:
92    def bind(self, environment: Environment) -> "Extension":
93        """Create a copy of this extension bound to another environment."""
94        rv = object.__new__(self.__class__)
95        rv.__dict__.update(self.__dict__)
96        rv.environment = environment
97        return rv

Create a copy of this extension bound to another environment.

def preprocess( self, source: str, name: Optional[str], filename: Optional[str] = None) -> str:
 99    def preprocess(
100        self, source: str, name: t.Optional[str], filename: t.Optional[str] = None
101    ) -> str:
102        """This method is called before the actual lexing and can be used to
103        preprocess the source.  The `filename` is optional.  The return value
104        must be the preprocessed source.
105        """
106        return source

This method is called before the actual lexing and can be used to preprocess the source. The filename is optional. The return value must be the preprocessed source.

def filter_stream( self, stream: jinja2.lexer.TokenStream) -> Union[jinja2.lexer.TokenStream, Iterable[jinja2.lexer.Token]]:
108    def filter_stream(
109        self, stream: "TokenStream"
110    ) -> t.Union["TokenStream", t.Iterable["Token"]]:
111        """It's passed a :class:`~jinja2.lexer.TokenStream` that can be used
112        to filter tokens returned.  This method has to return an iterable of
113        :class:`~jinja2.lexer.Token`\\s, but it doesn't have to return a
114        :class:`~jinja2.lexer.TokenStream`.
115        """
116        return stream

It's passed a ~jinja2.lexer.TokenStream that can be used to filter tokens returned. This method has to return an iterable of ~jinja2.lexer.Token\s, but it doesn't have to return a ~jinja2.lexer.TokenStream.

def parse( self, parser: jinja2.parser.Parser) -> Union[jinja2.nodes.Node, List[jinja2.nodes.Node]]:
118    def parse(self, parser: "Parser") -> t.Union[nodes.Node, t.List[nodes.Node]]:
119        """If any of the :attr:`tags` matched this method is called with the
120        parser as first argument.  The token the parser stream is pointing at
121        is the name token that matched.  This method has to return one or a
122        list of multiple nodes.
123        """
124        raise NotImplementedError()

If any of the tags matched this method is called with the parser as first argument. The token the parser stream is pointing at is the name token that matched. This method has to return one or a list of multiple nodes.

def attr( self, name: str, lineno: Optional[int] = None) -> jinja2.nodes.ExtensionAttribute:
126    def attr(
127        self, name: str, lineno: t.Optional[int] = None
128    ) -> nodes.ExtensionAttribute:
129        """Return an attribute node for the current extension.  This is useful
130        to pass constants on extensions to generated template code.
131
132        ::
133
134            self.attr('_my_attribute', lineno=lineno)
135        """
136        return nodes.ExtensionAttribute(self.identifier, name, lineno=lineno)

Return an attribute node for the current extension. This is useful to pass constants on extensions to generated template code.

::

self.attr('_my_attribute', lineno=lineno)
def call_method( self, name: str, args: Optional[List[jinja2.nodes.Expr]] = None, kwargs: Optional[List[jinja2.nodes.Keyword]] = None, dyn_args: Optional[jinja2.nodes.Expr] = None, dyn_kwargs: Optional[jinja2.nodes.Expr] = None, lineno: Optional[int] = None) -> jinja2.nodes.Call:
138    def call_method(
139        self,
140        name: str,
141        args: t.Optional[t.List[nodes.Expr]] = None,
142        kwargs: t.Optional[t.List[nodes.Keyword]] = None,
143        dyn_args: t.Optional[nodes.Expr] = None,
144        dyn_kwargs: t.Optional[nodes.Expr] = None,
145        lineno: t.Optional[int] = None,
146    ) -> nodes.Call:
147        """Call a method of the extension.  This is a shortcut for
148        :meth:`attr` + :class:`jinja2.nodes.Call`.
149        """
150        if args is None:
151            args = []
152        if kwargs is None:
153            kwargs = []
154        return nodes.Call(
155            self.attr(name, lineno=lineno),
156            args,
157            kwargs,
158            dyn_args,
159            dyn_kwargs,
160            lineno=lineno,
161        )

Call a method of the extension. This is a shortcut for attr() + jinja2.nodes.Call.

class InternationalizationExtension(Extension):
246class InternationalizationExtension(Extension):
247    """This extension adds gettext support to Jinja."""
248
249    tags = {"trans"}
250
251    # TODO: the i18n extension is currently reevaluating values in a few
252    # situations.  Take this example:
253    #   {% trans count=something() %}{{ count }} foo{% pluralize
254    #     %}{{ count }} fooss{% endtrans %}
255    # something is called twice here.  One time for the gettext value and
256    # the other time for the n-parameter of the ngettext function.
257
258    def __init__(self, environment: Environment) -> None:
259        super().__init__(environment)
260        environment.globals["_"] = _gettext_alias
261        environment.extend(
262            install_gettext_translations=self._install,
263            install_null_translations=self._install_null,
264            install_gettext_callables=self._install_callables,
265            uninstall_gettext_translations=self._uninstall,
266            extract_translations=self._extract,
267            newstyle_gettext=False,
268        )
269
270    def _install(
271        self, translations: "_SupportedTranslations", newstyle: t.Optional[bool] = None
272    ) -> None:
273        # ugettext and ungettext are preferred in case the I18N library
274        # is providing compatibility with older Python versions.
275        gettext = getattr(translations, "ugettext", None)
276        if gettext is None:
277            gettext = translations.gettext
278        ngettext = getattr(translations, "ungettext", None)
279        if ngettext is None:
280            ngettext = translations.ngettext
281
282        pgettext = getattr(translations, "pgettext", None)
283        npgettext = getattr(translations, "npgettext", None)
284        self._install_callables(
285            gettext, ngettext, newstyle=newstyle, pgettext=pgettext, npgettext=npgettext
286        )
287
288    def _install_null(self, newstyle: t.Optional[bool] = None) -> None:
289        import gettext
290
291        translations = gettext.NullTranslations()
292
293        if hasattr(translations, "pgettext"):
294            # Python < 3.8
295            pgettext = translations.pgettext
296        else:
297
298            def pgettext(c: str, s: str) -> str:
299                return s
300
301        if hasattr(translations, "npgettext"):
302            npgettext = translations.npgettext
303        else:
304
305            def npgettext(c: str, s: str, p: str, n: int) -> str:
306                return s if n == 1 else p
307
308        self._install_callables(
309            gettext=translations.gettext,
310            ngettext=translations.ngettext,
311            newstyle=newstyle,
312            pgettext=pgettext,
313            npgettext=npgettext,
314        )
315
316    def _install_callables(
317        self,
318        gettext: t.Callable[[str], str],
319        ngettext: t.Callable[[str, str, int], str],
320        newstyle: t.Optional[bool] = None,
321        pgettext: t.Optional[t.Callable[[str, str], str]] = None,
322        npgettext: t.Optional[t.Callable[[str, str, str, int], str]] = None,
323    ) -> None:
324        if newstyle is not None:
325            self.environment.newstyle_gettext = newstyle  # type: ignore
326        if self.environment.newstyle_gettext:  # type: ignore
327            gettext = _make_new_gettext(gettext)
328            ngettext = _make_new_ngettext(ngettext)
329
330            if pgettext is not None:
331                pgettext = _make_new_pgettext(pgettext)
332
333            if npgettext is not None:
334                npgettext = _make_new_npgettext(npgettext)
335
336        self.environment.globals.update(
337            gettext=gettext, ngettext=ngettext, pgettext=pgettext, npgettext=npgettext
338        )
339
340    def _uninstall(self, translations: "_SupportedTranslations") -> None:
341        for key in ("gettext", "ngettext", "pgettext", "npgettext"):
342            self.environment.globals.pop(key, None)
343
344    def _extract(
345        self,
346        source: t.Union[str, nodes.Template],
347        gettext_functions: t.Sequence[str] = GETTEXT_FUNCTIONS,
348    ) -> t.Iterator[
349        t.Tuple[int, str, t.Union[t.Optional[str], t.Tuple[t.Optional[str], ...]]]
350    ]:
351        if isinstance(source, str):
352            source = self.environment.parse(source)
353        return extract_from_ast(source, gettext_functions)
354
355    def parse(self, parser: "Parser") -> t.Union[nodes.Node, t.List[nodes.Node]]:
356        """Parse a translatable tag."""
357        lineno = next(parser.stream).lineno
358
359        context = None
360        context_token = parser.stream.next_if("string")
361
362        if context_token is not None:
363            context = context_token.value
364
365        # find all the variables referenced.  Additionally a variable can be
366        # defined in the body of the trans block too, but this is checked at
367        # a later state.
368        plural_expr: t.Optional[nodes.Expr] = None
369        plural_expr_assignment: t.Optional[nodes.Assign] = None
370        num_called_num = False
371        variables: t.Dict[str, nodes.Expr] = {}
372        trimmed = None
373        while parser.stream.current.type != "block_end":
374            if variables:
375                parser.stream.expect("comma")
376
377            # skip colon for python compatibility
378            if parser.stream.skip_if("colon"):
379                break
380
381            token = parser.stream.expect("name")
382            if token.value in variables:
383                parser.fail(
384                    f"translatable variable {token.value!r} defined twice.",
385                    token.lineno,
386                    exc=TemplateAssertionError,
387                )
388
389            # expressions
390            if parser.stream.current.type == "assign":
391                next(parser.stream)
392                variables[token.value] = var = parser.parse_expression()
393            elif trimmed is None and token.value in ("trimmed", "notrimmed"):
394                trimmed = token.value == "trimmed"
395                continue
396            else:
397                variables[token.value] = var = nodes.Name(token.value, "load")
398
399            if plural_expr is None:
400                if isinstance(var, nodes.Call):
401                    plural_expr = nodes.Name("_trans", "load")
402                    variables[token.value] = plural_expr
403                    plural_expr_assignment = nodes.Assign(
404                        nodes.Name("_trans", "store"), var
405                    )
406                else:
407                    plural_expr = var
408                num_called_num = token.value == "num"
409
410        parser.stream.expect("block_end")
411
412        plural = None
413        have_plural = False
414        referenced = set()
415
416        # now parse until endtrans or pluralize
417        singular_names, singular = self._parse_block(parser, True)
418        if singular_names:
419            referenced.update(singular_names)
420            if plural_expr is None:
421                plural_expr = nodes.Name(singular_names[0], "load")
422                num_called_num = singular_names[0] == "num"
423
424        # if we have a pluralize block, we parse that too
425        if parser.stream.current.test("name:pluralize"):
426            have_plural = True
427            next(parser.stream)
428            if parser.stream.current.type != "block_end":
429                token = parser.stream.expect("name")
430                if token.value not in variables:
431                    parser.fail(
432                        f"unknown variable {token.value!r} for pluralization",
433                        token.lineno,
434                        exc=TemplateAssertionError,
435                    )
436                plural_expr = variables[token.value]
437                num_called_num = token.value == "num"
438            parser.stream.expect("block_end")
439            plural_names, plural = self._parse_block(parser, False)
440            next(parser.stream)
441            referenced.update(plural_names)
442        else:
443            next(parser.stream)
444
445        # register free names as simple name expressions
446        for name in referenced:
447            if name not in variables:
448                variables[name] = nodes.Name(name, "load")
449
450        if not have_plural:
451            plural_expr = None
452        elif plural_expr is None:
453            parser.fail("pluralize without variables", lineno)
454
455        if trimmed is None:
456            trimmed = self.environment.policies["ext.i18n.trimmed"]
457        if trimmed:
458            singular = self._trim_whitespace(singular)
459            if plural:
460                plural = self._trim_whitespace(plural)
461
462        node = self._make_node(
463            singular,
464            plural,
465            context,
466            variables,
467            plural_expr,
468            bool(referenced),
469            num_called_num and have_plural,
470        )
471        node.set_lineno(lineno)
472        if plural_expr_assignment is not None:
473            return [plural_expr_assignment, node]
474        else:
475            return node
476
477    def _trim_whitespace(self, string: str, _ws_re: t.Pattern[str] = _ws_re) -> str:
478        return _ws_re.sub(" ", string.strip())
479
480    def _parse_block(
481        self, parser: "Parser", allow_pluralize: bool
482    ) -> t.Tuple[t.List[str], str]:
483        """Parse until the next block tag with a given name."""
484        referenced = []
485        buf = []
486
487        while True:
488            if parser.stream.current.type == "data":
489                buf.append(parser.stream.current.value.replace("%", "%%"))
490                next(parser.stream)
491            elif parser.stream.current.type == "variable_begin":
492                next(parser.stream)
493                name = parser.stream.expect("name").value
494                referenced.append(name)
495                buf.append(f"%({name})s")
496                parser.stream.expect("variable_end")
497            elif parser.stream.current.type == "block_begin":
498                next(parser.stream)
499                block_name = (
500                    parser.stream.current.value
501                    if parser.stream.current.type == "name"
502                    else None
503                )
504                if block_name == "endtrans":
505                    break
506                elif block_name == "pluralize":
507                    if allow_pluralize:
508                        break
509                    parser.fail(
510                        "a translatable section can have only one pluralize section"
511                    )
512                elif block_name == "trans":
513                    parser.fail(
514                        "trans blocks can't be nested; did you mean `endtrans`?"
515                    )
516                parser.fail(
517                    f"control structures in translatable sections are not allowed; "
518                    f"saw `{block_name}`"
519                )
520            elif parser.stream.eos:
521                parser.fail("unclosed translation block")
522            else:
523                raise RuntimeError("internal parser error")
524
525        return referenced, concat(buf)
526
527    def _make_node(
528        self,
529        singular: str,
530        plural: t.Optional[str],
531        context: t.Optional[str],
532        variables: t.Dict[str, nodes.Expr],
533        plural_expr: t.Optional[nodes.Expr],
534        vars_referenced: bool,
535        num_called_num: bool,
536    ) -> nodes.Output:
537        """Generates a useful node from the data provided."""
538        newstyle = self.environment.newstyle_gettext  # type: ignore
539        node: nodes.Expr
540
541        # no variables referenced?  no need to escape for old style
542        # gettext invocations only if there are vars.
543        if not vars_referenced and not newstyle:
544            singular = singular.replace("%%", "%")
545            if plural:
546                plural = plural.replace("%%", "%")
547
548        func_name = "gettext"
549        func_args: t.List[nodes.Expr] = [nodes.Const(singular)]
550
551        if context is not None:
552            func_args.insert(0, nodes.Const(context))
553            func_name = f"p{func_name}"
554
555        if plural_expr is not None:
556            func_name = f"n{func_name}"
557            func_args.extend((nodes.Const(plural), plural_expr))
558
559        node = nodes.Call(nodes.Name(func_name, "load"), func_args, [], None, None)
560
561        # in case newstyle gettext is used, the method is powerful
562        # enough to handle the variable expansion and autoescape
563        # handling itself
564        if newstyle:
565            for key, value in variables.items():
566                # the function adds that later anyways in case num was
567                # called num, so just skip it.
568                if num_called_num and key == "num":
569                    continue
570                node.kwargs.append(nodes.Keyword(key, value))
571
572        # otherwise do that here
573        else:
574            # mark the return value as safe if we are in an
575            # environment with autoescaping turned on
576            node = nodes.MarkSafeIfAutoescape(node)
577            if variables:
578                node = nodes.Mod(
579                    node,
580                    nodes.Dict(
581                        [
582                            nodes.Pair(nodes.Const(key), value)
583                            for key, value in variables.items()
584                        ]
585                    ),
586                )
587        return nodes.Output([node])

This extension adds gettext support to Jinja.

InternationalizationExtension(environment: jinja2.environment.Environment)
258    def __init__(self, environment: Environment) -> None:
259        super().__init__(environment)
260        environment.globals["_"] = _gettext_alias
261        environment.extend(
262            install_gettext_translations=self._install,
263            install_null_translations=self._install_null,
264            install_gettext_callables=self._install_callables,
265            uninstall_gettext_translations=self._uninstall,
266            extract_translations=self._extract,
267            newstyle_gettext=False,
268        )
tags = {'trans'}
def parse( self, parser: jinja2.parser.Parser) -> Union[jinja2.nodes.Node, List[jinja2.nodes.Node]]:
355    def parse(self, parser: "Parser") -> t.Union[nodes.Node, t.List[nodes.Node]]:
356        """Parse a translatable tag."""
357        lineno = next(parser.stream).lineno
358
359        context = None
360        context_token = parser.stream.next_if("string")
361
362        if context_token is not None:
363            context = context_token.value
364
365        # find all the variables referenced.  Additionally a variable can be
366        # defined in the body of the trans block too, but this is checked at
367        # a later state.
368        plural_expr: t.Optional[nodes.Expr] = None
369        plural_expr_assignment: t.Optional[nodes.Assign] = None
370        num_called_num = False
371        variables: t.Dict[str, nodes.Expr] = {}
372        trimmed = None
373        while parser.stream.current.type != "block_end":
374            if variables:
375                parser.stream.expect("comma")
376
377            # skip colon for python compatibility
378            if parser.stream.skip_if("colon"):
379                break
380
381            token = parser.stream.expect("name")
382            if token.value in variables:
383                parser.fail(
384                    f"translatable variable {token.value!r} defined twice.",
385                    token.lineno,
386                    exc=TemplateAssertionError,
387                )
388
389            # expressions
390            if parser.stream.current.type == "assign":
391                next(parser.stream)
392                variables[token.value] = var = parser.parse_expression()
393            elif trimmed is None and token.value in ("trimmed", "notrimmed"):
394                trimmed = token.value == "trimmed"
395                continue
396            else:
397                variables[token.value] = var = nodes.Name(token.value, "load")
398
399            if plural_expr is None:
400                if isinstance(var, nodes.Call):
401                    plural_expr = nodes.Name("_trans", "load")
402                    variables[token.value] = plural_expr
403                    plural_expr_assignment = nodes.Assign(
404                        nodes.Name("_trans", "store"), var
405                    )
406                else:
407                    plural_expr = var
408                num_called_num = token.value == "num"
409
410        parser.stream.expect("block_end")
411
412        plural = None
413        have_plural = False
414        referenced = set()
415
416        # now parse until endtrans or pluralize
417        singular_names, singular = self._parse_block(parser, True)
418        if singular_names:
419            referenced.update(singular_names)
420            if plural_expr is None:
421                plural_expr = nodes.Name(singular_names[0], "load")
422                num_called_num = singular_names[0] == "num"
423
424        # if we have a pluralize block, we parse that too
425        if parser.stream.current.test("name:pluralize"):
426            have_plural = True
427            next(parser.stream)
428            if parser.stream.current.type != "block_end":
429                token = parser.stream.expect("name")
430                if token.value not in variables:
431                    parser.fail(
432                        f"unknown variable {token.value!r} for pluralization",
433                        token.lineno,
434                        exc=TemplateAssertionError,
435                    )
436                plural_expr = variables[token.value]
437                num_called_num = token.value == "num"
438            parser.stream.expect("block_end")
439            plural_names, plural = self._parse_block(parser, False)
440            next(parser.stream)
441            referenced.update(plural_names)
442        else:
443            next(parser.stream)
444
445        # register free names as simple name expressions
446        for name in referenced:
447            if name not in variables:
448                variables[name] = nodes.Name(name, "load")
449
450        if not have_plural:
451            plural_expr = None
452        elif plural_expr is None:
453            parser.fail("pluralize without variables", lineno)
454
455        if trimmed is None:
456            trimmed = self.environment.policies["ext.i18n.trimmed"]
457        if trimmed:
458            singular = self._trim_whitespace(singular)
459            if plural:
460                plural = self._trim_whitespace(plural)
461
462        node = self._make_node(
463            singular,
464            plural,
465            context,
466            variables,
467            plural_expr,
468            bool(referenced),
469            num_called_num and have_plural,
470        )
471        node.set_lineno(lineno)
472        if plural_expr_assignment is not None:
473            return [plural_expr_assignment, node]
474        else:
475            return node

Parse a translatable tag.

identifier: ClassVar[str] = 'InternationalizationExtension'
class ExprStmtExtension(Extension):
590class ExprStmtExtension(Extension):
591    """Adds a `do` tag to Jinja that works like the print statement just
592    that it doesn't print the return value.
593    """
594
595    tags = {"do"}
596
597    def parse(self, parser: "Parser") -> nodes.ExprStmt:
598        node = nodes.ExprStmt(lineno=next(parser.stream).lineno)
599        node.node = parser.parse_tuple()
600        return node

Adds a do tag to Jinja that works like the print statement just that it doesn't print the return value.

tags = {'do'}
def parse(self, parser: jinja2.parser.Parser) -> jinja2.nodes.ExprStmt:
597    def parse(self, parser: "Parser") -> nodes.ExprStmt:
598        node = nodes.ExprStmt(lineno=next(parser.stream).lineno)
599        node.node = parser.parse_tuple()
600        return node

If any of the tags matched this method is called with the parser as first argument. The token the parser stream is pointing at is the name token that matched. This method has to return one or a list of multiple nodes.

identifier: ClassVar[str] = 'ExprStmtExtension'
class LoopControlExtension(Extension):
603class LoopControlExtension(Extension):
604    """Adds break and continue to the template engine."""
605
606    tags = {"break", "continue"}
607
608    def parse(self, parser: "Parser") -> t.Union[nodes.Break, nodes.Continue]:
609        token = next(parser.stream)
610        if token.value == "break":
611            return nodes.Break(lineno=token.lineno)
612        return nodes.Continue(lineno=token.lineno)

Adds break and continue to the template engine.

tags = {'continue', 'break'}
def parse( self, parser: jinja2.parser.Parser) -> Union[jinja2.nodes.Break, jinja2.nodes.Continue]:
608    def parse(self, parser: "Parser") -> t.Union[nodes.Break, nodes.Continue]:
609        token = next(parser.stream)
610        if token.value == "break":
611            return nodes.Break(lineno=token.lineno)
612        return nodes.Continue(lineno=token.lineno)

If any of the tags matched this method is called with the parser as first argument. The token the parser stream is pointing at is the name token that matched. This method has to return one or a list of multiple nodes.

identifier: ClassVar[str] = 'LoopControlExtension'
class DebugExtension(Extension):
615class DebugExtension(Extension):
616    """A ``{% debug %}`` tag that dumps the available variables,
617    filters, and tests.
618
619    .. code-block:: html+jinja
620
621        <pre>{% debug %}</pre>
622
623    .. code-block:: text
624
625        {'context': {'cycler': <class 'jinja2.utils.Cycler'>,
626                     ...,
627                     'namespace': <class 'jinja2.utils.Namespace'>},
628         'filters': ['abs', 'attr', 'batch', 'capitalize', 'center', 'count', 'd',
629                     ..., 'urlencode', 'urlize', 'wordcount', 'wordwrap', 'xmlattr'],
630         'tests': ['!=', '<', '<=', '==', '>', '>=', 'callable', 'defined',
631                   ..., 'odd', 'sameas', 'sequence', 'string', 'undefined', 'upper']}
632
633    .. versionadded:: 2.11.0
634    """
635
636    tags = {"debug"}
637
638    def parse(self, parser: "Parser") -> nodes.Output:
639        lineno = parser.stream.expect("name:debug").lineno
640        context = nodes.ContextReference()
641        result = self.call_method("_render", [context], lineno=lineno)
642        return nodes.Output([result], lineno=lineno)
643
644    def _render(self, context: Context) -> str:
645        result = {
646            "context": context.get_all(),
647            "filters": sorted(self.environment.filters.keys()),
648            "tests": sorted(self.environment.tests.keys()),
649        }
650
651        # Set the depth since the intent is to show the top few names.
652        return pprint.pformat(result, depth=3, compact=True)

A {% debug %} tag that dumps the available variables, filters, and tests.

<pre>{% debug %}</pre>
{'context': {'cycler': <class 'jinja2.utils.Cycler'>,
             ...,
             'namespace': <class 'jinja2.utils.Namespace'>},
 'filters': ['abs', 'attr', 'batch', 'capitalize', 'center', 'count', 'd',
             ..., 'urlencode', 'urlize', 'wordcount', 'wordwrap', 'xmlattr'],
 'tests': ['!=', '<', '<=', '==', '>', '>=', 'callable', 'defined',
           ..., 'odd', 'sameas', 'sequence', 'string', 'undefined', 'upper']}

New in version 2.11.0.

tags = {'debug'}
def parse(self, parser: jinja2.parser.Parser) -> jinja2.nodes.Output:
638    def parse(self, parser: "Parser") -> nodes.Output:
639        lineno = parser.stream.expect("name:debug").lineno
640        context = nodes.ContextReference()
641        result = self.call_method("_render", [context], lineno=lineno)
642        return nodes.Output([result], lineno=lineno)

If any of the tags matched this method is called with the parser as first argument. The token the parser stream is pointing at is the name token that matched. This method has to return one or a list of multiple nodes.

identifier: ClassVar[str] = 'DebugExtension'
def extract_from_ast( ast: jinja2.nodes.Template, gettext_functions: Sequence[str] = ('_', 'gettext', 'ngettext', 'pgettext', 'npgettext'), babel_style: bool = True) -> Iterator[Tuple[int, str, Union[str, NoneType, Tuple[Optional[str], ...]]]]:
655def extract_from_ast(
656    ast: nodes.Template,
657    gettext_functions: t.Sequence[str] = GETTEXT_FUNCTIONS,
658    babel_style: bool = True,
659) -> t.Iterator[
660    t.Tuple[int, str, t.Union[t.Optional[str], t.Tuple[t.Optional[str], ...]]]
661]:
662    """Extract localizable strings from the given template node.  Per
663    default this function returns matches in babel style that means non string
664    parameters as well as keyword arguments are returned as `None`.  This
665    allows Babel to figure out what you really meant if you are using
666    gettext functions that allow keyword arguments for placeholder expansion.
667    If you don't want that behavior set the `babel_style` parameter to `False`
668    which causes only strings to be returned and parameters are always stored
669    in tuples.  As a consequence invalid gettext calls (calls without a single
670    string parameter or string parameters after non-string parameters) are
671    skipped.
672
673    This example explains the behavior:
674
675    >>> from jinja2 import Environment
676    >>> env = Environment()
677    >>> node = env.parse('{{ (_("foo"), _(), ngettext("foo", "bar", 42)) }}')
678    >>> list(extract_from_ast(node))
679    [(1, '_', 'foo'), (1, '_', ()), (1, 'ngettext', ('foo', 'bar', None))]
680    >>> list(extract_from_ast(node, babel_style=False))
681    [(1, '_', ('foo',)), (1, 'ngettext', ('foo', 'bar'))]
682
683    For every string found this function yields a ``(lineno, function,
684    message)`` tuple, where:
685
686    * ``lineno`` is the number of the line on which the string was found,
687    * ``function`` is the name of the ``gettext`` function used (if the
688      string was extracted from embedded Python code), and
689    *   ``message`` is the string, or a tuple of strings for functions
690         with multiple string arguments.
691
692    This extraction function operates on the AST and is because of that unable
693    to extract any comments.  For comment support you have to use the babel
694    extraction interface or extract comments yourself.
695    """
696    out: t.Union[t.Optional[str], t.Tuple[t.Optional[str], ...]]
697
698    for node in ast.find_all(nodes.Call):
699        if (
700            not isinstance(node.node, nodes.Name)
701            or node.node.name not in gettext_functions
702        ):
703            continue
704
705        strings: t.List[t.Optional[str]] = []
706
707        for arg in node.args:
708            if isinstance(arg, nodes.Const) and isinstance(arg.value, str):
709                strings.append(arg.value)
710            else:
711                strings.append(None)
712
713        for _ in node.kwargs:
714            strings.append(None)
715        if node.dyn_args is not None:
716            strings.append(None)
717        if node.dyn_kwargs is not None:
718            strings.append(None)
719
720        if not babel_style:
721            out = tuple(x for x in strings if x is not None)
722
723            if not out:
724                continue
725        else:
726            if len(strings) == 1:
727                out = strings[0]
728            else:
729                out = tuple(strings)
730
731        yield node.lineno, node.node.name, out

Extract localizable strings from the given template node. Per default this function returns matches in babel style that means non string parameters as well as keyword arguments are returned as None. This allows Babel to figure out what you really meant if you are using gettext functions that allow keyword arguments for placeholder expansion. If you don't want that behavior set the babel_style parameter to False which causes only strings to be returned and parameters are always stored in tuples. As a consequence invalid gettext calls (calls without a single string parameter or string parameters after non-string parameters) are skipped.

This example explains the behavior:

>>> from jinja2 import Environment
>>> env = Environment()
>>> node = env.parse('{{ (_("foo"), _(), ngettext("foo", "bar", 42)) }}')
>>> list(extract_from_ast(node))
[(1, '_', 'foo'), (1, '_', ()), (1, 'ngettext', ('foo', 'bar', None))]
>>> list(extract_from_ast(node, babel_style=False))
[(1, '_', ('foo',)), (1, 'ngettext', ('foo', 'bar'))]

For every string found this function yields a (lineno, function, message) tuple, where:

  • lineno is the number of the line on which the string was found,
  • function is the name of the gettext function used (if the string was extracted from embedded Python code), and
  • message is the string, or a tuple of strings for functions with multiple string arguments.

This extraction function operates on the AST and is because of that unable to extract any comments. For comment support you have to use the babel extraction interface or extract comments yourself.

def babel_extract( fileobj: <class 'BinaryIO'>, keywords: Sequence[str], comment_tags: Sequence[str], options: Dict[str, Any]) -> Iterator[Tuple[int, str, Union[str, NoneType, Tuple[Optional[str], ...]], List[str]]]:
774def babel_extract(
775    fileobj: t.BinaryIO,
776    keywords: t.Sequence[str],
777    comment_tags: t.Sequence[str],
778    options: t.Dict[str, t.Any],
779) -> t.Iterator[
780    t.Tuple[
781        int, str, t.Union[t.Optional[str], t.Tuple[t.Optional[str], ...]], t.List[str]
782    ]
783]:
784    """Babel extraction method for Jinja templates.
785
786    .. versionchanged:: 2.3
787       Basic support for translation comments was added.  If `comment_tags`
788       is now set to a list of keywords for extraction, the extractor will
789       try to find the best preceding comment that begins with one of the
790       keywords.  For best results, make sure to not have more than one
791       gettext call in one line of code and the matching comment in the
792       same line or the line before.
793
794    .. versionchanged:: 2.5.1
795       The `newstyle_gettext` flag can be set to `True` to enable newstyle
796       gettext calls.
797
798    .. versionchanged:: 2.7
799       A `silent` option can now be provided.  If set to `False` template
800       syntax errors are propagated instead of being ignored.
801
802    :param fileobj: the file-like object the messages should be extracted from
803    :param keywords: a list of keywords (i.e. function names) that should be
804                     recognized as translation functions
805    :param comment_tags: a list of translator tags to search for and include
806                         in the results.
807    :param options: a dictionary of additional options (optional)
808    :return: an iterator over ``(lineno, funcname, message, comments)`` tuples.
809             (comments will be empty currently)
810    """
811    extensions: t.Dict[t.Type[Extension], None] = {}
812
813    for extension_name in options.get("extensions", "").split(","):
814        extension_name = extension_name.strip()
815
816        if not extension_name:
817            continue
818
819        extensions[import_string(extension_name)] = None
820
821    if InternationalizationExtension not in extensions:
822        extensions[InternationalizationExtension] = None
823
824    def getbool(options: t.Mapping[str, str], key: str, default: bool = False) -> bool:
825        return options.get(key, str(default)).lower() in {"1", "on", "yes", "true"}
826
827    silent = getbool(options, "silent", True)
828    environment = Environment(
829        options.get("block_start_string", defaults.BLOCK_START_STRING),
830        options.get("block_end_string", defaults.BLOCK_END_STRING),
831        options.get("variable_start_string", defaults.VARIABLE_START_STRING),
832        options.get("variable_end_string", defaults.VARIABLE_END_STRING),
833        options.get("comment_start_string", defaults.COMMENT_START_STRING),
834        options.get("comment_end_string", defaults.COMMENT_END_STRING),
835        options.get("line_statement_prefix") or defaults.LINE_STATEMENT_PREFIX,
836        options.get("line_comment_prefix") or defaults.LINE_COMMENT_PREFIX,
837        getbool(options, "trim_blocks", defaults.TRIM_BLOCKS),
838        getbool(options, "lstrip_blocks", defaults.LSTRIP_BLOCKS),
839        defaults.NEWLINE_SEQUENCE,
840        getbool(options, "keep_trailing_newline", defaults.KEEP_TRAILING_NEWLINE),
841        tuple(extensions),
842        cache_size=0,
843        auto_reload=False,
844    )
845
846    if getbool(options, "trimmed"):
847        environment.policies["ext.i18n.trimmed"] = True
848    if getbool(options, "newstyle_gettext"):
849        environment.newstyle_gettext = True  # type: ignore
850
851    source = fileobj.read().decode(options.get("encoding", "utf-8"))
852    try:
853        node = environment.parse(source)
854        tokens = list(environment.lex(environment.preprocess(source)))
855    except TemplateSyntaxError:
856        if not silent:
857            raise
858        # skip templates with syntax errors
859        return
860
861    finder = _CommentFinder(tokens, comment_tags)
862    for lineno, func, message in extract_from_ast(node, keywords):
863        yield lineno, func, message, finder.find_comments(lineno)

Babel extraction method for Jinja templates.

Changed in version 2.3: Basic support for translation comments was added. If comment_tags is now set to a list of keywords for extraction, the extractor will try to find the best preceding comment that begins with one of the keywords. For best results, make sure to not have more than one gettext call in one line of code and the matching comment in the same line or the line before.

Changed in version 2.5.1: The newstyle_gettext flag can be set to True to enable newstyle gettext calls.

Changed in version 2.7: A silent option can now be provided. If set to False template syntax errors are propagated instead of being ignored.

Parameters
  • fileobj: the file-like object the messages should be extracted from
  • keywords: a list of keywords (i.e. function names) that should be recognized as translation functions
  • comment_tags: a list of translator tags to search for and include in the results.
  • options: a dictionary of additional options (optional)
Returns

an iterator over (lineno, funcname, message, comments) tuples. (comments will be empty currently)

do = <class 'ExprStmtExtension'>
loopcontrols = <class 'LoopControlExtension'>
debug = <class 'DebugExtension'>