lib.rs - mozsearch

mozilla-central/third_party/rust/rinja_parser/src/lib.rs (file symbol)

Enable keyboard shortcuts

Source code

File a bug in Firefox Build System :: General

Revision control

Copy as Markdown

Other Tools

#![cfg_attr(docsrs, feature(doc_cfg, doc_auto_cfg))]

#![deny(elided_lifetimes_in_paths)]

#![deny(unreachable_pub)]

use std::borrow::Cow;

use std::cell::Cell;

use std::env::current_dir;

use std::ops::{Deref, DerefMut};

use std::path::Path;

use std::sync::Arc;

use std::{fmt, str};

use nom::branch::alt;

use nom::bytes::complete::{escaped, is_not, tag, take_till, take_while_m_n};

use nom::character::complete::{anychar, char, one_of, satisfy};

use nom::combinator::{consumed, cut, fail, map, not, opt, recognize, value};

use nom::error::{ErrorKind, FromExternalError};

use nom::multi::{many0_count, many1};

use nom::sequence::{delimited, pair, preceded, tuple};

use nom::{AsChar, InputTakeAtPosition};

pub mod expr;

pub use expr::{Expr, Filter};

mod memchr_splitter;

pub mod node;

pub use node::Node;

mod target;

pub use target::Target;

#[cfg(test)]

mod tests;

mod _parsed {

    use std::path::Path;

    use std::sync::Arc;

    use std::{fmt, mem};

    use super::node::Node;

    use super::{Ast, ParseError, Syntax};

    pub struct Parsed {

        // `source` must outlive `ast`, so `ast` must be declared before `source`

        ast: Ast<'static>,

        #[allow(dead_code)]

        source: Arc<str>,

    impl Parsed {

        /// If `file_path` is `None`, it means the `source` is an inline template. Therefore, if

        /// a parsing error occurs, we won't display the path as it wouldn't be useful.

        pub fn new(

            source: Arc<str>,

            file_path: Option<Arc<Path>>,

            syntax: &Syntax<'_>,

        ) -> Result<Self, ParseError> {

            // Self-referential borrowing: `self` will keep the source alive as `String`,

            // internally we will transmute it to `&'static str` to satisfy the compiler.

            // However, we only expose the nodes with a lifetime limited to `self`.

            let src = unsafe { mem::transmute::<&str, &'static str>(source.as_ref()) };

            let ast = Ast::from_str(src, file_path, syntax)?;

            Ok(Self { ast, source })

        // The return value's lifetime must be limited to `self` to uphold the unsafe invariant.

        #[must_use]

        pub fn nodes(&self) -> &[Node<'_>] {

            &self.ast.nodes

        #[must_use]

        pub fn source(&self) -> &str {

            &self.source

    impl fmt::Debug for Parsed {

        fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {

            f.debug_struct("Parsed")

                .field("nodes", &self.ast.nodes)

                .finish_non_exhaustive()

    impl PartialEq for Parsed {

        fn eq(&self, other: &Self) -> bool {

            self.ast.nodes == other.ast.nodes

    impl Default for Parsed {

        fn default() -> Self {

            Self {

                ast: Ast::default(),

                source: "".into(),

pub use _parsed::Parsed;

#[derive(Debug, Default)]

pub struct Ast<'a> {

    nodes: Vec<Node<'a>>,

impl<'a> Ast<'a> {

    /// If `file_path` is `None`, it means the `source` is an inline template. Therefore, if

    /// a parsing error occurs, we won't display the path as it wouldn't be useful.

    pub fn from_str(

        src: &'a str,

        file_path: Option<Arc<Path>>,

        syntax: &Syntax<'_>,

    ) -> Result<Self, ParseError> {

        match Node::parse_template(src, &State::new(syntax)) {

            Ok(("", nodes)) => Ok(Self { nodes }),

            Ok(_) | Err(nom::Err::Incomplete(_)) => unreachable!(),

            Err(

                nom::Err::Error(ErrorContext { input, message, .. })

                | nom::Err::Failure(ErrorContext { input, message, .. }),

            ) => Err(ParseError {

                message,

                offset: src.len() - input.len(),

                file_path,

}),

    #[must_use]

    pub fn nodes(&self) -> &[Node<'a>] {

        &self.nodes

/// Struct used to wrap types with their associated "span" which is used when generating errors

/// in the code generation.

pub struct WithSpan<'a, T> {

    inner: T,

    span: &'a str,

impl<'a, T> WithSpan<'a, T> {

    pub const fn new(inner: T, span: &'a str) -> Self {

        Self { inner, span }

    pub fn span(&self) -> &'a str {

        self.span

    pub fn deconstruct(self) -> (T, &'a str) {

        let Self { inner, span } = self;

        (inner, span)

impl<'a, T> Deref for WithSpan<'a, T> {

    type Target = T;

    fn deref(&self) -> &Self::Target {

        &self.inner

impl<'a, T> DerefMut for WithSpan<'a, T> {

    fn deref_mut(&mut self) -> &mut Self::Target {

        &mut self.inner

impl<'a, T: fmt::Debug> fmt::Debug for WithSpan<'a, T> {

    fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {

        write!(f, "{:?}", self.inner)

impl<'a, T: Clone> Clone for WithSpan<'a, T> {

    fn clone(&self) -> Self {

        Self {

            inner: self.inner.clone(),

            span: self.span,

impl<'a, T: PartialEq> PartialEq for WithSpan<'a, T> {

    fn eq(&self, other: &Self) -> bool {

        // We never want to compare the span information.

        self.inner == other.inner

#[derive(Debug, Clone, PartialEq, Eq)]

pub struct ParseError {

    pub message: Option<Cow<'static, str>>,

    pub offset: usize,

    pub file_path: Option<Arc<Path>>,

impl std::error::Error for ParseError {}

impl fmt::Display for ParseError {

    fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {

        let ParseError {

            message,

            file_path,

            offset,

        } = self;

        if let Some(message) = message {

            writeln!(f, "{message}")?;

        let path = file_path

            .as_ref()

            .and_then(|path| Some(strip_common(&current_dir().ok()?, path)));

        match path {

            Some(path) => write!(f, "failed to parse template source\n  --> {path}@{offset}"),

            None => write!(f, "failed to parse template source near offset {offset}"),

pub(crate) type ParseErr<'a> = nom::Err<ErrorContext<'a>>;

pub(crate) type ParseResult<'a, T = &'a str> = Result<(&'a str, T), ParseErr<'a>>;

/// This type is used to handle `nom` errors and in particular to add custom error messages.

/// It used to generate `ParserError`.

///

/// It cannot be used to replace `ParseError` because it expects a generic, which would make

/// `rinja`'s users experience less good (since this generic is only needed for `nom`).

#[derive(Debug)]

pub(crate) struct ErrorContext<'a> {

    pub(crate) input: &'a str,

    pub(crate) message: Option<Cow<'static, str>>,

impl<'a> ErrorContext<'a> {

    fn unclosed(kind: &str, tag: &str, i: &'a str) -> Self {

        Self::new(format!("unclosed {kind}, missing {tag:?}"), i)

    fn new(message: impl Into<Cow<'static, str>>, input: &'a str) -> Self {

        Self {

            input,

            message: Some(message.into()),

impl<'a> nom::error::ParseError<&'a str> for ErrorContext<'a> {

    fn from_error_kind(input: &'a str, _code: ErrorKind) -> Self {

        Self {

            input,

            message: None,

    fn append(_: &'a str, _: ErrorKind, other: Self) -> Self {

        other

impl<'a, E: std::fmt::Display> FromExternalError<&'a str, E> for ErrorContext<'a> {

    fn from_external_error(input: &'a str, _kind: ErrorKind, e: E) -> Self {

        Self {

            input,

            message: Some(Cow::Owned(e.to_string())),

impl<'a> From<ErrorContext<'a>> for nom::Err<ErrorContext<'a>> {

    fn from(cx: ErrorContext<'a>) -> Self {

        Self::Failure(cx)

fn is_ws(c: char) -> bool {

    matches!(c, ' ' | '\t' | '\r' | '\n')

fn not_ws(c: char) -> bool {

    !is_ws(c)

fn ws<'a, O>(

    inner: impl FnMut(&'a str) -> ParseResult<'a, O>,

) -> impl FnMut(&'a str) -> ParseResult<'a, O> {

    delimited(take_till(not_ws), inner, take_till(not_ws))

/// Skips input until `end` was found, but does not consume it.

/// Returns tuple that would be returned when parsing `end`.

fn skip_till<'a, 'b, O>(

    candidate_finder: impl crate::memchr_splitter::Splitter,

    end: impl FnMut(&'a str) -> ParseResult<'a, O>,

) -> impl FnMut(&'a str) -> ParseResult<'a, (&'a str, O)> {

    let mut next = alt((map(end, Some), map(anychar, |_| None)));

    move |start: &'a str| {

        let mut i = start;

        loop {

            i = match candidate_finder.split(i) {

                Some((_, j)) => j,

                None => return Err(nom::Err::Error(ErrorContext::new("`end` not found`", i))),

};

            i = match next(i)? {

                (j, Some(lookahead)) => return Ok((i, (j, lookahead))),

                (j, None) => j,

};

fn keyword<'a>(k: &'a str) -> impl FnMut(&'a str) -> ParseResult<'a> {

    move |i: &'a str| -> ParseResult<'a> {

        let (j, v) = identifier(i)?;

        if k == v { Ok((j, v)) } else { fail(i) }

fn identifier(input: &str) -> ParseResult<'_> {

    fn start(s: &str) -> ParseResult<'_> {

        s.split_at_position1_complete(

            |c| !(c.is_alpha() || c == '_' || c >= '\u{0080}'),

            nom::error::ErrorKind::Alpha,

    fn tail(s: &str) -> ParseResult<'_> {

        s.split_at_position1_complete(

            |c| !(c.is_alphanum() || c == '_' || c >= '\u{0080}'),

            nom::error::ErrorKind::Alpha,

    recognize(pair(start, opt(tail)))(input)

fn bool_lit(i: &str) -> ParseResult<'_> {

    alt((keyword("false"), keyword("true")))(i)

#[derive(Debug, Clone, Copy, PartialEq)]

pub enum Num<'a> {

    Int(&'a str, Option<IntKind>),

    Float(&'a str, Option<FloatKind>),

fn num_lit<'a>(start: &'a str) -> ParseResult<'a, Num<'a>> {

    fn num_lit_suffix<'a, T: Copy>(

        kind: &'a str,

        list: &[(&str, T)],

        start: &'a str,

        i: &'a str,

    ) -> ParseResult<'a, T> {

        let (i, suffix) = identifier(i)?;

        if let Some(value) = list

            .iter()

            .copied()

            .find_map(|(name, value)| (name == suffix).then_some(value))

            Ok((i, value))

        } else {

            Err(nom::Err::Failure(ErrorContext::new(

                format!("unknown {kind} suffix `{suffix}`"),

                start,

)))

    // Equivalent to <https://github.com/rust-lang/rust/blob/e3f909b2bbd0b10db6f164d466db237c582d3045/compiler/rustc_lexer/src/lib.rs#L587-L620>.

    let int_with_base = pair(opt(char('-')), |i| {

        let (i, (kind, base)) = consumed(preceded(

            char('0'),

            alt((

                value(2, char('b')),

                value(8, char('o')),

                value(16, char('x')),

)),

        ))(i)?;

        match opt(separated_digits(base, false))(i)? {

            (i, Some(_)) => Ok((i, ())),

            (_, None) => Err(nom::Err::Failure(ErrorContext::new(

                format!("expected digits after `{kind}`"),

                start,

            ))),

});

    // Equivalent to <https://github.com/rust-lang/rust/blob/e3f909b2bbd0b10db6f164d466db237c582d3045/compiler/rustc_lexer/src/lib.rs#L626-L653>:

    // no `_` directly after the decimal point `.`, or between `e` and `+/-`.

    let float = |i: &'a str| -> ParseResult<'a, ()> {

        let (i, has_dot) = opt(pair(char('.'), separated_digits(10, true)))(i)?;

        let (i, has_exp) = opt(|i| {

            let (i, (kind, op)) = pair(one_of("eE"), opt(one_of("+-")))(i)?;

            match opt(separated_digits(10, op.is_none()))(i)? {

                (i, Some(_)) => Ok((i, ())),

                (_, None) => Err(nom::Err::Failure(ErrorContext::new(

                    format!("expected decimal digits, `+` or `-` after exponent `{kind}`"),

                    start,

                ))),

        })(i)?;

        match (has_dot, has_exp) {

            (Some(_), _) | (_, Some(())) => Ok((i, ())),

            _ => fail(start),

};

    let (i, num) = if let Ok((i, Some(num))) = opt(recognize(int_with_base))(start) {

        let (i, suffix) = opt(|i| num_lit_suffix("integer", INTEGER_TYPES, start, i))(i)?;

        (i, Num::Int(num, suffix))

    } else {

        let (i, (num, float)) = consumed(preceded(

            pair(opt(char('-')), separated_digits(10, true)),

            opt(float),

        ))(start)?;

        if float.is_some() {

            let (i, suffix) = opt(|i| num_lit_suffix("float", FLOAT_TYPES, start, i))(i)?;

            (i, Num::Float(num, suffix))

        } else {

            let (i, suffix) = opt(|i| num_lit_suffix("number", NUM_TYPES, start, i))(i)?;

            match suffix {

                Some(NumKind::Int(kind)) => (i, Num::Int(num, Some(kind))),

                Some(NumKind::Float(kind)) => (i, Num::Float(num, Some(kind))),

                None => (i, Num::Int(num, None)),

};

    Ok((i, num))

/// Underscore separated digits of the given base, unless `start` is true this may start

/// with an underscore.

fn separated_digits(radix: u32, start: bool) -> impl Fn(&str) -> ParseResult<'_> {

    move |i| {

        recognize(tuple((

            |i| match start {

                true => Ok((i, 0)),

                false => many0_count(char('_'))(i),

},

            satisfy(|ch| ch.is_digit(radix)),

            many0_count(satisfy(|ch| ch == '_' || ch.is_digit(radix))),

        )))(i)

#[derive(Clone, Copy, Debug, PartialEq)]

pub enum StrPrefix {

    Binary,

    CLike,

impl StrPrefix {

    #[must_use]

    pub fn to_char(self) -> char {

        match self {

            Self::Binary => 'b',

            Self::CLike => 'c',

impl fmt::Display for StrPrefix {

    fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {

        use std::fmt::Write;

        f.write_char(self.to_char())

#[derive(Clone, Debug, PartialEq)]

pub struct StrLit<'a> {

    pub prefix: Option<StrPrefix>,

    pub content: &'a str,

fn str_lit_without_prefix(i: &str) -> ParseResult<'_> {

    let (i, s) = delimited(

        char('"'),

        opt(escaped(is_not("\\\""), '\\', anychar)),

        char('"'),

    )(i)?;

    Ok((i, s.unwrap_or_default()))

fn str_lit(i: &str) -> Result<(&str, StrLit<'_>), ParseErr<'_>> {

    let (i, (prefix, content)) =

        tuple((opt(alt((char('b'), char('c')))), str_lit_without_prefix))(i)?;

    let prefix = match prefix {

        Some('b') => Some(StrPrefix::Binary),

        Some('c') => Some(StrPrefix::CLike),

        _ => None,

};

    Ok((i, StrLit { prefix, content }))

#[derive(Clone, Copy, Debug, PartialEq)]

pub enum CharPrefix {

    Binary,

#[derive(Clone, Debug, PartialEq)]

pub struct CharLit<'a> {

    pub prefix: Option<CharPrefix>,

    pub content: &'a str,

// Information about allowed character escapes is available at:

// <https://doc.rust-lang.org/reference/tokens.html#character-literals>.

fn char_lit(i: &str) -> Result<(&str, CharLit<'_>), ParseErr<'_>> {

    let start = i;

    let (i, (b_prefix, s)) = tuple((

        opt(char('b')),

        delimited(

            char('\''),

            opt(escaped(is_not("\\\'"), '\\', anychar)),

            char('\''),

),

    ))(i)?;

    let Some(s) = s else {

        return Err(nom::Err::Failure(ErrorContext::new(

            "empty character literal",

            start,

        )));

};

    let Ok(("", c)) = Char::parse(s) else {

        return Err(nom::Err::Failure(ErrorContext::new(

            "invalid character",

            start,

        )));

};

    let (nb, max_value, err1, err2) = match c {

        Char::Literal | Char::Escaped => {

            return Ok((i, CharLit {

                prefix: b_prefix.map(|_| CharPrefix::Binary),

                content: s,

            }));

        Char::AsciiEscape(nb) => (

nb,

            // `0x7F` is the maximum value for a `\x` escaped character.

            0x7F,

            "invalid character in ascii escape",

            "must be a character in the range [\\x00-\\x7f]",

),

        Char::UnicodeEscape(nb) => (

nb,

            // `0x10FFFF` is the maximum value for a `\u` escaped character.

            0x0010_FFFF,

            "invalid character in unicode escape",

            "unicode escape must be at most 10FFFF",

),

};

    let Ok(nb) = u32::from_str_radix(nb, 16) else {

        return Err(nom::Err::Failure(ErrorContext::new(err1, start)));

};

    if nb > max_value {

        return Err(nom::Err::Failure(ErrorContext::new(err2, start)));

    Ok((i, CharLit {

        prefix: b_prefix.map(|_| CharPrefix::Binary),

        content: s,

}))

/// Represents the different kinds of char declarations:

enum Char<'a> {

    /// Any character that is not escaped.

    Literal,

    /// An escaped character (like `\n`) which doesn't require any extra check.

    Escaped,

    /// Ascii escape (like `\x12`).

    AsciiEscape(&'a str),

    /// Unicode escape (like `\u{12}`).

    UnicodeEscape(&'a str),

impl<'a> Char<'a> {

    fn parse(i: &'a str) -> ParseResult<'a, Self> {

        if i.chars().count() == 1 {

            return Ok(("", Self::Literal));

        map(

            tuple((

                char('\\'),

                alt((

                    map(char('n'), |_| Self::Escaped),

                    map(char('r'), |_| Self::Escaped),

                    map(char('t'), |_| Self::Escaped),

                    map(char('\\'), |_| Self::Escaped),

                    map(char('0'), |_| Self::Escaped),

                    map(char('\''), |_| Self::Escaped),

                    // Not useful but supported by rust.

                    map(char('"'), |_| Self::Escaped),

                    map(

                        tuple((

                            char('x'),

                            take_while_m_n(2, 2, |c: char| c.is_ascii_hexdigit()),

)),

                        |(_, s)| Self::AsciiEscape(s),

),

                    map(

                        tuple((

                            tag("u{"),

                            take_while_m_n(1, 6, |c: char| c.is_ascii_hexdigit()),

                            char('}'),

)),

                        |(_, s, _)| Self::UnicodeEscape(s),

),

)),

)),

            |(_, ch)| ch,

        )(i)

enum PathOrIdentifier<'a> {

    Path(Vec<&'a str>),

    Identifier(&'a str),

fn path_or_identifier(i: &str) -> ParseResult<'_, PathOrIdentifier<'_>> {

    let root = ws(opt(tag("::")));

    let tail = opt(many1(preceded(ws(tag("::")), identifier)));

    let (i, (root, start, rest)) = tuple((root, identifier, tail))(i)?;

    let rest = rest.as_deref().unwrap_or_default();

    // The returned identifier can be assumed to be path if:

    // - it is an absolute path (starts with `::`), or

    // - it has multiple components (at least one `::`), or

    // - the first letter is uppercase

    match (root, start, rest) {

        (Some(_), start, tail) => {

            let mut path = Vec::with_capacity(2 + tail.len());

            path.push("");

            path.push(start);

            path.extend(rest);

            Ok((i, PathOrIdentifier::Path(path)))

        (None, name, []) if name.chars().next().map_or(true, char::is_lowercase) => {

            Ok((i, PathOrIdentifier::Identifier(name)))

        (None, start, tail) => {

            let mut path = Vec::with_capacity(1 + tail.len());

            path.push(start);

            path.extend(rest);

            Ok((i, PathOrIdentifier::Path(path)))

struct State<'a> {

    syntax: &'a Syntax<'a>,

    loop_depth: Cell<usize>,

    level: Cell<Level>,

impl<'a> State<'a> {

    fn new(syntax: &'a Syntax<'a>) -> State<'a> {

        State {

            syntax,

            loop_depth: Cell::new(0),

            level: Cell::new(Level::default()),

    fn nest<'b, T, F: FnOnce(&'b str) -> ParseResult<'b, T>>(

        &self,

        i: &'b str,

        callback: F,

    ) -> ParseResult<'b, T> {

        let prev_level = self.level.get();

        let (_, level) = prev_level.nest(i)?;

        self.level.set(level);

        let ret = callback(i);

        self.level.set(prev_level);

ret

    fn tag_block_start<'i>(&self, i: &'i str) -> ParseResult<'i> {

        tag(self.syntax.block_start)(i)

    fn tag_block_end<'i>(&self, i: &'i str) -> ParseResult<'i> {

        tag(self.syntax.block_end)(i)

    fn tag_comment_start<'i>(&self, i: &'i str) -> ParseResult<'i> {

        tag(self.syntax.comment_start)(i)

    fn tag_comment_end<'i>(&self, i: &'i str) -> ParseResult<'i> {

        tag(self.syntax.comment_end)(i)

    fn tag_expr_start<'i>(&self, i: &'i str) -> ParseResult<'i> {

        tag(self.syntax.expr_start)(i)

    fn tag_expr_end<'i>(&self, i: &'i str) -> ParseResult<'i> {

        tag(self.syntax.expr_end)(i)

    fn enter_loop(&self) {

        self.loop_depth.set(self.loop_depth.get() + 1);

    fn leave_loop(&self) {

        self.loop_depth.set(self.loop_depth.get() - 1);

    fn is_in_loop(&self) -> bool {

        self.loop_depth.get() > 0

#[derive(Default, Hash, PartialEq, Clone, Copy)]

pub struct Syntax<'a>(InnerSyntax<'a>);

// This abstraction ensures that the fields are readable, but not writable.

#[derive(Hash, PartialEq, Clone, Copy)]

pub struct InnerSyntax<'a> {

    pub block_start: &'a str,

    pub block_end: &'a str,

    pub expr_start: &'a str,

    pub expr_end: &'a str,

    pub comment_start: &'a str,

    pub comment_end: &'a str,

impl<'a> Deref for Syntax<'a> {

    type Target = InnerSyntax<'a>;

    #[inline]

    fn deref(&self) -> &Self::Target {

        &self.0

impl Default for InnerSyntax<'static> {

    fn default() -> Self {

        Self {

            block_start: "{%",

            block_end: "%}",

            expr_start: "{{",

            expr_end: "}}",

            comment_start: "{#",

            comment_end: "#}",

impl<'a> fmt::Debug for Syntax<'a> {

    #[inline]

    fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {

        fmt_syntax("Syntax", self, f)

impl<'a> fmt::Debug for InnerSyntax<'a> {

    #[inline]

    fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {

        fmt_syntax("InnerSyntax", self, f)

fn fmt_syntax(name: &str, inner: &InnerSyntax<'_>, f: &mut fmt::Formatter<'_>) -> fmt::Result {

    f.debug_struct(name)

        .field("block_start", &inner.block_start)

        .field("block_end", &inner.block_end)

        .field("expr_start", &inner.expr_start)

        .field("expr_end", &inner.expr_end)

        .field("comment_start", &inner.comment_start)

        .field("comment_end", &inner.comment_end)

        .finish()

#[derive(Debug, Default, Clone, Copy, Hash, PartialEq)]

#[cfg_attr(feature = "config", derive(serde::Deserialize))]

pub struct SyntaxBuilder<'a> {

    pub name: &'a str,

    pub block_start: Option<&'a str>,

    pub block_end: Option<&'a str>,

    pub expr_start: Option<&'a str>,

    pub expr_end: Option<&'a str>,

    pub comment_start: Option<&'a str>,

    pub comment_end: Option<&'a str>,

impl<'a> SyntaxBuilder<'a> {

    pub fn to_syntax(&self) -> Result<Syntax<'a>, String> {

        let default = InnerSyntax::default();

        let syntax = Syntax(InnerSyntax {

            block_start: self.block_start.unwrap_or(default.block_start),

            block_end: self.block_end.unwrap_or(default.block_end),

            expr_start: self.expr_start.unwrap_or(default.expr_start),

            expr_end: self.expr_end.unwrap_or(default.expr_end),

            comment_start: self.comment_start.unwrap_or(default.comment_start),

            comment_end: self.comment_end.unwrap_or(default.comment_end),

});

        for (s, k, is_closing) in [

            (syntax.block_start, "opening block", false),

            (syntax.block_end, "closing block", true),

            (syntax.expr_start, "opening expression", false),

            (syntax.expr_end, "closing expression", true),

            (syntax.comment_start, "opening comment", false),

            (syntax.comment_end, "closing comment", true),

] {

            if s.len() < 2 {

                return Err(format!(

                    "delimiters must be at least two characters long. \

                        The {k} delimiter ({s:?}) is too short",

));

            } else if s.chars().any(char::is_whitespace) {

                return Err(format!(

                    "delimiters may not contain white spaces. \

                        The {k} delimiter ({s:?}) contains white spaces",

));

            } else if is_closing

                && ['(', '-', '+', '~', '.', '>', '<', '&', '|', '!']

                    .contains(&s.chars().next().unwrap())

                return Err(format!(

                    "closing delimiters may not start with operators. \

                        The {k} delimiter ({s:?}) starts with operator `{}`",

                    s.chars().next().unwrap(),

));

        for ((s1, k1), (s2, k2)) in [

                (syntax.block_start, "block"),

                (syntax.expr_start, "expression"),

),

                (syntax.block_start, "block"),

                (syntax.comment_start, "comment"),

),

                (syntax.expr_start, "expression"),

                (syntax.comment_start, "comment"),

),

] {

            if s1.starts_with(s2) || s2.starts_with(s1) {

                let (s1, k1, s2, k2) = match s1.len() < s2.len() {

                    true => (s1, k1, s2, k2),

                    false => (s2, k2, s1, k1),

};

                return Err(format!(

                    "an opening delimiter may not be the prefix of another delimiter. \

                        The {k1} delimiter ({s1:?}) clashes with the {k2} delimiter ({s2:?})",

));

        Ok(syntax)

#[derive(Clone, Copy, Default)]

pub(crate) struct Level(u8);

impl Level {

    fn nest(self, i: &str) -> ParseResult<'_, Level> {

        if self.0 >= Self::MAX_DEPTH {

            return Err(nom::Err::Failure(ErrorContext::new(

                "your template code is too deeply nested, or last expression is too complex",

i,

            )));

        Ok((i, Level(self.0 + 1)))

    const MAX_DEPTH: u8 = 128;

fn filter<'a>(

    i: &'a str,

    level: &mut Level,

) -> ParseResult<'a, (&'a str, Option<Vec<WithSpan<'a, Expr<'a>>>>)> {

    let (j, _) = take_till(not_ws)(i)?;

    let had_spaces = i.len() != j.len();

    let (j, _) = pair(char('|'), not(char('|')))(j)?;

    if !had_spaces {

        *level = level.nest(i)?.1;

        cut(pair(

            ws(identifier),

            opt(|i| Expr::arguments(i, *level, false)),

        ))(j)

    } else {

        Err(nom::Err::Failure(ErrorContext::new(

            "the filter operator `|` must not be preceded by any whitespace characters\n\

            the binary OR operator is called `bitor` in rinja",

i,

)))

/// Returns the common parts of two paths.

///

/// The goal of this function is to reduce the path length based on the `base` argument

/// (generally the path where the program is running into). For example:

///

/// ```text

/// current dir: /a/b/c

/// path:        /a/b/c/d/e.txt

/// ```

///

/// `strip_common` will return `d/e.txt`.

#[must_use]

pub fn strip_common(base: &Path, path: &Path) -> String {

    let path = match path.canonicalize() {

        Ok(path) => path,

        Err(_) => return path.display().to_string(),

};

    let mut components_iter = path.components().peekable();

    for current_path_component in base.components() {

        let Some(path_component) = components_iter.peek() else {

            return path.display().to_string();

};

        if current_path_component != *path_component {

            break;

        components_iter.next();

    let path_parts = components_iter

        .map(|c| c.as_os_str().to_string_lossy())

        .collect::<Vec<_>>();

    if path_parts.is_empty() {

        path.display().to_string()

    } else {

        path_parts.join(std::path::MAIN_SEPARATOR_STR)

#[derive(Debug, Clone, Copy, PartialEq, Eq)]

pub enum IntKind {

I8,

    I16,

    I32,

    I64,

    I128,

    Isize,

U8,

    U16,

    U32,

    U64,

    U128,

    Usize,

#[derive(Debug, Clone, Copy, PartialEq, Eq)]

pub enum FloatKind {

    F16,

    F32,

    F64,

    F128,

#[derive(Debug, Clone, Copy, PartialEq, Eq)]

enum NumKind {

    Int(IntKind),

    Float(FloatKind),

/// Primitive integer types. Also used as number suffixes.

const INTEGER_TYPES: &[(&str, IntKind)] = &[

    ("i8", IntKind::I8),

    ("i16", IntKind::I16),

    ("i32", IntKind::I32),

    ("i64", IntKind::I64),

    ("i128", IntKind::I128),

    ("isize", IntKind::Isize),

    ("u8", IntKind::U8),

    ("u16", IntKind::U16),

    ("u32", IntKind::U32),

    ("u64", IntKind::U64),

    ("u128", IntKind::U128),

    ("usize", IntKind::Usize),

];

/// Primitive floating point types. Also used as number suffixes.

const FLOAT_TYPES: &[(&str, FloatKind)] = &[

    ("f16", FloatKind::F16),

    ("f32", FloatKind::F32),

    ("f64", FloatKind::F64),

    ("f128", FloatKind::F128),

];

/// Primitive numeric types. Also used as number suffixes.

const NUM_TYPES: &[(&str, NumKind)] = &{

    let mut list = [("", NumKind::Int(IntKind::I8)); INTEGER_TYPES.len() + FLOAT_TYPES.len()];

    let mut i = 0;

    let mut o = 0;

    while i < INTEGER_TYPES.len() {

        let (name, value) = INTEGER_TYPES[i];

        list[o] = (name, NumKind::Int(value));

        i += 1;

        o += 1;

    let mut i = 0;

    while i < FLOAT_TYPES.len() {

        let (name, value) = FLOAT_TYPES[i];

        list[o] = (name, NumKind::Float(value));

        i += 1;

        o += 1;

    list

};

/// Complete list of named primitive types.

const PRIMITIVE_TYPES: &[&str] = &{

    let mut list = [""; NUM_TYPES.len() + 1];

    let mut i = 0;

    let mut o = 0;

    while i < NUM_TYPES.len() {

        list[o] = NUM_TYPES[i].0;

        i += 1;

        o += 1;

    list[o] = "bool";

    list

};

#[cfg(not(windows))]

#[cfg(test)]

mod test {

    use std::path::Path;

    use super::*;

    #[test]

    fn test_strip_common() {

        // Full path is returned instead of empty when the entire path is in common.

        assert_eq!(strip_common(Path::new("home"), Path::new("home")), "home");

        let cwd = std::env::current_dir().expect("current_dir failed");

        // We need actual existing paths for `canonicalize` to work, so let's do that.

        let entry = cwd

            .read_dir()

            .expect("read_dir failed")

            .filter_map(std::result::Result::ok)

            .find(|f| f.path().is_file())

            .expect("no entry");

        // Since they have the complete path in common except for the folder entry name, it should

        // return only the folder entry name.

        assert_eq!(

            strip_common(&cwd, &entry.path()),

            entry.file_name().to_string_lossy()

);

        // In this case it cannot canonicalize `/a/b/c` so it returns the path as is.

        assert_eq!(strip_common(&cwd, Path::new("/a/b/c")), "/a/b/c");

    #[test]

    fn test_num_lit() {

        // Should fail.

        assert!(num_lit(".").is_err());

        // Should succeed.

        assert_eq!(

            num_lit("1.2E-02").unwrap(),

            ("", Num::Float("1.2E-02", None))

);

        assert_eq!(num_lit("4e3").unwrap(), ("", Num::Float("4e3", None)),);

        assert_eq!(num_lit("4e+_3").unwrap(), ("", Num::Float("4e+_3", None)),);

        // Not supported because Rust wants a number before the `.`.

        assert!(num_lit(".1").is_err());

        assert!(num_lit(".1E-02").is_err());

        // A `_` directly after the `.` denotes a field.

        assert_eq!(num_lit("1._0").unwrap(), ("._0", Num::Int("1", None)));

        assert_eq!(num_lit("1_.0").unwrap(), ("", Num::Float("1_.0", None)));

        // Not supported (voluntarily because of `1..` syntax).

        assert_eq!(num_lit("1.").unwrap(), (".", Num::Int("1", None)));

        assert_eq!(num_lit("1_.").unwrap(), (".", Num::Int("1_", None)));

        assert_eq!(num_lit("1_2.").unwrap(), (".", Num::Int("1_2", None)));

        // Numbers with suffixes

        assert_eq!(

            num_lit("-1usize").unwrap(),

            ("", Num::Int("-1", Some(IntKind::Usize)))

);

        assert_eq!(

            num_lit("123_f32").unwrap(),

            ("", Num::Float("123_", Some(FloatKind::F32)))

);

        assert_eq!(

            num_lit("1_.2_e+_3_f64|into_isize").unwrap(),

                "|into_isize",

                Num::Float("1_.2_e+_3_", Some(FloatKind::F64))

);

        assert_eq!(

            num_lit("4e3f128").unwrap(),

            ("", Num::Float("4e3", Some(FloatKind::F128))),

);

    #[test]

    fn test_char_lit() {

        let lit = |s: &'static str| crate::CharLit {

            prefix: None,

            content: s,

};

        assert_eq!(char_lit("'a'").unwrap(), ("", lit("a")));

        assert_eq!(char_lit("'字'").unwrap(), ("", lit("字")));

        // Escaped single characters.

        assert_eq!(char_lit("'\\\"'").unwrap(), ("", lit("\\\"")));

        assert_eq!(char_lit("'\\''").unwrap(), ("", lit("\\'")));

        assert_eq!(char_lit("'\\t'").unwrap(), ("", lit("\\t")));

        assert_eq!(char_lit("'\\n'").unwrap(), ("", lit("\\n")));

        assert_eq!(char_lit("'\\r'").unwrap(), ("", lit("\\r")));

        assert_eq!(char_lit("'\\0'").unwrap(), ("", lit("\\0")));

        // Escaped ascii characters (up to `0x7F`).

        assert_eq!(char_lit("'\\x12'").unwrap(), ("", lit("\\x12")));

        assert_eq!(char_lit("'\\x02'").unwrap(), ("", lit("\\x02")));

        assert_eq!(char_lit("'\\x6a'").unwrap(), ("", lit("\\x6a")));

        assert_eq!(char_lit("'\\x7F'").unwrap(), ("", lit("\\x7F")));

        // Escaped unicode characters (up to `0x10FFFF`).

        assert_eq!(char_lit("'\\u{A}'").unwrap(), ("", lit("\\u{A}")));

        assert_eq!(char_lit("'\\u{10}'").unwrap(), ("", lit("\\u{10}")));

        assert_eq!(char_lit("'\\u{aa}'").unwrap(), ("", lit("\\u{aa}")));

        assert_eq!(char_lit("'\\u{10FFFF}'").unwrap(), ("", lit("\\u{10FFFF}")));

        // Check with `b` prefix.

        assert_eq!(

            char_lit("b'a'").unwrap(),

            ("", crate::CharLit {

                prefix: Some(crate::CharPrefix::Binary),

                content: "a"

})

);

        // Should fail.

        assert!(char_lit("''").is_err());

        assert!(char_lit("'\\o'").is_err());

        assert!(char_lit("'\\x'").is_err());

        assert!(char_lit("'\\x1'").is_err());

        assert!(char_lit("'\\x80'").is_err());

        assert!(char_lit("'\\u'").is_err());

        assert!(char_lit("'\\u{}'").is_err());

        assert!(char_lit("'\\u{110000}'").is_err());

    #[test]

    fn test_str_lit() {

        assert_eq!(

            str_lit(r#"b"hello""#).unwrap(),

            ("", StrLit {

                prefix: Some(StrPrefix::Binary),

                content: "hello"

})

);

        assert_eq!(

            str_lit(r#"c"hello""#).unwrap(),

            ("", StrLit {

                prefix: Some(StrPrefix::CLike),

                content: "hello"

})

);

        assert!(str_lit(r#"d"hello""#).is_err());