typst/src/syntax/parsing.rs

//! Parsing of source code into syntax models.

use std::iter::FromIterator;

use crate::{Pass, Feedback};
use super::func::{FuncHeader, FuncArgs, FuncArg};
use super::expr::*;
use super::scope::Scope;
use super::span::{Position, Span, Spanned};
use super::tokens::{Token, Tokens, TokenizationMode};
use super::*;


/// The context for parsing.
#[derive(Debug, Copy, Clone)]
pub struct ParseContext<'a> {
    /// The scope containing function definitions.
    pub scope: &'a Scope,
}

/// Parse source code into a syntax model.
///
/// All errors and decorations are offset by the `start` position.
pub fn parse(start: Position, src: &str, ctx: ParseContext) -> Pass<SyntaxModel> {
    let mut model = SyntaxModel::new();
    let mut feedback = Feedback::new();

    // We always start in body mode. The header tokenization mode is only used
    // in the `FuncParser`.
    let mut tokens = Tokens::new(start, src, TokenizationMode::Body);

    while let Some(token) = tokens.next() {
        let span = token.span;

        let node = match token.v {
            Token::LineComment(_) | Token::BlockComment(_) => continue,

            // Only at least two newlines mean a _real_ newline indicating a
            // paragraph break.
            Token::Space(newlines) => if newlines >= 2 {
                Node::Parbreak
            } else {
                Node::Space
            },

            Token::Function { header, body, terminated } => {
                let parsed = FuncParser::new(header, body, ctx).parse();
                feedback.extend_offset(span.start, parsed.feedback);

                if !terminated {
                    feedback.errors.push(err!(Span::at(span.end);
                        "expected closing bracket"));
                }

                parsed.output
            }

            Token::Star       => Node::ToggleBolder,
            Token::Underscore => Node::ToggleItalic,
            Token::Backslash  => Node::Linebreak,

            Token::Raw { raw, terminated } => {
                if !terminated {
                    feedback.errors.push(err!(Span::at(span.end);
                        "expected backtick"));
                }

                Node::Raw(unescape_raw(raw))
            }

            Token::Text(text) => Node::Text(text.to_string()),

            other => {
                feedback.errors.push(err!(span; "unexpected {}", other.name()));
                continue;
            }
        };

        model.add(Spanned { v: node, span: token.span });
    }

    Pass::new(model, feedback)
}

/// Performs the function parsing.
struct FuncParser<'s> {
    ctx: ParseContext<'s>,
    feedback: Feedback,

    /// ```typst
    /// [tokens][body]
    ///  ^^^^^^
    /// ```
    tokens: Tokens<'s>,
    peeked: Option<Option<Spanned<Token<'s>>>>,

    /// The spanned body string if there is a body.
    /// ```typst
    /// [tokens][body]
    ///          ^^^^
    /// ```
    body: Option<Spanned<&'s str>>,
}

impl<'s> FuncParser<'s> {
    /// Create a new function parser.
    fn new(
        header: &'s str,
        body: Option<Spanned<&'s str>>,
        ctx: ParseContext<'s>
    ) -> FuncParser<'s> {
        FuncParser {
            ctx,
            feedback: Feedback::new(),
            tokens: Tokens::new(Position::new(0, 1), header, TokenizationMode::Header),
            peeked: None,
            body,
        }
    }

    /// Do the parsing.
    fn parse(mut self) -> Pass<Node> {
        let parsed = if let Some(header) = self.parse_func_header() {
            let name = header.name.v.as_str();
            let (parser, deco) = match self.ctx.scope.get_parser(name) {
                // A valid function.
                Ok(parser) => (parser, Decoration::ValidFuncName),

                // The fallback parser was returned. Invalid function.
                Err(parser) => {
                    self.feedback.errors.push(err!(header.name.span; "unknown function"));
                    (parser, Decoration::InvalidFuncName)
                }
            };

            self.feedback.decos.push(Spanned::new(deco, header.name.span));

            parser(header, self.body, self.ctx)
        } else {
            let default = FuncHeader {
                name: Spanned::new(Ident("".to_string()), Span::ZERO),
                args: FuncArgs::new(),
            };

            // Use the fallback function such that the body is still rendered
            // even if the header is completely unparsable.
            self.ctx.scope.get_fallback_parser()(default, self.body, self.ctx)
        };

        self.feedback.extend(parsed.feedback);

        Pass::new(Node::Model(parsed.output), self.feedback)
    }

    /// Parse the header tokens.
    fn parse_func_header(&mut self) -> Option<FuncHeader> {
        let start = self.pos();
        self.skip_whitespace();

        let name = match self.parse_ident() {
            Some(ident) => ident,
            None => {
                let other = self.eat();
                self.expected_found_or_at("identifier", other, start);
                return None;
            }
        };

        self.skip_whitespace();
        let args = match self.eat().map(Spanned::value) {
            Some(Token::Colon) => self.parse_func_args(),
            Some(_) => {
                self.expected_at("colon", name.span.end);
                FuncArgs::new()
            }
            None => FuncArgs::new(),
        };

        Some(FuncHeader { name, args })
    }

    /// Parse the argument list between colons and end of the header.
    fn parse_func_args(&mut self) -> FuncArgs {
        // Parse a collection until the token is `None`, that is, the end of the
        // header.
        self.parse_collection(None, |p| {
            // If we have an identifier we might have a keyword argument,
            // otherwise its for sure a postional argument.
            if let Some(ident) = p.parse_ident() {
                // This could still be a named tuple
                if let Some(Token::LeftParen) = p.peekv() {
                    return Ok(FuncArg::Pos(
                        p.parse_named_tuple(ident)
                            .map(|t| Expr::NamedTuple(t))
                    ));
                }

                p.skip_whitespace();

                if let Some(Token::Equals) = p.peekv() {
                    p.eat();
                    p.skip_whitespace();

                    // Semantic highlighting for argument keys.
                    p.feedback.decos.push(
                        Spanned::new(Decoration::ArgumentKey, ident.span));

                    let value = p.parse_expr().ok_or(("value", None))?;

                    // Add a keyword argument.
                    Ok(FuncArg::Key(Pair { key: ident, value }))
                } else {
                    // Add a positional argument because there was no equals
                    // sign after the identifier that could have been a key.
                    Ok(FuncArg::Pos(ident.map(|id| Expr::Ident(id))))
                }
            } else {
                // Add a positional argument because we haven't got an
                // identifier that could be an argument key.
                p.parse_expr().map(|expr| FuncArg::Pos(expr))
                    .ok_or(("argument", None))
            }
        }).v
    }

    /// Parse an atomic or compound (tuple / object) expression.
    fn parse_expr(&mut self) -> Option<Spanned<Expr>> {
        let first = self.peek()?;
        macro_rules! take {
            ($v:expr) => ({ self.eat(); Spanned { v: $v, span: first.span } });
        }

        Some(match first.v {
            Token::ExprIdent(i) => {
                let name = take!(Ident(i.to_string()));

                // This could be a named tuple or an identifier
                if let Some(Token::LeftParen) = self.peekv() {
                    self.parse_named_tuple(name).map(|t| Expr::NamedTuple(t))
                } else {
                    name.map(|i| Expr::Ident(i))
                }
            },
            Token::ExprStr { string, terminated } => {
                if !terminated {
                    self.expected_at("quote", first.span.end);
                }

                take!(Expr::Str(unescape_string(string)))
            }

            Token::ExprNumber(n) => take!(Expr::Number(n)),
            Token::ExprSize(s) => take!(Expr::Size(s)),
            Token::ExprBool(b) => take!(Expr::Bool(b)),
            Token::ExprHex(s) => {
                if let Some(color) = RgbaColor::from_str(s) {
                    take!(Expr::Color(color))
                } else {
                    // Heal color by assuming black
                    self.feedback.errors.push(err!(first.span;
                        "invalid color"));
                    take!(Expr::Color(RgbaColor::new_healed(0, 0, 0, 255)))
                }
            },

            Token::LeftParen => self.parse_tuple().map(|t| Expr::Tuple(t)),
            Token::LeftBrace => self.parse_object().map(|o| Expr::Object(o)),

            _ => return None,
        })
    }

    /// Parse a tuple expression: `(<expr>, ...)`.
    fn parse_tuple(&mut self) -> Spanned<Tuple> {
        let token = self.eat();
        debug_assert_eq!(token.map(Spanned::value), Some(Token::LeftParen));

        // Parse a collection until a right paren appears and complain about
        // missing a `value` when an invalid token is encoutered.
        self.parse_collection(Some(Token::RightParen),
            |p| p.parse_expr().ok_or(("value", None)))
    }

    /// Parse a tuple expression: `name(<expr>, ...)` with a given identifier.
    fn parse_named_tuple(&mut self, name: Spanned<Ident>) -> Spanned<NamedTuple> {
        let tuple = self.parse_tuple();
        let start = name.span.start;
        let end = tuple.span.end;
        Spanned::new(NamedTuple::new(name, tuple), Span::new(start, end))
    }

    /// Parse an object expression: `{ <key>: <value>, ... }`.
    fn parse_object(&mut self) -> Spanned<Object> {
        let token = self.eat();
        debug_assert_eq!(token.map(Spanned::value), Some(Token::LeftBrace));

        // Parse a collection until a right brace appears.
        self.parse_collection(Some(Token::RightBrace), |p| {
            // Expect an identifier as the key.
            let key = p.parse_ident().ok_or(("key", None))?;

            // Expect a colon behind the key (only separated by whitespace).
            let behind_key = p.pos();
            p.skip_whitespace();
            if p.peekv() != Some(Token::Colon) {
                return Err(("colon", Some(behind_key)));
            }

            p.eat();
            p.skip_whitespace();

            // Semantic highlighting for object keys.
            p.feedback.decos.push(
                Spanned::new(Decoration::ObjectKey, key.span));

            let value = p.parse_expr().ok_or(("value", None))?;

            Ok(Pair { key, value })
        })
    }

    /// Parse a comma-separated collection where each item is parsed through
    /// `parse_item` until the `end` token is met.
    fn parse_collection<C, I, F>(
        &mut self,
        end: Option<Token>,
        mut parse_item: F
    ) -> Spanned<C>
    where
        C: FromIterator<I>,
        F: FnMut(&mut Self) -> Result<I, (&'static str, Option<Position>)>,
    {
        let start = self.pos();

        // Parse the comma separated items.
        let collection = std::iter::from_fn(|| {
            self.skip_whitespace();
            let peeked = self.peekv();

            // We finished as expected.
            if peeked == end {
                self.eat();
                return None;
            }

            // We finished without the expected end token (which has to be a
            // `Some` value at this point since otherwise we would have already
            // returned in the previous case).
            if peeked == None {
                self.eat();
                self.expected_at(end.unwrap().name(), self.pos());
                return None;
            }

            // Try to parse a collection item.
            match parse_item(self) {
                Ok(item) => {
                    // Expect a comma behind the item (only separated by
                    // whitespace).
                    let behind_item = self.pos();
                    self.skip_whitespace();
                    match self.peekv() {
                        Some(Token::Comma) => { self.eat(); }
                        t @ Some(_) if t != end => self.expected_at("comma", behind_item),
                        _ => {}
                    }

                    return Some(Some(item));
                }

                // The item parser expected something different at either some
                // given position or instead of the currently peekable token.
                Err((expected, Some(pos))) => self.expected_at(expected, pos),
                Err((expected, None)) => {
                    let token = self.peek();
                    if token.map(Spanned::value) != end {
                        self.eat();
                    }
                    self.expected_found_or_at(expected, token, self.pos());
                }
            }

            Some(None)
        }).filter_map(|x| x).collect();

        let end = self.pos();
        Spanned::new(collection, Span { start, end })
    }

    /// Try to parse an identifier and do nothing if the peekable token is no
    /// identifier.
    fn parse_ident(&mut self) -> Option<Spanned<Ident>> {
        match self.peek() {
            Some(Spanned { v: Token::ExprIdent(s), span }) => {
                self.eat();
                Some(Spanned { v: Ident(s.to_string()), span })
            }
            _ => None
        }
    }

    /// Skip all whitespace/comment tokens.
    fn skip_whitespace(&mut self) {
        self.eat_until(|t| match t {
            Token::Space(_) | Token::LineComment(_) |
            Token::BlockComment(_) => false,
            _ => true,
        }, false)
    }

    /// Add an error about an expected `thing` which was not found, showing
    /// what was found instead.
    fn expected_found(&mut self, thing: &str, found: Spanned<Token>) {
        self.feedback.errors.push(err!(found.span;
            "expected {}, found {}", thing, found.v.name()));
    }

    /// Add an error about an `thing` which was expected but not found at the
    /// given position.
    fn expected_at(&mut self, thing: &str, pos: Position) {
        self.feedback.errors.push(err!(Span::at(pos); "expected {}", thing));
    }

    /// Add a expected-found-error if `found` is `Some` and an expected-error
    /// otherwise.
    fn expected_found_or_at(
        &mut self,
        thing: &str,
        found: Option<Spanned<Token>>,
        pos: Position
    ) {
        match found {
            Some(found) => self.expected_found(thing, found),
            None => self.expected_at(thing, pos),
        }
    }

    /// Consume tokens until the function returns true and only consume the last
    /// token if instructed to so by `eat_match`.
    fn eat_until<F>(&mut self, mut f: F, eat_match: bool)
    where F: FnMut(Token<'s>) -> bool {
        while let Some(token) = self.peek() {
            if f(token.v) {
                if eat_match {
                    self.eat();
                }
                break;
            }

            self.eat();
        }
    }

    /// Consume and return the next token.
    fn eat(&mut self) -> Option<Spanned<Token<'s>>> {
        self.peeked.take()
            .unwrap_or_else(|| self.tokens.next())
    }

    /// Peek at the next token without consuming it.
    fn peek(&mut self) -> Option<Spanned<Token<'s>>> {
        let iter = &mut self.tokens;
        *self.peeked.get_or_insert_with(|| iter.next())
    }

    /// Peek at the unspanned value of the next token.
    fn peekv(&mut self) -> Option<Token<'s>> {
        self.peek().map(Spanned::value)
    }

    /// The position at the end of the last eaten token / start of the peekable
    /// token.
    fn pos(&self) -> Position {
        self.peeked.flatten()
            .map(|s| s.span.start)
            .unwrap_or_else(|| self.tokens.pos())
    }
}

/// Unescape a string: `the string is \"this\"` => `the string is "this"`.
fn unescape_string(string: &str) -> String {
    let mut s = String::with_capacity(string.len());
    let mut iter = string.chars();

    while let Some(c) = iter.next() {
        if c == '\\' {
            match iter.next() {
                Some('\\') => s.push('\\'),
                Some('"') => s.push('"'),
                Some('n') => s.push('\n'),
                Some('t') => s.push('\t'),
                Some(c) => { s.push('\\'); s.push(c); }
                None => s.push('\\'),
            }
        } else {
            s.push(c);
        }
    }

    s
}

/// Unescape raw markup into lines.
fn unescape_raw(raw: &str) -> Vec<String> {
    let mut lines = Vec::new();
    let mut s = String::new();
    let mut iter = raw.chars().peekable();

    while let Some(c) = iter.next() {
        if c == '\\' {
            match iter.next() {
                Some('`') => s.push('`'),
                Some(c) => { s.push('\\'); s.push(c); }
                None => s.push('\\'),
            }
        } else if is_newline_char(c) {
            if c == '\r' && iter.peek() == Some(&'\n') {
                iter.next();
            }

            lines.push(std::mem::replace(&mut s, String::new()));
        } else {
            s.push(c);
        }
    }

    lines.push(s);
    lines
}


#[cfg(test)]
#[allow(non_snake_case)]
mod tests {
    use crate::size::Size;
    use crate::syntax::test::{DebugFn, check, zspan};
    use crate::syntax::func::Value;
    use super::*;

    use Decoration::*;
    use Node::{
        Space as S, ToggleItalic as Italic, ToggleBolder as Bold,
        Parbreak, Linebreak,
    };

    use Expr::{Number as Num, Size as Sz, Bool};
    fn Id(text: &str) -> Expr { Expr::Ident(Ident(text.to_string())) }
    fn Str(text: &str) -> Expr { Expr::Str(text.to_string()) }
    fn Pt(points: f32) -> Expr { Expr::Size(Size::pt(points)) }

    fn ClrS(color: &str) -> Expr {
        Expr::Color(
            RgbaColor::from_str(color).expect("Test color invalid")
        )
    }
    fn ClrS_Healed() -> Expr {
        let mut c = RgbaColor::from_str("000f")
            .expect("Test color invalid");
        c.healed = true;
        Expr::Color(c)
    }
    fn Clr(r: u8, g: u8, b: u8, a: u8) -> Expr {
        Expr::Color(RgbaColor::new(r, g, b, a))
    }

    fn T(text: &str) -> Node { Node::Text(text.to_string()) }

    /// Create a raw text node.
    macro_rules! raw {
        ($($line:expr),* $(,)?) => {
            Node::Raw(vec![$($line.to_string()),*])
        };
    }

    /// Create a tuple expression.
    macro_rules! tuple {
        ($($items:expr),* $(,)?) => {
            Expr::Tuple(Tuple { items: spanned![vec $($items),*].0 })
        };
    }

    /// Create a named tuple expression.
    macro_rules! named_tuple {
        ($name:expr $(, $items:expr)* $(,)?) => {
            Expr::NamedTuple(NamedTuple::new(
                zspan(Ident($name.to_string())),
                zspan(Tuple { items: spanned![vec $($items),*].0 })
            ))
        };
    }

    /// Create an object expression.
    macro_rules! object {
        ($($key:expr => $value:expr),* $(,)?) => {
            Expr::Object(Object {
                pairs: vec![$(Pair {
                    key: zspan(Ident($key.to_string())),
                    value: zspan($value),
                }),*]
            })
        };
    }

    /// Test whether the given string parses into
    /// - the given node list (required).
    /// - the given error list (optional, if omitted checks against empty list).
    /// - the given decoration list (optional, if omitted it is not tested).
    macro_rules! p {
        ($source:expr => [$($model:tt)*]) => {
            p!($source => [$($model)*], []);
        };

        ($source:expr => [$($model:tt)*], [$($errors:tt)*] $(, [$($decos:tt)*])? $(,)?) => {
            let mut scope = Scope::new::<DebugFn>();
            scope.add::<DebugFn>("f");
            scope.add::<DebugFn>("n");
            scope.add::<DebugFn>("box");
            scope.add::<DebugFn>("val");

            let ctx = ParseContext { scope: &scope };
            let pass = parse(Position::ZERO, $source, ctx);

            // Test model
            let (exp, cmp) = spanned![vec $($model)*];
            check($source, exp, pass.output.nodes, cmp);

            // Test errors
            let (exp, cmp) = spanned![vec $($errors)*];
            let exp = exp.into_iter()
                .map(|s: Spanned<&str>| s.map(|e| e.to_string()))
                .collect::<Vec<_>>();
            let found = pass.feedback.errors.into_iter()
                .map(|s| s.map(|e| e.message))
                .collect::<Vec<_>>();
            check($source, exp, found, cmp);

            // Test decos
            $(let (exp, cmp) = spanned![vec $($decos)*];
            check($source, exp, pass.feedback.decos, cmp);)?
        };
    }

    /// Write down a `DebugFn` function model compactly.
    macro_rules! func {
        ($name:tt $(: ($($pos:tt)*), { $($key:tt)* } )? $(; $($body:tt)*)?) => ({
            #[allow(unused_mut)]
            let mut args = FuncArgs::new();
            $(args.pos = Tuple::parse(zspan(tuple!($($pos)*))).unwrap();)?
            $(args.key = Object::parse(zspan(object! { $($key)* })).unwrap();)?

            Node::Model(Box::new(DebugFn {
                header: FuncHeader {
                    name: spanned!(item $name).map(|s| Ident(s.to_string())),
                    args,
                },
                body: func!(@body $($($body)*)?),
            }))
        });

        (@body [$($body:tt)*]) => ({
            Some(SyntaxModel { nodes: spanned![vec $($body)*].0 })
        });
        (@body) => (None);
    }

    #[test]
    fn parse_color_strings() {
        assert_eq!(Clr(0xf6, 0x12, 0x43, 0xff), ClrS("f61243ff"));
        assert_eq!(Clr(0xb3, 0xd8, 0xb3, 0xff), ClrS("b3d8b3"));
        assert_eq!(Clr(0xfc, 0xd2, 0xa9, 0xad), ClrS("fCd2a9AD"));
        assert_eq!(Clr(0x22, 0x33, 0x33, 0xff), ClrS("233"));
        assert_eq!(Clr(0x11, 0x11, 0x11, 0xbb), ClrS("111b"));
    }

    #[test]
    fn unescape_strings() {
        fn test(string: &str, expected: &str) {
            assert_eq!(unescape_string(string), expected.to_string());
        }

        test(r#"hello world"#,  "hello world");
        test(r#"hello\nworld"#, "hello\nworld");
        test(r#"a\"bc"#,        "a\"bc");
        test(r#"a\\"#,          "a\\");
        test(r#"a\\\nbc"#,      "a\\\nbc");
        test(r#"a\tbc"#,        "a\tbc");
        test(r"🌎",             "🌎");
        test(r"🌎\",            r"🌎\");
        test(r"\🌎",            r"\🌎");
    }

    #[test]
    fn unescape_raws() {
        fn test(raw: &str, expected: Node) {
            let vec = if let Node::Raw(v) = expected { v } else { panic!() };
            assert_eq!(unescape_raw(raw), vec);
        }

        test("raw\\`",     raw!["raw`"]);
        test("raw\ntext",  raw!["raw", "text"]);
        test("a\r\nb",     raw!["a", "b"]);
        test("a\n\nb",     raw!["a", "", "b"]);
        test("a\r\x0Bb",   raw!["a", "", "b"]);
        test("a\r\n\r\nb", raw!["a", "", "b"]);
        test("raw\\a",     raw!["raw\\a"]);
        test("raw\\",      raw!["raw\\"]);
    }

    #[test]
    fn parse_basic_nodes() {
        // Basic nodes
        p!(""                     => []);
        p!("hi"                   => [T("hi")]);
        p!("*hi"                  => [Bold, T("hi")]);
        p!("hi_"                  => [T("hi"), Italic]);
        p!("hi you"               => [T("hi"), S, T("you")]);
        p!("hi// you\nw"          => [T("hi"), S, T("w")]);
        p!("\n\n\nhello"          => [Parbreak, T("hello")]);
        p!("first//\n//\nsecond"  => [T("first"), S, S, T("second")]);
        p!("first//\n \nsecond"   => [T("first"), Parbreak, T("second")]);
        p!("first/*\n \n*/second" => [T("first"), T("second")]);
        p!(r"a\ b"                => [T("a"), Linebreak, S, T("b")]);
        p!("💜\n\n 🌍"            => [T("💜"), Parbreak, T("🌍")]);

        // Raw markup
        p!("`py`"         => [raw!["py"]]);
        p!("[val][`hi]`]" => [func!("val"; [raw!["hi]"]])]);
        p!("`hi\nyou"     => [raw!["hi", "you"]], [(1:3, 1:3, "expected backtick")]);
        p!("`hi\\`du`"    => [raw!["hi`du"]]);

        // Spanned nodes
        p!("Hi"      => [(0:0, 0:2, T("Hi"))]);
        p!("*Hi*"    => [(0:0, 0:1, Bold), (0:1, 0:3, T("Hi")), (0:3, 0:4, Bold)]);
        p!("🌎\n*/[n]" =>
            [(0:0, 0:1, T("🌎")), (0:1, 1:0, S), (1:2, 1:5, func!((0:1, 0:2, "n")))],
            [(1:0, 1:2, "unexpected end of block comment")],
            [(1:3, 1:4, ValidFuncName)],
        );
    }

    #[test]
    fn parse_function_names() {
        // No closing bracket
        p!("[" => [func!("")], [
            (0:1, 0:1, "expected identifier"),
            (0:1, 0:1, "expected closing bracket")
        ]);

        // No name
        p!("[]" => [func!("")], [(0:1, 0:1, "expected identifier")]);
        p!("[\"]" => [func!("")], [
            (0:1, 0:3, "expected identifier, found string"),
            (0:3, 0:3, "expected closing bracket"),
        ]);

        // An unknown name
        p!("[hi]" =>
            [func!("hi")],
            [(0:1, 0:3, "unknown function")],
            [(0:1, 0:3, InvalidFuncName)],
        );

        // A valid name
        p!("[f]"   => [func!("f")], [], [(0:1, 0:2, ValidFuncName)]);
        p!("[  f]" => [func!("f")], [], [(0:3, 0:4, ValidFuncName)]);

        // An invalid token for a name
        p!("[12]"   => [func!("")], [(0:1, 0:3, "expected identifier, found number")], []);
        p!("[🌎]"   => [func!("")], [(0:1, 0:2, "expected identifier, found invalid token")], []);
        p!("[  🌎]" => [func!("")], [(0:3, 0:4, "expected identifier, found invalid token")], []);
    }

    #[test]
    fn parse_colon_starting_function_arguments() {
        // No colon before arg
        p!("[val\"s\"]" => [func!("val")], [(0:4, 0:4, "expected colon")]);

        // No colon before valid, but wrong token
        p!("[val=]" => [func!("val")], [(0:4, 0:4, "expected colon")]);

        // No colon before invalid tokens, which are ignored
        p!("[val/🌎:$]" =>
            [func!("val")],
            [(0:4, 0:4, "expected colon")],
            [(0:1, 0:4, ValidFuncName)],
        );

        // String in invalid header without colon still parsed as string
        // Note: No "expected quote" error because not even the string was
        //       expected.
        p!("[val/\"]" => [func!("val")], [
            (0:4, 0:4, "expected colon"),
            (0:7, 0:7, "expected closing bracket"),
        ]);

        // Just colon without args
        p!("[val:]"         => [func!("val")]);
        p!("[val:/*12pt*/]" => [func!("val")]);

        // Whitespace / comments around colon
        p!("[val\n:\ntrue]"      => [func!("val": (Bool(true)), {})]);
        p!("[val/*:*/://\ntrue]" => [func!("val": (Bool(true)), {})]);
    }

    #[test]
    fn parse_one_positional_argument() {
        // Different expressions
        p!("[val: true]"   =>
            [func!("val": (Bool(true)), {})], [],
            [(0:1, 0:4, ValidFuncName)],
        );
        p!("[val: _]"      => [func!("val": (Id("_")), {})]);
        p!("[val: name]"   => [func!("val": (Id("name")), {})]);
        p!("[val: \"hi\"]" => [func!("val": (Str("hi")), {})]);
        p!("[val: \"a\n[]\\\"string\"]" => [func!("val": (Str("a\n[]\"string")), {})]);
        p!("[val: 3.14]"   => [func!("val": (Num(3.14)), {})]);
        p!("[val: 4.5cm]"  => [func!("val": (Sz(Size::cm(4.5))), {})]);
        p!("[val: 12e1pt]" => [func!("val": (Pt(12e1)), {})]);
        p!("[val: #f7a20500]" => [func!("val": (ClrS("f7a20500")), {})]);

        // Unclosed string.
        p!("[val: \"hello]" => [func!("val": (Str("hello]")), {})], [
            (0:13, 0:13, "expected quote"),
            (0:13, 0:13, "expected closing bracket"),
        ]);

        //Invalid colors
        p!("[val: #12345]" => [func!("val": (ClrS_Healed()), {})], [
            (0:6, 0:12, "invalid color"),
        ]);
        p!("[val: #a5]" => [func!("val": (ClrS_Healed()), {})], [
            (0:6, 0:9, "invalid color"),
        ]);
        p!("[val: #14b2ah]" => [func!("val": (ClrS_Healed()), {})], [
            (0:6, 0:13, "invalid color"),
        ]);
        p!("[val: #f075ff011]" => [func!("val": (ClrS_Healed()), {})], [
            (0:6, 0:16, "invalid color"),
        ]);
    }

    #[test]
    fn parse_tuples() {
        // Empty tuple
        p!("[val: ()]" => [func!("val": (tuple!()), {})]);
        p!("[val: empty()]" => [func!("val": (named_tuple!("empty")), {})]);

        // Invalid value
        p!("[val: (🌎)]" =>
            [func!("val": (tuple!()), {})],
            [(0:7, 0:8, "expected value, found invalid token")],
        );
        p!("[val: sound(\x07)]" =>
            [func!("val": (named_tuple!("sound")), {})],
            [(0:12, 0:13, "expected value, found invalid token")],
        );

        // Invalid tuple name
        p!("[val: 👠(\"abc\", 13e-5)]" =>
            [func!("val": (tuple!(Str("abc"), Num(13.0e-5))), {})],
            [(0:6, 0:7, "expected argument, found invalid token")],
        );

        // Unclosed tuple
        p!("[val: (hello]" =>
            [func!("val": (tuple!(Id("hello"))), {})],
            [(0:12, 0:12, "expected closing paren")],
        );
        p!("[val: lang(中文]" =>
            [func!("val": (named_tuple!("lang", Id("中文"))), {})],
            [(0:13, 0:13, "expected closing paren")],
        );

        // Valid values
        p!("[val: (1, 2)]" => [func!("val": (tuple!(Num(1.0), Num(2.0))), {})]);
        p!("[val: (\"s\",)]" => [func!("val": (tuple!(Str("s"))), {})]);
        p!("[val: cmyk(1, 46, 0, 0)]" =>
            [func!("val": (named_tuple!(
                "cmyk", Num(1.0), Num(46.0), Num(0.0), Num(0.0)
            )), {})]
        );
        p!("[val: items(\"fire\", #f93a6d)]" =>
            [func!("val": (named_tuple!(
                "items", Str("fire"), ClrS("f93a6d")
            )), {})]
        );

        // Nested tuples
        p!("[val: (1, (2))]" =>
            [func!("val": (tuple!(Num(1.0), tuple!(Num(2.0)))), {})]
        );
        p!("[val: css(1pt, rgb(90, 102, 254), \"solid\")]" =>
            [func!("val": (named_tuple!(
                "css", Pt(1.0), named_tuple!(
                    "rgb", Num(90.0), Num(102.0), Num(254.0)
                ), Str("solid")
            )), {})]
        );

        // Invalid commas
        p!("[val: (,)]" =>
            [func!("val": (tuple!()), {})],
            [(0:7, 0:8, "expected value, found comma")],
        );
        p!("[val: nose(,)]" =>
            [func!("val": (named_tuple!("nose")), {})],
            [(0:11, 0:12, "expected value, found comma")],
        );
        p!("[val: (true false)]" =>
            [func!("val": (tuple!(Bool(true), Bool(false))), {})],
            [(0:11, 0:11, "expected comma")],
        );
    }

    #[test]
    fn parse_objects() {
        let f = || func!("val": (object! {}), {});

        // Okay objects
        p!("[val: {}]" => [f()]);
        p!("[val: { key: value }]" =>
            [func!("val": (object! { "key" => Id("value") }), {})]);

        // Unclosed object
        p!("[val: {hello: world]" =>
            [func!("val": (object! { "hello" => Id("world") }), {})],
            [(0:19, 0:19, "expected closing brace")],
        );
        p!("[val: { a]" =>
            [func!("val": (object! {}), {})],
            [(0:9, 0:9, "expected colon"), (0:9, 0:9, "expected closing brace")],
        );

        // Missing key
        p!("[val: {,}]" => [f()], [(0:7, 0:8, "expected key, found comma")]);
        p!("[val: { 12pt }]" => [f()], [(0:8, 0:12, "expected key, found size")]);
        p!("[val: { : }]" => [f()], [(0:8, 0:9, "expected key, found colon")]);

        // Missing colon
        p!("[val: { key }]" => [f()], [(0:11, 0:11, "expected colon")]);
        p!("[val: { key false }]" => [f()], [
            (0:11, 0:11, "expected colon"),
            (0:12, 0:17, "expected key, found bool"),
        ]);
        p!("[val: { a b:c }]" =>
            [func!("val": (object! { "b" => Id("c") }), {})],
            [(0:9, 0:9, "expected colon")],
        );

        // Missing value
        p!("[val: { key: : }]" => [f()], [(0:13, 0:14, "expected value, found colon")]);
        p!("[val: { key: , k: \"s\" }]" =>
            [func!("val": (object! { "k" => Str("s") }), {})],
            [(0:13, 0:14, "expected value, found comma")],
        );

        // Missing comma, invalid token
        p!("[val: left={ a: 2, b: false 🌎 }]" =>
            [func!("val": (), {
                "left" => object! {
                    "a" => Num(2.0),
                    "b" => Bool(false),
                }
            })],
            [(0:27, 0:27, "expected comma"),
             (0:28, 0:29, "expected key, found invalid token")],
        );
    }

    #[test]
    fn parse_nested_tuples_and_objects() {
        p!("[val: (1, { ab: (), d: (3, 14pt) }), false]" => [func!("val": (
            tuple!(
                Num(1.0),
                object!(
                    "ab" => tuple!(),
                    "d" => tuple!(Num(3.0), Pt(14.0)),
                ),
            ),
            Bool(false),
        ), {})]);
    }

    #[test]
    fn parse_one_keyword_argument() {
        // Correct
        p!("[val: x=true]" =>
            [func!("val": (), { "x" => Bool(true) })], [],
            [(0:6, 0:7, ArgumentKey), (0:1, 0:4, ValidFuncName)],
        );

        // Spacing around keyword arguments
        p!("\n [val: \n hi \n = /* //\n */ \"s\n\"]" =>
            [S, func!("val": (), { "hi" => Str("s\n") })], [],
            [(2:1, 2:3, ArgumentKey), (1:2, 1:5, ValidFuncName)],
        );

        // Missing value
        p!("[val: x=]" =>
            [func!("val")],
            [(0:8, 0:8, "expected value")],
            [(0:6, 0:7, ArgumentKey), (0:1, 0:4, ValidFuncName)],
        );
    }

    #[test]
    fn parse_multiple_mixed_arguments() {
        p!("[val: a,]" => [func!("val": (Id("a")), {})]);
        p!("[val: 12pt, key=value]" =>
            [func!("val": (Pt(12.0)), { "key" => Id("value") })], [],
            [(0:12, 0:15, ArgumentKey), (0:1, 0:4, ValidFuncName)],
        );
        p!("[val: a , \"b\" , c]" => [func!("val": (Id("a"), Str("b"), Id("c")), {})]);
    }

    #[test]
    fn parse_invalid_values() {
        p!("[val: )]"     => [func!("val")], [(0:6, 0:7, "expected argument, found closing paren")]);
        p!("[val: }]"     => [func!("val")], [(0:6, 0:7, "expected argument, found closing brace")]);
        p!("[val: :]"     => [func!("val")], [(0:6, 0:7, "expected argument, found colon")]);
        p!("[val: ,]"     => [func!("val")], [(0:6, 0:7, "expected argument, found comma")]);
        p!("[val: =]"     => [func!("val")], [(0:6, 0:7, "expected argument, found equals sign")]);
        p!("[val: 🌎]"    => [func!("val")], [(0:6, 0:7, "expected argument, found invalid token")]);
        p!("[val: 12ept]" => [func!("val")], [(0:6, 0:11, "expected argument, found invalid token")]);
        p!("[val: [hi]]"  =>
            [func!("val")],
            [(0:6, 0:10, "expected argument, found function")],
            [(0:1, 0:4, ValidFuncName)],
        );
    }

    #[test]
    fn parse_invalid_key_value_pairs() {
        // Invalid keys
        p!("[val: true=you]" =>
            [func!("val": (Bool(true), Id("you")), {})],
            [(0:10, 0:10, "expected comma"),
             (0:10, 0:11, "expected argument, found equals sign")],
            [(0:1, 0:4, ValidFuncName)],
        );

        p!("[box: z=y=4]" =>
            [func!("box": (Num(4.0)), { "z" => Id("y") })],
            [(0:9, 0:9, "expected comma"),
             (0:9, 0:10, "expected argument, found equals sign")],
        );

        // Invalid colon after keyable positional argument
        p!("[val: key:12]" =>
            [func!("val": (Id("key"), Num(12.0)), {})],
            [(0:9, 0:9, "expected comma"),
             (0:9, 0:10, "expected argument, found colon")],
            [(0:1, 0:4, ValidFuncName)],
        );

        // Invalid colon after non-keyable positional argument
        p!("[val: true:12]" => [func!("val": (Bool(true), Num(12.0)), {})],
            [(0:10, 0:10, "expected comma"),
             (0:10, 0:11, "expected argument, found colon")],
            [(0:1, 0:4, ValidFuncName)],
        );
    }

    #[test]
    fn parse_invalid_commas() {
        // Missing commas
        p!("[val: 1pt 1]" =>
            [func!("val": (Pt(1.0), Num(1.0)), {})],
            [(0:9, 0:9, "expected comma")],
        );
        p!(r#"[val: _"s"]"# =>
            [func!("val": (Id("_"), Str("s")), {})],
            [(0:7, 0:7, "expected comma")],
        );

        // Unexpected commas
        p!("[val:,]" => [func!("val")], [(0:5, 0:6, "expected argument, found comma")]);
        p!("[val: key=,]" => [func!("val")], [(0:10, 0:11, "expected value, found comma")]);
        p!("[val:, true]" =>
            [func!("val": (Bool(true)), {})],
            [(0:5, 0:6, "expected argument, found comma")],
        );
    }

    #[test]
    fn parse_bodies() {
        p!("[val][Hi]" => [func!("val"; [T("Hi")])]);

        // Body nodes in bodies.
        p!("[val:*][*Hi*]" =>
            [func!("val"; [Bold, T("Hi"), Bold])],
            [(0:5, 0:6, "expected argument, found invalid token")],
        );

        // Errors in bodies.
        p!(" [val][ */ ]" =>
            [S, func!("val"; [S, S])],
            [(0:8, 0:10, "unexpected end of block comment")],
        );
    }

    #[test]
    fn parse_spanned_functions() {
        // Space before function
        p!(" [val]" =>
            [(0:0, 0:1, S), (0:1, 0:6, func!((0:1, 0:4, "val")))], [],
            [(0:2, 0:5, ValidFuncName)],
        );

        // Newline before function
        p!(" \n\r\n[val]" =>
            [(0:0, 2:0, Parbreak), (2:0, 2:5, func!((0:1, 0:4, "val")))], [],
            [(2:1, 2:4, ValidFuncName)],
        );

        // Content before function
        p!("hello [val][world] 🌎" =>
            [
                (0:0, 0:5, T("hello")),
                (0:5, 0:6, S),
                (0:6, 0:18, func!((0:1, 0:4, "val"); [(0:6, 0:11, T("world"))])),
                (0:18, 0:19, S),
                (0:19, 0:20, T("🌎"))
            ], [],
            [(0:7, 0:10, ValidFuncName)],
        );

        // Nested function
        p!(" [val][\nbody[ box]\n ]" =>
            [
                (0:0, 0:1, S),
                (0:1, 2:2, func!((0:1, 0:4, "val"); [
                    (0:6, 1:0, S),
                    (1:0, 1:4, T("body")),
                    (1:4, 1:10, func!((0:2, 0:5, "box"))),
                    (1:10, 2:1, S),
                ]))
            ], [],
            [(0:2, 0:5, ValidFuncName), (1:6, 1:9, ValidFuncName)],
        );
    }
}