From f4f83af7831c309923feaf453069a6a75e181084 Mon Sep 17 00:00:00 2001 From: Nadrieril Date: Wed, 11 Sep 2019 21:11:39 +0200 Subject: Rename match_inputs to match_nodes to reflect new terminology --- dhall_syntax/src/parser.rs | 76 +++++------ pest_consume/examples/csv/main.rs | 10 +- pest_consume/src/lib.rs | 2 +- pest_consume_macros/src/lib.rs | 6 +- pest_consume_macros/src/match_inputs.rs | 218 -------------------------------- pest_consume_macros/src/match_nodes.rs | 218 ++++++++++++++++++++++++++++++++ 6 files changed, 265 insertions(+), 265 deletions(-) delete mode 100644 pest_consume_macros/src/match_inputs.rs create mode 100644 pest_consume_macros/src/match_nodes.rs diff --git a/dhall_syntax/src/parser.rs b/dhall_syntax/src/parser.rs index d945435..c0b9712 100644 --- a/dhall_syntax/src/parser.rs +++ b/dhall_syntax/src/parser.rs @@ -6,7 +6,7 @@ use std::rc::Rc; use dgp::Rule; use dhall_generated_parser as dgp; -use pest_consume::{match_inputs, Parser}; +use pest_consume::{match_nodes, Parser}; use crate::map::{DupTreeMap, DupTreeSet}; use crate::ExprF::*; @@ -167,7 +167,7 @@ impl DhallParser { fn double_quote_literal( input: ParseInput, ) -> ParseResult> { - Ok(match_inputs!(input.children(); + Ok(match_nodes!(input.children(); [double_quote_chunk(chunks)..] => { chunks.collect() } @@ -177,7 +177,7 @@ impl DhallParser { fn double_quote_chunk( input: ParseInput, ) -> ParseResult> { - Ok(match_inputs!(input.children(); + Ok(match_nodes!(input.children(); [expression(e)] => { InterpolatedTextContents::Expr(e) }, @@ -264,7 +264,7 @@ impl DhallParser { fn single_quote_literal( input: ParseInput, ) -> ParseResult> { - Ok(match_inputs!(input.children(); + Ok(match_nodes!(input.children(); [single_quote_continue(lines)] => { let newline: ParsedText = "\n".to_string().into(); @@ -303,7 +303,7 @@ impl DhallParser { fn single_quote_continue( input: ParseInput, ) -> ParseResult>>> { - Ok(match_inputs!(input.children(); + Ok(match_nodes!(input.children(); [expression(e), single_quote_continue(lines)] => { let c = InterpolatedTextContents::Expr(e); let mut lines = lines; @@ -388,7 +388,7 @@ impl DhallParser { #[alias(expression, shortcut = true)] fn identifier(input: ParseInput) -> ParseResult> { - Ok(match_inputs!(input.children(); + Ok(match_nodes!(input.children(); [variable(v)] => { spanned(input, Var(v)) }, @@ -397,7 +397,7 @@ impl DhallParser { } fn variable(input: ParseInput) -> ParseResult> { - Ok(match_inputs!(input.children(); + Ok(match_nodes!(input.children(); [label(l), natural_literal(idx)] => { V(l, idx) }, @@ -439,7 +439,7 @@ impl DhallParser { .collect()) } fn path(input: ParseInput) -> ParseResult> { - Ok(match_inputs!(input.children(); + Ok(match_nodes!(input.children(); [path_component(components)..] => { components.collect() } @@ -450,7 +450,7 @@ impl DhallParser { fn local( input: ParseInput, ) -> ParseResult>> { - Ok(match_inputs!(input.children(); + Ok(match_nodes!(input.children(); [local_path((prefix, p))] => ImportLocation::Local(prefix, p), )) } @@ -459,19 +459,19 @@ impl DhallParser { fn parent_path( input: ParseInput, ) -> ParseResult<(FilePrefix, Vec)> { - Ok(match_inputs!(input.children(); + Ok(match_nodes!(input.children(); [path(p)] => (FilePrefix::Parent, p) )) } #[alias(local_path)] fn here_path(input: ParseInput) -> ParseResult<(FilePrefix, Vec)> { - Ok(match_inputs!(input.children(); + Ok(match_nodes!(input.children(); [path(p)] => (FilePrefix::Here, p) )) } #[alias(local_path)] fn home_path(input: ParseInput) -> ParseResult<(FilePrefix, Vec)> { - Ok(match_inputs!(input.children(); + Ok(match_nodes!(input.children(); [path(p)] => (FilePrefix::Home, p) )) } @@ -479,7 +479,7 @@ impl DhallParser { fn absolute_path( input: ParseInput, ) -> ParseResult<(FilePrefix, Vec)> { - Ok(match_inputs!(input.children(); + Ok(match_nodes!(input.children(); [path(p)] => (FilePrefix::Absolute, p) )) } @@ -493,7 +493,7 @@ impl DhallParser { } fn http_raw(input: ParseInput) -> ParseResult>> { - Ok(match_inputs!(input.children(); + Ok(match_nodes!(input.children(); [scheme(sch), authority(auth), path(p)] => URL { scheme: sch, authority: auth, @@ -523,7 +523,7 @@ impl DhallParser { fn http( input: ParseInput, ) -> ParseResult>> { - Ok(ImportLocation::Remote(match_inputs!(input.children(); + Ok(ImportLocation::Remote(match_nodes!(input.children(); [http_raw(url)] => url, [http_raw(url), expression(e)] => URL { headers: Some(e), ..url }, ))) @@ -533,7 +533,7 @@ impl DhallParser { fn env( input: ParseInput, ) -> ParseResult>> { - Ok(match_inputs!(input.children(); + Ok(match_nodes!(input.children(); [environment_variable(v)] => ImportLocation::Env(v), )) } @@ -543,7 +543,7 @@ impl DhallParser { } #[alias(environment_variable)] fn posix_environment_variable(input: ParseInput) -> ParseResult { - Ok(match_inputs!(input.children(); + Ok(match_nodes!(input.children(); [posix_environment_variable_character(chars)..] => { chars.collect() }, @@ -588,7 +588,7 @@ impl DhallParser { ) -> ParseResult>> { use crate::Import; let mode = ImportMode::Code; - Ok(match_inputs!(input.children(); + Ok(match_nodes!(input.children(); [import_type(location)] => Import { mode, location, hash: None }, [import_type(location), hash(h)] => Import { mode, location, hash: Some(h) }, )) @@ -606,7 +606,7 @@ impl DhallParser { #[alias(expression)] fn import(input: ParseInput) -> ParseResult> { use crate::Import; - let import = match_inputs!(input.children(); + let import = match_nodes!(input.children(); [import_hashed(imp)] => { Import { mode: ImportMode::Code, ..imp } }, @@ -641,13 +641,13 @@ impl DhallParser { #[alias(expression)] fn empty_list_literal(input: ParseInput) -> ParseResult> { - Ok(match_inputs!(input.children(); + Ok(match_nodes!(input.children(); [expression(e)] => spanned(input, EmptyListLit(e)), )) } fn expression(input: ParseInput) -> ParseResult> { - Ok(match_inputs!(input.children(); + Ok(match_nodes!(input.children(); [lambda(()), label(l), expression(typ), arrow(()), expression(body)] => { spanned(input, Lam(l, typ, body)) @@ -694,7 +694,7 @@ impl DhallParser { fn let_binding( input: ParseInput, ) -> ParseResult<(Label, Option>, Expr, Span)> { - Ok(match_inputs!(input.children(); + Ok(match_nodes!(input.children(); [label(name), expression(annot), expression(expr)] => (name, Some(annot), expr, input_to_span(input)), [label(name), expression(expr)] => @@ -744,7 +744,7 @@ impl DhallParser { fn application_expression( input: ParseInput, ) -> ParseResult> { - Ok(match_inputs!(input.children(); + Ok(match_nodes!(input.children(); [expression(e)] => e, [expression(first), expression(rest)..] => { rest.fold( @@ -765,7 +765,7 @@ impl DhallParser { fn first_application_expression( input: ParseInput, ) -> ParseResult> { - Ok(match_inputs!(input.children(); + Ok(match_nodes!(input.children(); [Some_(()), expression(e)] => { spanned(input, SomeLit(e)) }, @@ -783,7 +783,7 @@ impl DhallParser { fn selector_expression( input: ParseInput, ) -> ParseResult> { - Ok(match_inputs!(input.children(); + Ok(match_nodes!(input.children(); [expression(e)] => e, [expression(first), selector(rest)..] => { rest.fold( @@ -806,7 +806,7 @@ impl DhallParser { fn selector( input: ParseInput, ) -> ParseResult<(Either>, Span)> { - Ok(match_inputs!(input.children(); + Ok(match_nodes!(input.children(); [label(l)] => (Either::Left(l), input_to_span(input)), [labels(ls)] => (Either::Right(ls), input_to_span(input)), // [expression(_e)] => unimplemented!("selection by expression"), // TODO @@ -814,7 +814,7 @@ impl DhallParser { } fn labels(input: ParseInput) -> ParseResult> { - Ok(match_inputs!(input.children(); + Ok(match_nodes!(input.children(); [label(ls)..] => ls.collect(), )) } @@ -823,7 +823,7 @@ impl DhallParser { fn primitive_expression( input: ParseInput, ) -> ParseResult> { - Ok(match_inputs!(input.children(); + Ok(match_nodes!(input.children(); [double_literal(n)] => spanned(input, DoubleLit(n)), [natural_literal(n)] => spanned(input, NaturalLit(n)), [integer_literal(n)] => spanned(input, IntegerLit(n)), @@ -849,7 +849,7 @@ impl DhallParser { fn non_empty_record_type_or_literal( input: ParseInput, ) -> ParseResult> { - let e = match_inputs!(input.children(); + let e = match_nodes!(input.children(); [label(first_label), non_empty_record_type(rest)] => { let (first_expr, mut map) = rest; map.insert(first_label, first_expr); @@ -867,7 +867,7 @@ impl DhallParser { fn non_empty_record_type( input: ParseInput, ) -> ParseResult<(Expr, DupTreeMap>)> { - Ok(match_inputs!(input.children(); + Ok(match_nodes!(input.children(); [expression(expr), record_type_entry(entries)..] => { (expr, entries.collect()) } @@ -877,7 +877,7 @@ impl DhallParser { fn record_type_entry( input: ParseInput, ) -> ParseResult<(Label, Expr)> { - Ok(match_inputs!(input.children(); + Ok(match_nodes!(input.children(); [label(name), expression(expr)] => (name, expr) )) } @@ -885,7 +885,7 @@ impl DhallParser { fn non_empty_record_literal( input: ParseInput, ) -> ParseResult<(Expr, DupTreeMap>)> { - Ok(match_inputs!(input.children(); + Ok(match_nodes!(input.children(); [expression(expr), record_literal_entry(entries)..] => { (expr, entries.collect()) } @@ -895,14 +895,14 @@ impl DhallParser { fn record_literal_entry( input: ParseInput, ) -> ParseResult<(Label, Expr)> { - Ok(match_inputs!(input.children(); + Ok(match_nodes!(input.children(); [label(name), expression(expr)] => (name, expr) )) } #[alias(expression)] fn union_type(input: ParseInput) -> ParseResult> { - let map = match_inputs!(input.children(); + let map = match_nodes!(input.children(); [empty_union_type(_)] => Default::default(), [union_type_entry(entries)..] => entries.collect(), ); @@ -916,7 +916,7 @@ impl DhallParser { fn union_type_entry( input: ParseInput, ) -> ParseResult<(Label, Option>)> { - Ok(match_inputs!(input.children(); + Ok(match_nodes!(input.children(); [label(name), expression(expr)] => (name, Some(expr)), [label(name)] => (name, None), )) @@ -926,7 +926,7 @@ impl DhallParser { fn non_empty_list_literal( input: ParseInput, ) -> ParseResult> { - Ok(match_inputs!(input.children(); + Ok(match_nodes!(input.children(); [expression(items)..] => spanned( input, NEListLit(items.collect()) @@ -936,7 +936,7 @@ impl DhallParser { #[alias(expression)] fn final_expression(input: ParseInput) -> ParseResult> { - Ok(match_inputs!(input.children(); + Ok(match_nodes!(input.children(); [expression(e), EOI(_)] => e )) } @@ -949,7 +949,7 @@ pub fn parse_expr(input_str: &str) -> ParseResult> { input_str, rc_input_str, )?; - Ok(match_inputs!(; inputs; + Ok(match_nodes!(; inputs; [expression(e)] => e, )) } diff --git a/pest_consume/examples/csv/main.rs b/pest_consume/examples/csv/main.rs index 037948b..bb9f8fc 100644 --- a/pest_consume/examples/csv/main.rs +++ b/pest_consume/examples/csv/main.rs @@ -1,5 +1,5 @@ #![feature(slice_patterns)] -use pest_consume::{match_inputs, Parser}; +use pest_consume::{match_nodes, Parser}; #[derive(pest_derive::Parser)] #[grammar = "../examples/csv/csv.pest"] @@ -32,20 +32,20 @@ impl CSVParser { } fn field(input: Node) -> ParseResult { - Ok(match_inputs!(input.children(); + Ok(match_nodes!(input.children(); [number(n)] => CSVField::Number(n), [string(s)] => CSVField::String(s), )) } fn record(input: Node) -> ParseResult { - Ok(match_inputs!(input.children(); + Ok(match_nodes!(input.children(); [field(fields)..] => fields.collect(), )) } fn file(input: Node) -> ParseResult { - Ok(match_inputs!(input.children(); + Ok(match_nodes!(input.children(); [record(records).., EOI(_)] => records.collect(), )) } @@ -53,7 +53,7 @@ impl CSVParser { fn parse_csv(input_str: &str) -> ParseResult { let inputs = CSVParser::parse(Rule::file, input_str)?; - Ok(match_inputs!(; inputs; + Ok(match_nodes!(; inputs; [file(e)] => e, )) } diff --git a/pest_consume/src/lib.rs b/pest_consume/src/lib.rs index f14f6f5..319810a 100644 --- a/pest_consume/src/lib.rs +++ b/pest_consume/src/lib.rs @@ -7,7 +7,7 @@ use pest::Parser as PestParser; use pest::RuleType; #[proc_macro_hack::proc_macro_hack] -pub use pest_consume_macros::match_inputs; +pub use pest_consume_macros::match_nodes; pub use pest_consume_macros::parser; mod node { diff --git a/pest_consume_macros/src/lib.rs b/pest_consume_macros/src/lib.rs index 7f9f464..d726b5d 100644 --- a/pest_consume_macros/src/lib.rs +++ b/pest_consume_macros/src/lib.rs @@ -6,7 +6,7 @@ extern crate proc_macro; mod make_parser; -mod match_inputs; +mod match_nodes; use proc_macro::TokenStream; @@ -19,8 +19,8 @@ pub fn parser(attrs: TokenStream, input: TokenStream) -> TokenStream { } #[proc_macro_hack::proc_macro_hack] -pub fn match_inputs(input: TokenStream) -> TokenStream { - TokenStream::from(match match_inputs::match_inputs(input) { +pub fn match_nodes(input: TokenStream) -> TokenStream { + TokenStream::from(match match_nodes::match_nodes(input) { Ok(tokens) => tokens, Err(err) => err.to_compile_error(), }) diff --git a/pest_consume_macros/src/match_inputs.rs b/pest_consume_macros/src/match_inputs.rs deleted file mode 100644 index 773f806..0000000 --- a/pest_consume_macros/src/match_inputs.rs +++ /dev/null @@ -1,218 +0,0 @@ -use proc_macro2::{Span, TokenStream}; -use quote::quote; -use syn::parse::{Parse, ParseStream, Result}; -use syn::punctuated::Punctuated; -use syn::spanned::Spanned; -use syn::{ - bracketed, parenthesized, parse_quote, token, Error, Expr, Ident, Pat, - Token, Type, -}; - -#[derive(Debug, Clone)] -struct ChildrenBranch { - pattern_span: Span, - pattern: Punctuated, - body: Expr, -} - -#[derive(Debug, Clone)] -enum ChildrenBranchPatternItem { - Single { rule_name: Ident, binder: Pat }, - Multiple { rule_name: Ident, binder: Ident }, -} - -#[derive(Debug, Clone)] -struct ParseChildrenInput { - parser: Type, - input_expr: Expr, - branches: Punctuated, -} - -impl Parse for ChildrenBranch { - fn parse(input: ParseStream) -> Result { - let contents; - let _: token::Bracket = bracketed!(contents in input); - let pattern_unparsed: TokenStream = contents.fork().parse()?; - let pattern_span = pattern_unparsed.span(); - let pattern = Punctuated::parse_terminated(&contents)?; - let _: Token![=>] = input.parse()?; - let body = input.parse()?; - - Ok(ChildrenBranch { - pattern_span, - pattern, - body, - }) - } -} - -impl Parse for ChildrenBranchPatternItem { - fn parse(input: ParseStream) -> Result { - let contents; - let rule_name = input.parse()?; - parenthesized!(contents in input); - if input.peek(Token![..]) { - let binder = contents.parse()?; - let _: Token![..] = input.parse()?; - Ok(ChildrenBranchPatternItem::Multiple { rule_name, binder }) - } else if input.is_empty() || input.peek(Token![,]) { - let binder = contents.parse()?; - Ok(ChildrenBranchPatternItem::Single { rule_name, binder }) - } else { - Err(input.error("expected `..` or nothing")) - } - } -} - -impl Parse for ParseChildrenInput { - fn parse(input: ParseStream) -> Result { - let parser = if input.peek(token::Lt) { - let _: token::Lt = input.parse()?; - let parser = input.parse()?; - let _: token::Gt = input.parse()?; - let _: Token![;] = input.parse()?; - parser - } else { - parse_quote!(Self) - }; - let input_expr = input.parse()?; - let _: Token![;] = input.parse()?; - let branches = Punctuated::parse_terminated(input)?; - - Ok(ParseChildrenInput { - parser, - input_expr, - branches, - }) - } -} - -fn make_parser_branch( - branch: &ChildrenBranch, - i_inputs: &Ident, - parser: &Type, -) -> Result { - use ChildrenBranchPatternItem::{Multiple, Single}; - - let body = &branch.body; - let aliased_rule = quote!(<#parser as ::pest_consume::Parser>::AliasedRule); - - // Convert the input pattern into a pattern-match on the Rules of the children. This uses - // slice_patterns. - // A single pattern just checks that the rule matches; a variable-length pattern binds the - // subslice and checks, in the if-guard, that its elements all match the chosen Rule. - let i_variable_pattern = - Ident::new("___variable_pattern", Span::call_site()); - let match_pat = branch.pattern.iter().map(|item| match item { - Single { rule_name, .. } => quote!(#aliased_rule::#rule_name), - Multiple { .. } => quote!(#i_variable_pattern @ ..), - }); - let match_filter = branch.pattern.iter().map(|item| match item { - Single { .. } => quote!(), - Multiple { rule_name, .. } => quote!( - { - // We can't use .all() directly in the pattern guard; see - // https://github.com/rust-lang/rust/issues/59803. - let all_match = |slice: &[_]| { - slice.iter().all(|r| - *r == #aliased_rule::#rule_name - ) - }; - all_match(#i_variable_pattern) - } && - ), - }); - - // Once we have found a branch that matches, we need to parse the children. - let mut singles_before_multiple = Vec::new(); - let mut multiple = None; - let mut singles_after_multiple = Vec::new(); - for item in &branch.pattern { - match item { - Single { - rule_name, binder, .. - } => { - if multiple.is_none() { - singles_before_multiple.push((rule_name, binder)) - } else { - singles_after_multiple.push((rule_name, binder)) - } - } - Multiple { - rule_name, binder, .. - } => { - if multiple.is_none() { - multiple = Some((rule_name, binder)) - } else { - return Err(Error::new( - branch.pattern_span.clone(), - "multiple variable-length patterns are not allowed", - )); - } - } - } - } - let mut parses = Vec::new(); - for (rule_name, binder) in singles_before_multiple.into_iter() { - parses.push(quote!( - let #binder = #parser::#rule_name( - #i_inputs.next().unwrap() - )?; - )) - } - // Note the `rev()`: we are taking inputs from the end of the iterator in reverse order, so that - // only the unmatched inputs are left for the variable-length pattern, if any. - for (rule_name, binder) in singles_after_multiple.into_iter().rev() { - parses.push(quote!( - let #binder = #parser::#rule_name( - #i_inputs.next_back().unwrap() - )?; - )) - } - if let Some((rule_name, binder)) = multiple { - parses.push(quote!( - let #binder = #i_inputs - .map(|i| #parser::#rule_name(i)) - .collect::, _>>()? - .into_iter(); - )) - } - - Ok(quote!( - [#(#match_pat),*] if #(#match_filter)* true => { - #(#parses)* - #body - } - )) -} - -pub fn match_inputs( - input: proc_macro::TokenStream, -) -> Result { - let input: ParseChildrenInput = syn::parse(input)?; - - let i_input_rules = Ident::new("___input_rules", Span::call_site()); - let i_inputs = Ident::new("___inputs", Span::call_site()); - - let input_expr = &input.input_expr; - let parser = &input.parser; - let branches = input - .branches - .iter() - .map(|br| make_parser_branch(br, &i_inputs, parser)) - .collect::>>()?; - - Ok(quote!({ - #[allow(unused_mut)] - let mut #i_inputs = #input_expr; - let #i_input_rules = #i_inputs.aliased_rules::<#parser>(); - - #[allow(unreachable_code)] - match #i_input_rules.as_slice() { - #(#branches,)* - [..] => return Err(#i_inputs.error( - format!("Unexpected children: {:?}", #i_input_rules) - )), - } - })) -} diff --git a/pest_consume_macros/src/match_nodes.rs b/pest_consume_macros/src/match_nodes.rs new file mode 100644 index 0000000..251b7ef --- /dev/null +++ b/pest_consume_macros/src/match_nodes.rs @@ -0,0 +1,218 @@ +use proc_macro2::{Span, TokenStream}; +use quote::quote; +use syn::parse::{Parse, ParseStream, Result}; +use syn::punctuated::Punctuated; +use syn::spanned::Spanned; +use syn::{ + bracketed, parenthesized, parse_quote, token, Error, Expr, Ident, Pat, + Token, Type, +}; + +#[derive(Debug, Clone)] +struct ChildrenBranch { + pattern_span: Span, + pattern: Punctuated, + body: Expr, +} + +#[derive(Debug, Clone)] +enum ChildrenBranchPatternItem { + Single { rule_name: Ident, binder: Pat }, + Multiple { rule_name: Ident, binder: Ident }, +} + +#[derive(Debug, Clone)] +struct ParseChildrenInput { + parser: Type, + input_expr: Expr, + branches: Punctuated, +} + +impl Parse for ChildrenBranch { + fn parse(input: ParseStream) -> Result { + let contents; + let _: token::Bracket = bracketed!(contents in input); + let pattern_unparsed: TokenStream = contents.fork().parse()?; + let pattern_span = pattern_unparsed.span(); + let pattern = Punctuated::parse_terminated(&contents)?; + let _: Token![=>] = input.parse()?; + let body = input.parse()?; + + Ok(ChildrenBranch { + pattern_span, + pattern, + body, + }) + } +} + +impl Parse for ChildrenBranchPatternItem { + fn parse(input: ParseStream) -> Result { + let contents; + let rule_name = input.parse()?; + parenthesized!(contents in input); + if input.peek(Token![..]) { + let binder = contents.parse()?; + let _: Token![..] = input.parse()?; + Ok(ChildrenBranchPatternItem::Multiple { rule_name, binder }) + } else if input.is_empty() || input.peek(Token![,]) { + let binder = contents.parse()?; + Ok(ChildrenBranchPatternItem::Single { rule_name, binder }) + } else { + Err(input.error("expected `..` or nothing")) + } + } +} + +impl Parse for ParseChildrenInput { + fn parse(input: ParseStream) -> Result { + let parser = if input.peek(token::Lt) { + let _: token::Lt = input.parse()?; + let parser = input.parse()?; + let _: token::Gt = input.parse()?; + let _: Token![;] = input.parse()?; + parser + } else { + parse_quote!(Self) + }; + let input_expr = input.parse()?; + let _: Token![;] = input.parse()?; + let branches = Punctuated::parse_terminated(input)?; + + Ok(ParseChildrenInput { + parser, + input_expr, + branches, + }) + } +} + +fn make_parser_branch( + branch: &ChildrenBranch, + i_inputs: &Ident, + parser: &Type, +) -> Result { + use ChildrenBranchPatternItem::{Multiple, Single}; + + let body = &branch.body; + let aliased_rule = quote!(<#parser as ::pest_consume::Parser>::AliasedRule); + + // Convert the input pattern into a pattern-match on the Rules of the children. This uses + // slice_patterns. + // A single pattern just checks that the rule matches; a variable-length pattern binds the + // subslice and checks, in the if-guard, that its elements all match the chosen Rule. + let i_variable_pattern = + Ident::new("___variable_pattern", Span::call_site()); + let match_pat = branch.pattern.iter().map(|item| match item { + Single { rule_name, .. } => quote!(#aliased_rule::#rule_name), + Multiple { .. } => quote!(#i_variable_pattern @ ..), + }); + let match_filter = branch.pattern.iter().map(|item| match item { + Single { .. } => quote!(), + Multiple { rule_name, .. } => quote!( + { + // We can't use .all() directly in the pattern guard; see + // https://github.com/rust-lang/rust/issues/59803. + let all_match = |slice: &[_]| { + slice.iter().all(|r| + *r == #aliased_rule::#rule_name + ) + }; + all_match(#i_variable_pattern) + } && + ), + }); + + // Once we have found a branch that matches, we need to parse the children. + let mut singles_before_multiple = Vec::new(); + let mut multiple = None; + let mut singles_after_multiple = Vec::new(); + for item in &branch.pattern { + match item { + Single { + rule_name, binder, .. + } => { + if multiple.is_none() { + singles_before_multiple.push((rule_name, binder)) + } else { + singles_after_multiple.push((rule_name, binder)) + } + } + Multiple { + rule_name, binder, .. + } => { + if multiple.is_none() { + multiple = Some((rule_name, binder)) + } else { + return Err(Error::new( + branch.pattern_span.clone(), + "multiple variable-length patterns are not allowed", + )); + } + } + } + } + let mut parses = Vec::new(); + for (rule_name, binder) in singles_before_multiple.into_iter() { + parses.push(quote!( + let #binder = #parser::#rule_name( + #i_inputs.next().unwrap() + )?; + )) + } + // Note the `rev()`: we are taking inputs from the end of the iterator in reverse order, so that + // only the unmatched inputs are left for the variable-length pattern, if any. + for (rule_name, binder) in singles_after_multiple.into_iter().rev() { + parses.push(quote!( + let #binder = #parser::#rule_name( + #i_inputs.next_back().unwrap() + )?; + )) + } + if let Some((rule_name, binder)) = multiple { + parses.push(quote!( + let #binder = #i_inputs + .map(|i| #parser::#rule_name(i)) + .collect::, _>>()? + .into_iter(); + )) + } + + Ok(quote!( + [#(#match_pat),*] if #(#match_filter)* true => { + #(#parses)* + #body + } + )) +} + +pub fn match_nodes( + input: proc_macro::TokenStream, +) -> Result { + let input: ParseChildrenInput = syn::parse(input)?; + + let i_input_rules = Ident::new("___input_rules", Span::call_site()); + let i_inputs = Ident::new("___inputs", Span::call_site()); + + let input_expr = &input.input_expr; + let parser = &input.parser; + let branches = input + .branches + .iter() + .map(|br| make_parser_branch(br, &i_inputs, parser)) + .collect::>>()?; + + Ok(quote!({ + #[allow(unused_mut)] + let mut #i_inputs = #input_expr; + let #i_input_rules = #i_inputs.aliased_rules::<#parser>(); + + #[allow(unreachable_code)] + match #i_input_rules.as_slice() { + #(#branches,)* + [..] => return Err(#i_inputs.error( + format!("Unexpected children: {:?}", #i_input_rules) + )), + } + })) +} -- cgit v1.2.3