From 3bc982c1f0222aaa8acc037687a9b1d44578c200 Mon Sep 17 00:00:00 2001 From: Yunkai Zhang Date: Sun, 4 Feb 2024 16:02:25 +0000 Subject: [PATCH 1/3] feat: implemented non-associative parsing in Pratt parser. --- src/pratt.rs | 29 ++++++++++++++++++++++++----- 1 file changed, 24 insertions(+), 5 deletions(-) diff --git a/src/pratt.rs b/src/pratt.rs index cc617cf6..4d731efe 100644 --- a/src/pratt.rs +++ b/src/pratt.rs @@ -131,6 +131,8 @@ pub enum Associativity { Left(u16), /// Specifies that the operator should be right-associative, with the given binding power (see [`right`]). Right(u16), + /// Specifies that the operator should be non-associative, with the given binding power. + Non(u16), } /// Specifies a left [`Associativity`] with the given binding power. @@ -149,18 +151,33 @@ pub fn right(binding_power: u16) -> Associativity { Associativity::Right(binding_power) } +/// Specifies a not-associative [`Associativity`] with the given binding power. +/// +/// Not-associative operators are evaluated from the left-most terms, moving rightward. +pub fn non(binding_power: u16) -> Associativity {Associativity::Non(binding_power)} + impl Associativity { fn left_power(&self) -> u32 { match self { - Self::Left(x) => *x as u32 * 2, - Self::Right(x) => *x as u32 * 2 + 1, + Self::Left(x) => *x as u32 * 3, + Self::Right(x) => *x as u32 * 3, + Self::Non(x) => *x as u32 * 3, } } fn right_power(&self) -> u32 { match self { - Self::Left(x) => *x as u32 * 2 + 1, - Self::Right(x) => *x as u32 * 2, + Self::Left(x) => *x as u32 * 3 + 1, + Self::Right(x) => *x as u32 * 3, + Self::Non(x) => *x as u32 * 3 + 1, + } + } + + fn next_power(&self) -> u32 { + match self { + Self::Left(x) => *x as u32 * 3, + Self::Left(x) => *x as u32 * 3, + Self::Non(x) => *x as u32 * 3 - 1, } } } @@ -467,7 +484,8 @@ macro_rules! impl_pratt_for_tuple { // Infix binary operators $( let assoc = $X.associativity(); - if $X::IS_INFIX && assoc.left_power() >= min_power { + let mut upper_bound: u32 = u32::MAX; + if $X::IS_INFIX && assoc.left_power() >= min_power && assoc.left_power() <= upper_bound { match $X.op_parser().go::(inp) { Ok(op) => match recursive::recurse(|| self.pratt_go::(inp, assoc.right_power())) { Ok(rhs) => { @@ -478,6 +496,7 @@ macro_rules! impl_pratt_for_tuple { $X.fold_infix(lhs, op, rhs, &mut MapExtra::new(pre_expr.offset(), inp)) }, ); + upper_bound = assoc.next_power(); continue }, Err(()) => inp.rewind(pre_op), From 5ad8a795667a9d5f02a19286d770336860eba1e1 Mon Sep 17 00:00:00 2001 From: Yunkai Zhang Date: Sun, 4 Feb 2024 16:09:15 +0000 Subject: [PATCH 2/3] fix: fixed typo in nbp pattern matching --- src/pratt.rs | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/pratt.rs b/src/pratt.rs index 4d731efe..954c9210 100644 --- a/src/pratt.rs +++ b/src/pratt.rs @@ -176,7 +176,7 @@ impl Associativity { fn next_power(&self) -> u32 { match self { Self::Left(x) => *x as u32 * 3, - Self::Left(x) => *x as u32 * 3, + Self::Right(x) => *x as u32 * 3, Self::Non(x) => *x as u32 * 3 - 1, } } From 7185647d524b5c43cf683d846b8ea164bea99596 Mon Sep 17 00:00:00 2001 From: Yunkai Zhang Date: Mon, 5 Feb 2024 23:50:55 +0000 Subject: [PATCH 3/3] added reference description for non-associative pratt parser. --- src/pratt.rs | 9 +++++---- 1 file changed, 5 insertions(+), 4 deletions(-) diff --git a/src/pratt.rs b/src/pratt.rs index 954c9210..8c372fd7 100644 --- a/src/pratt.rs +++ b/src/pratt.rs @@ -10,6 +10,8 @@ //! ['binding power'](https://matklad.github.io/2020/04/13/simple-but-powerful-pratt-parsing.html#From-Precedence-to-Binding-Power) //! that determines how strongly operators should bind to the operands around them. //! +//! Here is ['another approach'](https://www.engr.mun.ca/~theo/Misc/pratt_parsing.htm) that provides a more comprehensive perspective of handling multiple operators and patterns +//! //! Pratt parsers are defined with the [`Parser::pratt`] method. //! //! When writing pratt parsers, it is necessary to first define an 'atomic' operand used by the parser for building up @@ -757,10 +759,9 @@ mod tests { )) .map(|x| x.to_string()); - assert_eq!( - parser.parse("1+2!$*3").into_result(), - Ok("(((1 + (2!))$) * 3)".to_string()), - ) + assert!( + parser.parse("ยง1+-~2!$*3").has_errors(), + ); } #[test]