From ae856195ea2d239080488690c27ba5f36e9d5656 Mon Sep 17 00:00:00 2001 From: AurumTheEnd <47597303+aurumtheend@users.noreply.github.com> Date: Fri, 17 May 2024 15:28:55 +0200 Subject: [PATCH] refactor(parser): made intermediate_token use consts instead of runtime iters --- src/parser/structs/intermediate_token.rs | 51 +++++++++++++++--------- src/parser/tokenize.rs | 2 +- 2 files changed, 34 insertions(+), 19 deletions(-) diff --git a/src/parser/structs/intermediate_token.rs b/src/parser/structs/intermediate_token.rs index 209f9e9..f6ca202 100644 --- a/src/parser/structs/intermediate_token.rs +++ b/src/parser/structs/intermediate_token.rs @@ -1,4 +1,3 @@ -use itertools::Itertools; use regex::RegexSet; use crate::parser::utils::LITERAL_IDENTIFIER; @@ -103,25 +102,41 @@ impl<'a> IntermediateToken<'a> { .concat() } - pub fn longest_token_len() -> usize { - Self::all_token_patterns() - .iter() - .max_by(|a, b| a.chars().count().cmp(&b.chars().count())) - .expect("No patterns defined in the library") - .chars() - .count() - } + pub const ALL_TOKEN_PATTERNS_FROM_LONGEST: [&'static str; 26] = [ + Self::FALSE_PATTERN_WORD, + Self::TRUE_PATTERN_WORD, + Self::AND_PATTERN_WORD, + Self::NOT_PATTERN_WORD, + Self::AND_PATTERN_LOGIC, + Self::OR_PATTERN_LOGIC, + Self::OR_PATTERN_WORD, + Self::AND_PATTERN_BIT, + Self::AND_PATTERN_MATH, + Self::AND_PATTERN_MATH_2, + Self::AND_PATTERN_BOOL, + Self::OR_PATTERN_BIT, + Self::OR_PATTERN_MATH, + Self::OR_PATTERN_MATH_2, + Self::OR_PATTERN_BOOL, + Self::NOT_PATTERN_TILDE, + Self::NOT_PATTERN_MARK, + Self::NOT_PATTERN_MATH, + Self::FALSE_PATTERN_CHAR, + Self::FALSE_PATTERN_NUM, + Self::TRUE_PATTERN_CHAR, + Self::TRUE_PATTERN_NUM, + Self::LITERAL_START_PATTERN, + Self::LITERAL_END_PATTERN, + Self::PARENTHESIS_START_PATTERN, + Self::PARENTHESIS_END_PATTERN, + ]; - fn all_token_patterns_ordered_from_longest() -> Vec<&'a str> { - Self::all_token_patterns() - .into_iter() - .sorted_by(|a, b| b.chars().count().cmp(&a.chars().count())) - .collect() - } + // FALSE_PATTERN_WORD == "false" + pub const LONGEST_TOKEN_LEN: usize = 5; // TODO make a trait method pub fn try_from(value: &'a str) -> Option { - let input = Self::all_token_patterns_ordered_from_longest(); + let input = Self::ALL_TOKEN_PATTERNS_FROM_LONGEST; // escape the pattern so that e.g. "^" is not treated as regex, but as a literal character for the And operation let set = RegexSet::new(input.iter().map(|pattern| { @@ -196,7 +211,7 @@ mod tests { #[test] fn test_longest() { - let actual = IntermediateToken::longest_token_len(); + let actual = IntermediateToken::LONGEST_TOKEN_LEN; let expected = IntermediateToken::FALSE_PATTERN_WORD.len(); assert_eq!(actual, expected); @@ -204,7 +219,7 @@ mod tests { #[test] fn test_ordered_patterns() { - let tokens = IntermediateToken::all_token_patterns_ordered_from_longest(); + let tokens = IntermediateToken::ALL_TOKEN_PATTERNS_FROM_LONGEST; assert!(tokens .iter() diff --git a/src/parser/tokenize.rs b/src/parser/tokenize.rs index 39086ae..ae9cb8f 100644 --- a/src/parser/tokenize.rs +++ b/src/parser/tokenize.rs @@ -17,7 +17,7 @@ fn tokenize_level( ) -> Result, TokenizeError> { let mut result = vec![]; let mut buffer = String::new(); - let take_size = IntermediateToken::longest_token_len() + 1; + let take_size = IntermediateToken::LONGEST_TOKEN_LEN + 1; // trim whitespace in case of whitespace after opening parenthesis trim_whitespace_left(input);