thp/src/syntax/utils.rs

use crate::lexic::token::{Token, TokenType};

use super::{ParsingError, ParsingResult};

/// Lookup of the next significant token in a sequence of tokens.
pub trait Tokenizer {
    /// Returns a reference to a token paired with its position, or `None`.
    ///
    /// The `Vec<Token>` implementation in this file begins at `index` and skips
    /// over `INDENT`, `DEDENT` and `NewLine` tokens; the position returned is
    /// the index of the token that was found, not the index after it.
    fn get_significant<'a>(&'a self, index: usize) -> Option<(&'a Token, usize)>;
}

impl Tokenizer for Vec<Token> {
    /// Scans forward from `index` and yields the first token that is not an
    /// `INDENT`, `DEDENT` or `NewLine`, together with the position where it
    /// was found.
    ///
    /// Yields `None` when no such token exists at or after `index`.
    fn get_significant<'a>(&'a self, index: usize) -> Option<(&'a Token, usize)> {
        self.iter()
            .enumerate()
            .skip(index)
            // A token is significant when it is none of the layout tokens.
            .find(|(_, candidate)| {
                candidate.token_type != TokenType::INDENT
                    && candidate.token_type != TokenType::DEDENT
                    && candidate.token_type != TokenType::NewLine
            })
            .map(|(found_at, candidate)| (candidate, found_at))
    }
}

/// Checks that the token located exactly at `pos` is an operator whose value
/// equals `operator`. No whitespace or newline tokens are skipped.
///
/// On success returns the token and the position right after it (`pos + 1`).
///
/// Fails with `ParsingError::Unmatched` when there is no token at `pos` or the
/// token is a `NewLine` or `EOF`, and with `ParsingError::Mismatch` (carrying
/// the token found) in every other case.
pub fn try_operator(tokens: &Vec<Token>, pos: usize, operator: String) -> ParsingResult<&Token> {
    // Running out of tokens is reported the same way as hitting a line end.
    let candidate = match tokens.get(pos) {
        Some(candidate) => candidate,
        None => return Err(ParsingError::Unmatched),
    };

    let kind = &candidate.token_type;

    if *kind == TokenType::Operator && candidate.value == operator {
        Ok((candidate, pos + 1))
    } else if *kind == TokenType::NewLine || *kind == TokenType::EOF {
        Err(ParsingError::Unmatched)
    } else {
        Err(ParsingError::Mismatch(candidate))
    }
}

/// Expects the first significant token at or after `pos` to be of type
/// `token_type`, and returns that token and the position right after it.
///
/// Leading `INDENT`, `DEDENT` and `NewLine` tokens are skipped before the
/// comparison. As a consequence, asking for one of those three types can
/// never succeed.
///
/// # Errors
///
/// - `ParsingError::Unmatched` if the tokens run out, or if the token found
///   is an `EOF` (and `EOF` was not the requested type).
/// - `ParsingError::Mismatch`, carrying the token found, for any other type.
pub fn parse_token_type(
    tokens: &Vec<Token>,
    pos: usize,
    token_type: TokenType,
) -> ParsingResult<&Token> {
    let mut current_pos = pos;

    // Skip indentation changes and newlines; nothing else is ignored.
    while let Some(t) = tokens.get(current_pos) {
        let is_layout = t.token_type == TokenType::INDENT
            || t.token_type == TokenType::DEDENT
            || t.token_type == TokenType::NewLine;

        if !is_layout {
            break;
        }
        current_pos += 1;
    }

    // The loop above guarantees the token here (if any) is not a `NewLine`,
    // so only `EOF` needs to be treated as "nothing to match".
    match tokens.get(current_pos) {
        Some(t) if t.token_type == token_type => Ok((t, current_pos + 1)),
        Some(t) if t.token_type == TokenType::EOF => Err(ParsingError::Unmatched),
        Some(t) => Err(ParsingError::Mismatch(t)),
        None => Err(ParsingError::Unmatched),
    }
}
Parsing refactor pt4 2024-03-15 21:59:28 +00:00			`use crate::lexic::token::{Token, TokenType};`
Parse minimal function declaration 2023-09-09 01:17:46 +00:00
Refactor parsing pt3 2024-03-15 21:56:45 +00:00			`use super::{ParsingError, ParsingResult};`
[syntax] Alternative function to expect tokens 2023-09-20 01:06:38 +00:00
Use expressions as a function call callable 2024-01-02 17:45:45 +00:00			`pub trait Tokenizer {`
			`fn get_significant<'a>(&'a self, index: usize) -> Option<(&'a Token, usize)>;`
			`}`

			`impl Tokenizer for Vec<Token> {`
			`/// Returns the first non whitespace token at index & the position the found token`
			`fn get_significant<'a>(&'a self, index: usize) -> Option<(&'a Token, usize)> {`
			`let mut current_pos = index;`

			`// Ignore all whitespace and newlines`
			`loop {`
			`match self.get(current_pos) {`
			`Some(token) => {`
			`if token.token_type == TokenType::INDENT`
			`\|\| token.token_type == TokenType::DEDENT`
			`\|\| token.token_type == TokenType::NewLine`
			`{`
			`current_pos += 1;`
			`} else {`
			`return Some((token, current_pos));`
			`}`
			`}`
			`None => return None,`
			`}`
			`}`
			`}`
			`}`

Simplify ParseResult struct 2024-03-15 20:49:02 +00:00			/// Expects the token at `pos` to be an operator of value `operator`. Doesn't ignore whitespace or newlines
Parsing refactor pt4 2024-03-15 21:59:28 +00:00			`pub fn try_operator(tokens: &Vec<Token>, pos: usize, operator: String) -> ParsingResult<&Token> {`
[Syntax] Refactor binding parsing 2023-10-06 01:26:47 +00:00			`match tokens.get(pos) {`
Parsing refactor pt4 2024-03-15 21:59:28 +00:00			`Some(t) if t.token_type == TokenType::Operator && t.value == operator => Ok((t, pos + 1)),`
[Syntax] Refactor binding parsing 2023-10-06 01:26:47 +00:00			`Some(t) if t.token_type == TokenType::NewLine \|\| t.token_type == TokenType::EOF => {`
Parsing refactor pt4 2024-03-15 21:59:28 +00:00			`Err(ParsingError::Unmatched)`
[Syntax] Refactor binding parsing 2023-10-06 01:26:47 +00:00			`}`
Parsing refactor pt4 2024-03-15 21:59:28 +00:00			`Some(t) => Err(ParsingError::Mismatch(t)),`
			`None => Err(ParsingError::Unmatched),`
[Syntax] Refactor binding parsing 2023-10-06 01:26:47 +00:00			`}`
			`}`

Refactor parsing return values 2024-03-15 21:07:28 +00:00			/// Expects the token at `pos` to be of type `token_type`, and returns the token and the next position.
			`///`
refactor syntax result pt2 2024-03-15 21:44:29 +00:00			`/// Ignores all whitespace and newlines.`
Refactor parsing pt3 2024-03-15 21:56:45 +00:00			`///`
refactor syntax result pt2 2024-03-15 21:44:29 +00:00			`/// Only returns: Ok, Unmatched, Mismatched`
Parse minimal block of code 2023-09-21 00:53:46 +00:00			`pub fn parse_token_type(`
			`tokens: &Vec<Token>,`
			`pos: usize,`
			`token_type: TokenType,`
Refactor parsing pt3 2024-03-15 21:56:45 +00:00			`) -> ParsingResult<&Token> {`
Parse minimal block of code 2023-09-21 00:53:46 +00:00			`let mut current_pos = pos;`

Refactor parsing pt5 2024-03-15 22:42:35 +00:00			`// Ignore all whitespace, newlines and semicolons`
Parse minimal block of code 2023-09-21 00:53:46 +00:00			`while let Some(t) = tokens.get(current_pos) {`
			`if t.token_type == TokenType::INDENT`
			`\|\| t.token_type == TokenType::DEDENT`
			`\|\| t.token_type == TokenType::NewLine`
			`{`
			`current_pos += 1;`
			`} else {`
			`break;`
			`}`
			`}`

			`match tokens.get(current_pos) {`
Refactor parsing pt3 2024-03-15 21:56:45 +00:00			`Some(t) if t.token_type == token_type => Ok((t, current_pos + 1)),`
Parse minimal block of code 2023-09-21 00:53:46 +00:00			`Some(t) if t.token_type == TokenType::EOF \|\| t.token_type == TokenType::NewLine => {`
Refactor parsing pt3 2024-03-15 21:56:45 +00:00			`Err(ParsingError::Unmatched)`
Parse minimal block of code 2023-09-21 00:53:46 +00:00			`}`
Refactor parsing pt3 2024-03-15 21:56:45 +00:00			`Some(t) => Err(ParsingError::Mismatch(t)),`
			`None => Err(ParsingError::Unmatched),`
Parse minimal block of code 2023-09-21 00:53:46 +00:00			`}`
			`}`
Parse function return datatype 2024-03-18 14:20:21 +00:00