thp/src/syntax/utils.rs

use crate::{
    lexic::token::{Token, TokenType},
    utils::Result3,
};

use super::ParseResult;

/// Lookup of "significant" tokens in a token stream, i.e. tokens that are
/// not pure layout.
pub trait Tokenizer {
    /// Searches forward from `index` (inclusive) for the first significant token.
    ///
    /// Returns the token together with the position where it was found, or
    /// `None` if no such token exists at or after `index`.
    ///
    /// The `Vec<Token>` implementation in this module treats `INDENT`,
    /// `DEDENT` and `NewLine` tokens as insignificant.
    fn get_significant(&self, index: usize) -> Option<(&Token, usize)>;
}

impl Tokenizer for Vec<Token> {
    /// Returns the first token at or after `index` that is not an `INDENT`,
    /// `DEDENT` or `NewLine`, paired with the position where it was found.
    ///
    /// Returns `None` when `index` is out of bounds or when only such layout
    /// tokens remain.
    fn get_significant<'a>(&'a self, index: usize) -> Option<(&'a Token, usize)> {
        self.iter()
            .enumerate()
            .skip(index)
            // Stop at the first token that is none of the layout kinds
            .find(|(_, candidate)| {
                candidate.token_type != TokenType::INDENT
                    && candidate.token_type != TokenType::DEDENT
                    && candidate.token_type != TokenType::NewLine
            })
            // Callers expect `(token, position)`, the reverse of `enumerate`'s order
            .map(|(position, candidate)| (candidate, position))
    }
}

/// Checks whether the token located exactly at `pos` has type `token_type`.
///
/// **No whitespace or newline tokens are skipped**: only `tokens[pos]` is inspected.
///
/// Returns:
/// - `Result3::Ok(token)` if the token at `pos` has the requested type
/// - `Result3::None` if `pos` is out of bounds, or the token is an `EOF` or `NewLine`
/// - `Result3::Err(token)` for any other token
pub fn parse_immediate_token_type(
    tokens: &Vec<Token>,
    pos: usize,
    token_type: TokenType,
) -> Result3<&Token> {
    let candidate = match tokens.get(pos) {
        Some(candidate) => candidate,
        None => return Result3::None,
    };

    // The requested type is tested first, so asking for `EOF` or `NewLine` still succeeds
    if candidate.token_type == token_type {
        Result3::Ok(candidate)
    } else if candidate.token_type == TokenType::EOF
        || candidate.token_type == TokenType::NewLine
    {
        Result3::None
    } else {
        Result3::Err(candidate)
    }
}

/// Checks whether the token located exactly at `pos` is an operator whose value equals `operator`.
///
/// **No whitespace or newline tokens are skipped**: only `tokens[pos]` is inspected.
///
/// Returns:
/// - `Result3::Ok(token)` if the token is an `Operator` with the given value
/// - `Result3::None` if `pos` is out of bounds, or the token is a `NewLine` or `EOF`
/// - `Result3::Err(token)` for any other token (including a different operator)
pub fn try_operator(tokens: &Vec<Token>, pos: usize, operator: String) -> Result3<&Token> {
    let candidate = match tokens.get(pos) {
        Some(candidate) => candidate,
        None => return Result3::None,
    };

    let is_expected_operator =
        candidate.token_type == TokenType::Operator && candidate.value == operator;
    let ends_the_line =
        candidate.token_type == TokenType::NewLine || candidate.token_type == TokenType::EOF;

    if is_expected_operator {
        Result3::Ok(candidate)
    } else if ends_the_line {
        Result3::None
    } else {
        Result3::Err(candidate)
    }
}

/// Expects the first significant token at or after `pos` to be of type `token_type`.
///
/// Leading `INDENT`, `DEDENT` and `NewLine` tokens are skipped before the check.
///
/// Returns:
/// - `ParseResult::Ok(token, next)` if the token has the requested type, where `next`
///   is the position immediately after the matched token
/// - `ParseResult::Unmatched` if the tokens run out, or the token found is an `EOF`
/// - `ParseResult::Mismatch(token)` if any other token is found
pub fn parse_token_type(
    tokens: &Vec<Token>,
    pos: usize,
    token_type: TokenType,
) -> ParseResult<&Token> {
    // Ignore all whitespace and newlines: find the first token that is none of them
    let found = tokens.iter().enumerate().skip(pos).find(|(_, t)| {
        t.token_type != TokenType::INDENT
            && t.token_type != TokenType::DEDENT
            && t.token_type != TokenType::NewLine
    });

    match found {
        Some((index, t)) if t.token_type == token_type => ParseResult::Ok(t, index + 1),
        // Only `EOF` needs checking here: a `NewLine` can never be the token found,
        // since the search above skips every one of them
        Some((_, t)) if t.token_type == TokenType::EOF => ParseResult::Unmatched,
        Some((_, t)) => ParseResult::Mismatch(t),
        None => ParseResult::Unmatched,
    }
}
Parse minimal function declaration 2023-09-09 01:17:46 +00:00			`use crate::{`
			`lexic::token::{Token, TokenType},`
			`utils::Result3,`
			`};`

Refactor 2023-10-01 23:41:00 +00:00			`use super::ParseResult;`
[syntax] Alternative function to expect tokens 2023-09-20 01:06:38 +00:00
Use expressions as a function call callable 2024-01-02 17:45:45 +00:00			`pub trait Tokenizer {`
			`fn get_significant<'a>(&'a self, index: usize) -> Option<(&'a Token, usize)>;`
			`}`

			`impl Tokenizer for Vec<Token> {`
			`/// Returns the first non whitespace token at index & the position the found token`
			`fn get_significant<'a>(&'a self, index: usize) -> Option<(&'a Token, usize)> {`
			`let mut current_pos = index;`

			`// Ignore all whitespace and newlines`
			`loop {`
			`match self.get(current_pos) {`
			`Some(token) => {`
			`if token.token_type == TokenType::INDENT`
			`\|\| token.token_type == TokenType::DEDENT`
			`\|\| token.token_type == TokenType::NewLine`
			`{`
			`current_pos += 1;`
			`} else {`
			`return Some((token, current_pos));`
			`}`
			`}`
			`None => return None,`
			`}`
			`}`
			`}`
			`}`

Refactor parsing return values 2024-03-15 21:07:28 +00:00			/// Expects the token at `pos` to be of type `token_type`.
			`///`
			`/// Doesn't ignore whitespace or newlines`
			`pub fn parse_immediate_token_type(`
			`tokens: &Vec<Token>,`
			`pos: usize,`
			`token_type: TokenType,`
			`) -> Result3<&Token> {`
Parse minimal function declaration 2023-09-09 01:17:46 +00:00			`match tokens.get(pos) {`
			`Some(t) if t.token_type == token_type => Result3::Ok(t),`
[syntax] Ignore whitespace when parsing a function declaration 2023-09-20 01:30:49 +00:00			`Some(t) if t.token_type == TokenType::EOF \|\| t.token_type == TokenType::NewLine => {`
			`Result3::None`
			`}`
[syntax] Alternative function to expect tokens 2023-09-20 01:06:38 +00:00			`Some(t) => Result3::Err(t),`
			`None => Result3::None,`
			`}`
			`}`

Simplify ParseResult struct 2024-03-15 20:49:02 +00:00			/// Expects the token at `pos` to be an operator of value `operator`. Doesn't ignore whitespace or newlines
[Syntax] Refactor binding parsing 2023-10-06 01:26:47 +00:00			`pub fn try_operator(tokens: &Vec<Token>, pos: usize, operator: String) -> Result3<&Token> {`
			`match tokens.get(pos) {`
			`Some(t) if t.token_type == TokenType::Operator && t.value == operator => Result3::Ok(t),`
			`Some(t) if t.token_type == TokenType::NewLine \|\| t.token_type == TokenType::EOF => {`
			`Result3::None`
			`}`
			`Some(t) => Result3::Err(t),`
			`None => Result3::None,`
			`}`
			`}`

Refactor parsing return values 2024-03-15 21:07:28 +00:00			/// Expects the token at `pos` to be of type `token_type`, and returns the token and the next position.
			`///`
			`/// Ignores all whitespace and newlines`
Parse minimal block of code 2023-09-21 00:53:46 +00:00			`pub fn parse_token_type(`
			`tokens: &Vec<Token>,`
			`pos: usize,`
			`token_type: TokenType,`
Simplify ParseResult struct 2024-03-15 20:49:02 +00:00			`) -> ParseResult<&Token> {`
Parse minimal block of code 2023-09-21 00:53:46 +00:00			`let mut current_pos = pos;`

			`// Ignore all whitespace and newlines`
			`while let Some(t) = tokens.get(current_pos) {`
			`if t.token_type == TokenType::INDENT`
			`\|\| t.token_type == TokenType::DEDENT`
			`\|\| t.token_type == TokenType::NewLine`
			`{`
			`current_pos += 1;`
			`} else {`
			`break;`
			`}`
			`}`

			`match tokens.get(current_pos) {`
			`Some(t) if t.token_type == token_type => ParseResult::Ok(t, current_pos + 1),`
			`Some(t) if t.token_type == TokenType::EOF \|\| t.token_type == TokenType::NewLine => {`
			`ParseResult::Unmatched`
			`}`
Refactor parsing return values 2024-03-15 21:07:28 +00:00			`Some(t) => ParseResult::Mismatch(t),`
Parse minimal block of code 2023-09-21 00:53:46 +00:00			`None => ParseResult::Unmatched,`
			`}`
			`}`