thp/src/syntax/binding.rs

289 lines
9.5 KiB
Rust
Raw Normal View History

2023-12-17 01:51:12 +00:00
use super::ast::var_binding::Binding;
use super::utils::{parse_token_type, try_operator};
2024-03-15 22:42:35 +00:00
use super::{expression, ParsingError, ParsingResult};
use crate::error_handling::SyntaxError;
2023-09-08 01:46:11 +00:00
use crate::lexic::token::{Token, TokenType};
2023-01-08 23:09:06 +00:00
/*
binding = val binding | var binding
val binding = "val", datatype?, binding remainder
| datatype, binding remainder
var binding = "var", datatype?, binding remainder
binding remainder = identifier, "=", expression
*/
2024-03-15 22:42:35 +00:00
pub fn try_parse<'a>(tokens: &'a Vec<Token>, pos: usize) -> ParsingResult<Binding> {
2023-09-17 22:58:56 +00:00
let mut current_pos = pos;
/*
* val/var keyword
*/
let (is_var, binding_token, next_pos) = 'token: {
// check for VAL
if let Ok((val_token, next_pos)) = parse_token_type(tokens, current_pos, TokenType::VAL) {
break 'token (false, Some(val_token), next_pos);
};
// check for VAR
match parse_token_type(tokens, current_pos, TokenType::VAR) {
Ok((var_token, next_pos)) => (true, Some(var_token), next_pos),
// If a VAR is not found it is still possible that the binding is an implicit VAL
_ => (false, None, current_pos),
2023-02-09 23:44:31 +00:00
}
};
2023-10-06 01:26:47 +00:00
current_pos = next_pos;
2023-01-08 23:09:06 +00:00
/*
* datatype
*/
let (datatype, next_pos) = match parse_token_type(tokens, current_pos, TokenType::Datatype) {
Ok((t, next)) => (Some(t), next),
_ => (None, current_pos),
};
current_pos = next_pos;
// Here:
// If the binding is None and the datatype is None, then we didn't match a binding
if binding_token.is_none() && datatype.is_none() {
return Err(ParsingError::Unmatched);
}
/*
* identifier
*/
let (identifier, next_pos) = match parse_token_type(tokens, current_pos, TokenType::Identifier)
{
2024-03-15 21:56:45 +00:00
Ok((t, n)) => (t, n),
Err(ParsingError::Mismatch(token)) => {
// The parser found a token, but it's not an identifier
2024-03-15 22:42:35 +00:00
return Err(ParsingError::Err(SyntaxError {
2023-11-04 10:41:16 +00:00
error_start: token.position,
error_end: token.get_end_position(),
reason: "??".into(),
2024-03-15 22:42:35 +00:00
}));
2023-11-04 10:41:16 +00:00
}
2024-03-15 21:56:45 +00:00
Err(ParsingError::Err(error)) => {
2024-03-15 22:42:35 +00:00
return Err(ParsingError::Err(error));
}
2023-10-06 01:26:47 +00:00
_ => {
// The parser didn't find an Identifier after VAL/VAR or the Datatype
match (binding_token, datatype) {
(Some(binding_token), _) => {
return Err(ParsingError::Err(SyntaxError {
reason: format!(
"There should be an identifier after a `{}` token",
if is_var { "val" } else { "var" }
),
error_start: binding_token.position,
error_end: binding_token.get_end_position(),
}));
}
(None, Some(datatype_token)) => {
return Err(ParsingError::Err(SyntaxError {
reason: "There should be an identifier after the datatype".into(),
error_start: datatype_token.position,
error_end: datatype_token.get_end_position(),
}));
}
_ => {
panic!("Illegal parser state: binding_token and datatype are both None")
}
};
}
};
2023-10-06 01:26:47 +00:00
current_pos = next_pos;
2023-01-08 23:09:06 +00:00
/*
* Equal (=) operator
*/
let equal_operator = match try_operator(tokens, current_pos, String::from("=")) {
2024-03-15 21:59:28 +00:00
Ok((t, _)) => t,
Err(ParsingError::Mismatch(t)) => {
// The parser found a token, but it's not the `=` operator
2024-03-15 22:42:35 +00:00
return Err(ParsingError::Err(SyntaxError {
reason: format!("There should be an equal sign `=` after the identifier"),
error_start: t.position,
error_end: t.get_end_position(),
2024-03-15 22:42:35 +00:00
}));
}
2024-03-15 21:59:28 +00:00
_ => {
// The parser didn't find the `=` operator after the identifier
2024-03-15 22:42:35 +00:00
return Err(ParsingError::Err(SyntaxError {
reason: format!("There should be an equal sign `=` after the identifier",),
error_start: identifier.position,
error_end: identifier.get_end_position(),
2024-03-15 22:42:35 +00:00
}));
}
};
current_pos += 1;
2023-01-08 23:09:06 +00:00
/*
* Expression of the binding
*/
let (expression, next_pos) = match expression::try_parse(tokens, current_pos) {
2024-03-15 22:42:35 +00:00
Ok((exp, next)) => (exp, next),
_ => {
2024-03-15 22:42:35 +00:00
return Err(ParsingError::Err(SyntaxError {
reason: String::from("Expected an expression after the equal `=` operator"),
error_start: equal_operator.position,
error_end: equal_operator.get_end_position(),
2024-03-15 22:42:35 +00:00
}));
}
};
current_pos = next_pos;
2023-01-08 23:09:06 +00:00
2023-12-17 01:51:12 +00:00
let binding = Binding {
datatype,
identifier: &identifier,
2023-12-17 01:51:12 +00:00
expression,
is_mutable: is_var,
};
2024-03-15 22:42:35 +00:00
Ok((binding, current_pos))
2023-01-08 23:09:06 +00:00
}
#[cfg(test)]
mod tests {
use super::*;
2024-03-15 21:56:45 +00:00
use crate::{lexic::get_tokens, syntax::utils::parse_token_type};
2023-01-08 23:09:06 +00:00
#[test]
fn should_parse_val_binding() {
2024-03-18 13:57:28 +00:00
let tokens = get_tokens(&String::from("val identifier = 20")).unwrap();
2024-03-15 22:42:35 +00:00
let Ok((binding, _)) = try_parse(&tokens, 0) else {
2023-09-24 23:51:08 +00:00
panic!()
};
2023-01-08 23:09:06 +00:00
assert_eq!("identifier", format!("{}", binding.identifier.value));
2023-01-08 23:09:06 +00:00
}
#[test]
fn should_parse_val() {
2024-03-18 13:57:28 +00:00
let tokens = get_tokens(&String::from("val")).unwrap();
let (token, _) = parse_token_type(&tokens, 0, TokenType::VAL).unwrap();
2023-01-08 23:09:06 +00:00
2024-03-18 13:57:28 +00:00
assert_eq!(TokenType::VAL, token.token_type);
assert_eq!("val", token.value);
2023-01-08 23:09:06 +00:00
}
#[test]
fn should_parse_identifier() {
let tokens = get_tokens(&String::from("identifier")).unwrap();
2024-03-15 21:56:45 +00:00
let (token, _) = parse_token_type(&tokens, 0, TokenType::Identifier).unwrap();
2023-01-08 23:09:06 +00:00
assert_eq!("identifier", token.value);
}
#[test]
fn should_parse_operator() {
let tokens = get_tokens(&String::from("=")).unwrap();
2024-03-15 21:59:28 +00:00
let (token, _) = try_operator(&tokens, 0, String::from("=")).unwrap();
2023-01-08 23:09:06 +00:00
assert_eq!("=", token.value);
}
#[test]
fn should_parse_val_binding_with_datatype() {
let tokens = get_tokens(&String::from("val Int identifier = 20")).unwrap();
let (binding, _) = try_parse(&tokens, 0).unwrap();
assert!(!binding.is_mutable);
assert_eq!("Int", binding.datatype.unwrap().value);
assert_eq!("identifier", binding.identifier.value);
}
#[test]
fn should_parse_var_binding_with_datatype() {
let tokens = get_tokens(&String::from("var Int identifier = 20")).unwrap();
let (binding, _) = try_parse(&tokens, 0).unwrap();
assert!(binding.is_mutable);
assert!(binding.datatype.is_some());
assert_eq!("Int", binding.datatype.unwrap().value);
assert_eq!("identifier", binding.identifier.value);
}
#[test]
fn should_parse_implicit_val_binding() {
let tokens = get_tokens(&String::from("Int identifier = 20")).unwrap();
let (binding, _) = try_parse(&tokens, 0).unwrap();
assert!(!binding.is_mutable);
assert!(binding.datatype.is_some());
assert_eq!("Int", binding.datatype.unwrap().value);
assert_eq!("identifier", binding.identifier.value);
}
#[test]
fn should_return_error_on_implicit_val_binding() {
let tokens = get_tokens(&String::from("Int => 20")).unwrap();
let binding = try_parse(&tokens, 0);
match binding {
Err(ParsingError::Err(error)) => {
assert_eq!(4, error.error_start);
assert_eq!(6, error.error_end);
}
_ => panic!("Error expected"),
}
}
#[test]
fn should_return_correct_error() {
2024-03-18 13:57:28 +00:00
let tokens = get_tokens(&String::from("val")).unwrap();
assert_eq!(TokenType::VAL, tokens[0].token_type);
assert_eq!(0, tokens[0].position);
2023-09-24 23:51:08 +00:00
let binding = try_parse(&tokens, 0);
match binding {
2024-03-15 22:42:35 +00:00
Err(ParsingError::Err(error)) => {
assert_eq!(0, error.error_start);
assert_eq!(3, error.error_end);
}
_ => panic!("Error expected"),
}
}
#[test]
fn should_return_error_when_identifier_is_wrong() {
2024-03-18 13:57:28 +00:00
let tokens = get_tokens(&String::from("val 322")).unwrap();
assert_eq!(TokenType::VAL, tokens[0].token_type);
assert_eq!(0, tokens[0].position);
2023-09-24 23:51:08 +00:00
let binding = try_parse(&tokens, 0);
match binding {
2024-03-15 22:42:35 +00:00
Err(ParsingError::Err(error)) => {
assert_eq!(4, error.error_start);
assert_eq!(7, error.error_end);
}
2023-04-05 15:31:12 +00:00
_ => panic!("Error expected"),
}
2024-03-18 13:57:28 +00:00
let tokens = get_tokens(&String::from("val \"hello\"")).unwrap();
2023-09-24 23:51:08 +00:00
let binding = try_parse(&tokens, 0);
match binding {
2024-03-15 22:42:35 +00:00
Err(ParsingError::Err(error)) => {
assert_eq!(4, error.error_start);
assert_eq!(11, error.error_end);
}
2023-04-05 15:31:12 +00:00
_ => panic!("Error expected"),
}
}
#[test]
fn should_return_error_when_equal_op_is_wrong() {
2024-03-18 13:57:28 +00:00
let tokens = get_tokens(&String::from("val id \"error\"")).unwrap();
2023-09-24 23:51:08 +00:00
let binding = try_parse(&tokens, 0);
match binding {
2024-03-15 22:42:35 +00:00
Err(ParsingError::Err(error)) => {
assert_eq!(7, error.error_start);
assert_eq!(14, error.error_end);
}
2023-04-05 15:31:12 +00:00
_ => panic!("Error expected"),
}
}
2023-01-08 23:09:06 +00:00
}