thp/src/syntax/binding.rs

254 lines
8.6 KiB
Rust
Raw Normal View History

2023-09-08 01:50:51 +00:00
use super::ast::{Binding, ValBinding, VarBinding};
use super::utils::{try_operator, try_token_type};
use super::{expression, SyntaxResult};
use crate::error_handling::SyntaxError;
2023-09-08 01:46:11 +00:00
use crate::lexic::token::{Token, TokenType};
use crate::utils::Result3;
2023-01-08 23:09:06 +00:00
// TODO: Should return a 3 state value:
2023-01-08 23:09:06 +00:00
// - Success: binding parsed successfully
// - NotFound: the first token (var | val) was not found, so the parser should try other options
// - Error: token (var | val) was found, but then other expected tokens were not found
pub fn try_parse<'a>(tokens: &'a Vec<Token>, pos: usize) -> Option<SyntaxResult> {
2023-09-17 22:58:56 +00:00
let mut current_pos = pos;
// Optional datatype annotation
let datatype_annotation = {
2023-09-17 22:58:56 +00:00
match try_token_type(tokens, current_pos, TokenType::Datatype) {
Result3::Ok(t) => {
2023-09-17 22:58:56 +00:00
current_pos += 1;
Some(String::from(&t.value))
}
Result3::Err(_) => None,
Result3::None => panic!(
"Internal compiler error: Illegal token stream at src/syntax/binding.rs#try_parse"
),
}
};
/*
* val/var keyword
*/
let (is_val, binding_token) = {
2023-09-17 22:58:56 +00:00
let res1 = try_token_type(tokens, current_pos, TokenType::VAL);
2023-02-09 23:44:31 +00:00
match res1 {
Result3::Ok(val_token) => (true, val_token),
_ => {
2023-09-17 22:58:56 +00:00
let res2 = try_token_type(tokens, current_pos, TokenType::VAR);
2023-02-09 23:44:31 +00:00
match res2 {
Result3::Ok(var_token) => (false, var_token),
// Neither VAL nor VAR were matched, the parser should try
// other constructs
_ => return None,
2023-02-09 23:44:31 +00:00
}
}
}
};
2023-01-08 23:09:06 +00:00
/*
* identifier
*/
2023-09-17 22:58:56 +00:00
let identifier = match try_token_type(tokens, current_pos + 1, TokenType::Identifier) {
Result3::Ok(t) => t,
Result3::Err(t) => {
// The parser found a token, but it's not an identifier
return Some(SyntaxResult::Err(SyntaxError {
reason: format!(
"There should be an identifier after a `{}` token",
if is_val { "val" } else { "var" }
),
error_start: t.position,
error_end: t.get_end_position(),
}));
}
Result3::None => {
// The parser didn't find an Identifier after VAL/VAR
return Some(SyntaxResult::Err(SyntaxError {
reason: format!(
"There should be an identifier after a `{}` token",
if is_val { "val" } else { "var" }
),
error_start: binding_token.position,
error_end: binding_token.get_end_position(),
}));
}
};
2023-01-08 23:09:06 +00:00
/*
* Equal (=) operator
*/
2023-09-17 22:58:56 +00:00
let equal_operator: &Token = match try_operator(tokens, current_pos + 2, String::from("=")) {
Result3::Ok(t) => t,
Result3::Err(t) => {
// The parser found a token, but it's not the `=` operator
return Some(SyntaxResult::Err(SyntaxError {
reason: format!("There should be an equal sign `=` after the identifier"),
error_start: t.position,
error_end: t.get_end_position(),
}));
}
Result3::None => {
// The parser didn't find the `=` operator after the identifier
return Some(SyntaxResult::Err(SyntaxError {
reason: format!("There should be an equal sign `=` after the identifier",),
error_start: identifier.position,
error_end: identifier.get_end_position(),
}));
}
};
2023-01-08 23:09:06 +00:00
2023-09-17 22:58:56 +00:00
let expression = expression::try_parse(tokens, current_pos + 3);
if expression.is_none() {
2023-03-28 15:06:23 +00:00
return Some(SyntaxResult::Err(SyntaxError {
reason: String::from("Expected an expression after the equal `=` operator"),
error_start: equal_operator.position,
error_end: equal_operator.get_end_position(),
}));
}
2023-01-08 23:09:06 +00:00
let expression = expression.unwrap();
let binding = if is_val {
Binding::Val(ValBinding {
datatype: datatype_annotation,
2023-09-08 01:32:59 +00:00
identifier: Box::new(identifier.value.clone()),
2023-02-09 23:44:31 +00:00
expression,
})
} else {
Binding::Var(VarBinding {
datatype: datatype_annotation,
2023-09-08 01:32:59 +00:00
identifier: Box::new(identifier.value.clone()),
2023-02-09 23:44:31 +00:00
expression,
})
};
2023-09-17 22:58:56 +00:00
Some(SyntaxResult::Ok(
super::ast::TopLevelDeclaration::Binding(binding),
current_pos + 4,
))
2023-01-08 23:09:06 +00:00
}
#[cfg(test)]
mod tests {
    use super::*;
    use crate::{lexic::get_tokens, syntax::ast::TopLevelDeclaration};

    /// Lexes `source`, panicking if the lexer rejects it.
    fn lex(source: &str) -> Vec<Token> {
        get_tokens(&String::from(source)).unwrap()
    }

    /// Parses a binding from the start of `tokens` and returns the syntax
    /// error it reports, panicking if parsing yields anything else.
    fn parse_error(tokens: &Vec<Token>) -> SyntaxError {
        match try_parse(tokens, 0).unwrap() {
            SyntaxResult::Err(error) => error,
            _ => panic!("Error expected"),
        }
    }

    #[test]
    fn should_parse_val_binding() {
        let tokens = lex("val identifier = 20");

        match try_parse(&tokens, 0).unwrap() {
            SyntaxResult::Ok(TopLevelDeclaration::Binding(Binding::Val(val)), _) => {
                assert_eq!("identifier", val.identifier.to_string());
            }
            _ => panic!(),
        }
    }

    #[test]
    fn should_parse_val() {
        let tokens = lex("val");
        let val_token = *try_token_type(&tokens, 0, TokenType::VAL).unwrap();

        assert_eq!(TokenType::VAL, val_token.token_type);
        assert_eq!("val", val_token.value);
    }

    #[test]
    fn should_parse_identifier() {
        let tokens = lex("identifier");
        let identifier_token = *try_token_type(&tokens, 0, TokenType::Identifier).unwrap();

        assert_eq!("identifier", identifier_token.value);
    }

    #[test]
    fn should_parse_operator() {
        let tokens = lex("=");
        let operator_token = *try_operator(&tokens, 0, String::from("=")).unwrap();

        assert_eq!("=", operator_token.value);
    }

    #[test]
    fn should_parse_binding_with_datatype() {
        // Annotated immutable binding
        let tokens = lex("Num val identifier = 20");
        match try_parse(&tokens, 0).unwrap() {
            SyntaxResult::Ok(TopLevelDeclaration::Binding(Binding::Val(val)), _) => {
                assert_eq!(Some(String::from("Num")), val.datatype);
                assert_eq!("identifier", val.identifier.to_string());
            }
            _ => panic!(),
        }

        // Annotated mutable binding
        let tokens = lex("Bool var identifier = true");
        let parsed = try_parse(&tokens, 0).unwrap();
        match parsed {
            SyntaxResult::Ok(TopLevelDeclaration::Binding(Binding::Var(var)), _) => {
                assert_eq!(Some(String::from("Bool")), var.datatype);
                assert_eq!("identifier", var.identifier.to_string());
            }
            _ => panic!("D: {:?}", parsed),
        }
    }

    #[test]
    fn should_return_correct_error() {
        let tokens = lex("val");
        assert_eq!(TokenType::VAL, tokens[0].token_type);
        assert_eq!(0, tokens[0].position);

        // Nothing follows the keyword, so the error spans the keyword itself.
        let error = parse_error(&tokens);
        assert_eq!(0, error.error_start);
        assert_eq!(3, error.error_end);
    }

    #[test]
    fn should_return_error_when_identifier_is_wrong() {
        // A number where the identifier should be
        let tokens = lex("val 322");
        assert_eq!(TokenType::VAL, tokens[0].token_type);
        assert_eq!(0, tokens[0].position);

        let error = parse_error(&tokens);
        assert_eq!(4, error.error_start);
        assert_eq!(7, error.error_end);

        // A string where the identifier should be
        let tokens = lex("val \"hello\"");

        let error = parse_error(&tokens);
        assert_eq!(4, error.error_start);
        assert_eq!(11, error.error_end);
    }

    #[test]
    fn should_return_error_when_equal_op_is_wrong() {
        // A string where the `=` operator should be
        let tokens = lex("val id \"error\"");

        let error = parse_error(&tokens);
        assert_eq!(7, error.error_start);
        assert_eq!(14, error.error_end);
    }
}