dust/dust-lang/src/analyzer.rs

523 lines
16 KiB
Rust
Raw Normal View History

//! Tools for analyzing an abstract syntax tree and catching errors before running the virtual
2024-08-09 02:44:34 +00:00
//! machine.
//!
2024-08-12 12:54:21 +00:00
//! This module provides two anlysis options:
//! - `analyze` convenience function, which takes a string input
//! - `Analyzer` struct, which borrows an abstract syntax tree and a context
2024-08-09 00:58:56 +00:00
use std::{
error::Error,
fmt::{self, Display, Formatter},
};
2024-08-07 15:57:15 +00:00
2024-08-09 08:23:02 +00:00
use crate::{
2024-08-13 23:41:36 +00:00
abstract_tree::{BinaryOperator, UnaryOperator},
2024-08-13 18:21:31 +00:00
parse, AbstractSyntaxTree, Context, DustError, Identifier, Node, Span, Statement,
StructDefinition, StructType, Type,
2024-08-09 08:23:02 +00:00
};
2024-08-07 15:57:15 +00:00
/// Analyzes the abstract syntax tree for errors.
///
/// # Examples
/// ```
/// # use std::collections::HashMap;
/// # use dust_lang::*;
/// let input = "x = 1 + false";
2024-08-11 23:00:37 +00:00
/// let result = analyze(input);
2024-08-07 15:57:15 +00:00
///
/// assert!(result.is_err());
/// ```
2024-08-11 23:00:37 +00:00
pub fn analyze(source: &str) -> Result<(), DustError> {
2024-08-11 21:59:52 +00:00
let abstract_tree = parse(source)?;
2024-08-12 12:54:21 +00:00
let context = Context::new();
let mut analyzer = Analyzer::new(&abstract_tree, &context);
2024-08-11 21:59:52 +00:00
analyzer
.analyze()
.map_err(|analyzer_error| DustError::AnalyzerError {
analyzer_error,
source,
})
2024-08-05 04:40:51 +00:00
}
2024-08-07 16:13:49 +00:00
/// Static analyzer that checks for potential runtime errors.
///
/// # Examples
/// ```
/// # use std::collections::HashMap;
/// # use dust_lang::*;
/// let input = "x = 1 + false";
/// let abstract_tree = parse(input).unwrap();
2024-08-10 08:32:27 +00:00
/// let mut context = Context::new();
/// let mut analyzer = Analyzer::new(&abstract_tree, &mut context);
2024-08-07 16:13:49 +00:00
/// let result = analyzer.analyze();
///
/// assert!(result.is_err());
pub struct Analyzer<'a> {
abstract_tree: &'a AbstractSyntaxTree,
2024-08-12 12:54:21 +00:00
context: &'a Context,
2024-08-05 03:11:04 +00:00
}
impl<'a> Analyzer<'a> {
2024-08-12 12:54:21 +00:00
pub fn new(abstract_tree: &'a AbstractSyntaxTree, context: &'a Context) -> Self {
2024-08-07 15:57:15 +00:00
Self {
abstract_tree,
context,
2024-08-07 15:57:15 +00:00
}
2024-08-05 03:11:04 +00:00
}
pub fn analyze(&mut self) -> Result<(), AnalyzerError> {
2024-08-14 18:28:39 +00:00
for node in &self.abstract_tree.statements {
self.analyze_statement(node)?;
2024-08-05 03:11:04 +00:00
}
Ok(())
}
2024-08-14 18:28:39 +00:00
fn analyze_statement(&mut self, _: &Node<Statement>) -> Result<(), AnalyzerError> {
2024-08-05 03:11:04 +00:00
Ok(())
}
}
#[derive(Clone, Debug, PartialEq)]
pub enum AnalyzerError {
ExpectedBoolean {
actual: Node<Statement>,
},
ExpectedIdentifier {
actual: Node<Statement>,
},
ExpectedIdentifierOrString {
actual: Node<Statement>,
},
2024-08-12 14:43:18 +00:00
ExpectedIntegerOrRange {
actual: Node<Statement>,
},
2024-08-12 20:57:10 +00:00
ExpectedList {
actual: Node<Statement>,
},
ExpectedMap {
actual: Node<Statement>,
},
2024-08-09 08:23:02 +00:00
ExpectedValue {
actual: Node<Statement>,
},
2024-08-11 22:11:59 +00:00
ExpectedValueArgumentCount {
expected: usize,
actual: usize,
position: Span,
},
2024-08-12 23:39:26 +00:00
IndexOutOfBounds {
list: Node<Statement>,
index: Node<Statement>,
index_value: usize,
length: usize,
},
2024-08-11 23:00:37 +00:00
TypeConflict {
actual_statement: Node<Statement>,
actual_type: Type,
expected: Type,
},
UndefinedField {
identifier: Node<Statement>,
statement: Node<Statement>,
},
2024-08-13 20:21:44 +00:00
UndefinedType {
identifier: Node<Identifier>,
},
UnexpectedIdentifier {
identifier: Node<Statement>,
},
2024-08-09 08:23:02 +00:00
UnexectedString {
actual: Node<Statement>,
},
2024-08-13 20:21:44 +00:00
UndefinedVariable {
identifier: Node<Statement>,
},
2024-08-05 03:11:04 +00:00
}
2024-08-09 05:43:58 +00:00
impl AnalyzerError {
pub fn position(&self) -> Span {
match self {
2024-08-12 02:02:17 +00:00
AnalyzerError::ExpectedBoolean { actual, .. } => actual.position,
AnalyzerError::ExpectedIdentifier { actual, .. } => actual.position,
AnalyzerError::ExpectedIdentifierOrString { actual } => actual.position,
2024-08-12 14:43:18 +00:00
AnalyzerError::ExpectedIntegerOrRange { actual, .. } => actual.position,
2024-08-12 20:57:10 +00:00
AnalyzerError::ExpectedList { actual } => actual.position,
AnalyzerError::ExpectedMap { actual } => actual.position,
2024-08-11 23:00:37 +00:00
AnalyzerError::ExpectedValue { actual } => actual.position,
2024-08-11 22:11:59 +00:00
AnalyzerError::ExpectedValueArgumentCount { position, .. } => *position,
2024-08-12 23:39:26 +00:00
AnalyzerError::IndexOutOfBounds { list, index, .. } => {
(list.position.0, index.position.1)
}
2024-08-11 23:00:37 +00:00
AnalyzerError::TypeConflict {
actual_statement, ..
} => actual_statement.position,
AnalyzerError::UndefinedField { identifier, .. } => identifier.position,
2024-08-13 20:21:44 +00:00
AnalyzerError::UndefinedType { identifier } => identifier.position,
2024-08-09 22:14:46 +00:00
AnalyzerError::UndefinedVariable { identifier } => identifier.position,
2024-08-11 23:00:37 +00:00
AnalyzerError::UnexpectedIdentifier { identifier } => identifier.position,
AnalyzerError::UnexectedString { actual } => actual.position,
2024-08-09 05:43:58 +00:00
}
}
}
2024-08-09 00:58:56 +00:00
impl Error for AnalyzerError {}
impl Display for AnalyzerError {
fn fmt(&self, f: &mut Formatter) -> fmt::Result {
match self {
2024-08-09 01:47:49 +00:00
AnalyzerError::ExpectedBoolean { actual, .. } => {
2024-08-09 00:58:56 +00:00
write!(f, "Expected boolean, found {}", actual)
}
2024-08-09 01:47:49 +00:00
AnalyzerError::ExpectedIdentifier { actual, .. } => {
2024-08-09 00:58:56 +00:00
write!(f, "Expected identifier, found {}", actual)
}
AnalyzerError::ExpectedIdentifierOrString { actual } => {
write!(f, "Expected identifier or string, found {}", actual)
}
2024-08-12 14:43:18 +00:00
AnalyzerError::ExpectedIntegerOrRange { actual, .. } => {
write!(f, "Expected integer or range, found {}", actual)
}
2024-08-12 20:57:10 +00:00
AnalyzerError::ExpectedList { actual } => write!(f, "Expected list, found {}", actual),
AnalyzerError::ExpectedMap { actual } => write!(f, "Expected map, found {}", actual),
2024-08-09 08:23:02 +00:00
AnalyzerError::ExpectedValue { actual, .. } => {
write!(f, "Expected value, found {}", actual)
}
2024-08-11 22:11:59 +00:00
AnalyzerError::ExpectedValueArgumentCount {
expected, actual, ..
} => write!(f, "Expected {} value arguments, found {}", expected, actual),
2024-08-12 23:39:26 +00:00
AnalyzerError::IndexOutOfBounds {
list,
index_value,
length,
..
2024-08-12 23:39:26 +00:00
} => write!(
f,
"Index {} out of bounds for list {} with length {}",
index_value, list, length
),
2024-08-11 23:00:37 +00:00
AnalyzerError::TypeConflict {
actual_statement,
actual_type,
expected,
} => {
write!(
f,
"Expected type {}, found {}, which has type {}",
expected, actual_statement, actual_type
)
}
AnalyzerError::UndefinedField {
identifier,
statement: map,
} => {
write!(f, "Undefined field {} in map {}", identifier, map)
}
2024-08-13 20:21:44 +00:00
AnalyzerError::UndefinedType { identifier } => {
write!(f, "Undefined type {}", identifier)
}
2024-08-09 22:14:46 +00:00
AnalyzerError::UndefinedVariable { identifier } => {
write!(f, "Undefined variable {}", identifier)
}
2024-08-09 01:47:49 +00:00
AnalyzerError::UnexpectedIdentifier { identifier, .. } => {
2024-08-09 00:58:56 +00:00
write!(f, "Unexpected identifier {}", identifier)
}
2024-08-09 08:23:02 +00:00
AnalyzerError::UnexectedString { actual, .. } => {
write!(f, "Unexpected string {}", actual)
}
2024-08-09 00:58:56 +00:00
}
}
}
2024-08-05 03:11:04 +00:00
#[cfg(test)]
mod tests {
2024-08-14 18:28:39 +00:00
use crate::{AssignmentOperator, Identifier, Value};
2024-08-05 03:11:04 +00:00
use super::*;
2024-08-14 18:28:39 +00:00
#[test]
fn add_assign_wrong_type() {
let source = "
a = 1
a += 1.0
";
assert_eq!(
analyze(source),
Err(DustError::AnalyzerError {
analyzer_error: AnalyzerError::TypeConflict {
actual_statement: Node::new(
Statement::Assignment {
identifier: Node::new(Identifier::new("a"), (31, 32)),
operator: Node::new(AssignmentOperator::AddAssign, (33, 35)),
value: Box::new(Node::new(
Statement::Constant(Value::float(1.0)),
(38, 41)
))
},
(31, 32)
),
actual_type: Type::Integer,
expected: Type::Float
},
source
})
);
}
#[test]
fn subtract_assign_wrong_type() {
let source = "
a = 1
a -= 1.0
";
assert_eq!(
analyze(source),
Err(DustError::AnalyzerError {
analyzer_error: AnalyzerError::TypeConflict {
actual_statement: Node::new(
Statement::Assignment {
identifier: Node::new(Identifier::new("a"), (31, 32)),
operator: Node::new(AssignmentOperator::SubtractAssign, (33, 37)),
value: Box::new(Node::new(
Statement::Constant(Value::float(1.0)),
(40, 43)
))
},
(31, 32)
),
actual_type: Type::Integer,
expected: Type::Float
},
source
})
);
}
#[test]
fn tuple_struct_with_wrong_field_types() {
let source = "
struct Foo(int, float)
Foo(1, 2)
";
assert_eq!(
analyze(source),
Err(DustError::AnalyzerError {
analyzer_error: AnalyzerError::TypeConflict {
actual_statement: Node::new(Statement::Constant(Value::integer(2)), (55, 56)),
actual_type: Type::Integer,
expected: Type::Float
},
source
})
);
}
2024-08-12 23:39:26 +00:00
#[test]
fn constant_list_index_out_of_bounds() {
let source = "[1, 2, 3][3]";
assert_eq!(
analyze(source),
Err(DustError::AnalyzerError {
analyzer_error: AnalyzerError::IndexOutOfBounds {
list: Node::new(
Statement::List(vec![
Node::new(Statement::Constant(Value::integer(1)), (1, 2)),
Node::new(Statement::Constant(Value::integer(2)), (4, 5)),
Node::new(Statement::Constant(Value::integer(3)), (7, 8)),
]),
(0, 9)
),
index: Node::new(Statement::Constant(Value::integer(3)), (10, 11)),
index_value: 3,
length: 3
},
source
})
);
}
#[test]
fn nonexistant_field_identifier() {
2024-08-12 23:39:26 +00:00
let source = "{ x = 1 }.y";
assert_eq!(
analyze(source),
Err(DustError::AnalyzerError {
analyzer_error: AnalyzerError::UndefinedField {
2024-08-12 23:39:26 +00:00
identifier: Node::new(Statement::Identifier(Identifier::new("y")), (10, 11)),
statement: Node::new(
Statement::Map(vec![(
Node::new(Identifier::new("x"), (2, 3)),
Node::new(Statement::Constant(Value::integer(1)), (6, 7))
)]),
(0, 9)
)
},
source
})
);
}
#[test]
fn nonexistant_field_string() {
let source = "{ x = 1 }.'y'";
assert_eq!(
analyze(source),
Err(DustError::AnalyzerError {
analyzer_error: AnalyzerError::UndefinedField {
identifier: Node::new(Statement::Constant(Value::string("y")), (10, 13)),
statement: Node::new(
Statement::Map(vec![(
Node::new(Identifier::new("x"), (2, 3)),
Node::new(Statement::Constant(Value::integer(1)), (6, 7))
)]),
(0, 9)
)
2024-08-12 23:39:26 +00:00
},
source
})
);
}
2024-08-12 02:02:17 +00:00
#[test]
fn malformed_list_index() {
2024-08-12 20:57:10 +00:00
let source = "[1, 2, 3]['foo']";
2024-08-12 02:02:17 +00:00
assert_eq!(
analyze(source),
Err(DustError::AnalyzerError {
2024-08-12 14:43:18 +00:00
analyzer_error: AnalyzerError::ExpectedIntegerOrRange {
2024-08-12 20:57:10 +00:00
actual: Node::new(Statement::Constant(Value::string("foo")), (10, 15)),
2024-08-12 02:02:17 +00:00
},
source
})
);
}
#[test]
2024-08-12 23:39:26 +00:00
fn malformed_field_access() {
2024-08-12 02:02:17 +00:00
let source = "{ x = 1 }.0";
assert_eq!(
analyze(source),
Err(DustError::AnalyzerError {
analyzer_error: AnalyzerError::ExpectedIdentifierOrString {
actual: Node::new(Statement::Constant(Value::integer(0)), (10, 11)),
},
source
})
);
}
2024-08-11 23:00:37 +00:00
#[test]
fn length_no_arguments() {
let source = "length()";
2024-08-11 21:59:52 +00:00
assert_eq!(
2024-08-11 23:00:37 +00:00
analyze(source),
Err(DustError::AnalyzerError {
analyzer_error: AnalyzerError::ExpectedValueArgumentCount {
expected: 1,
actual: 0,
position: (0, 6)
},
source
2024-08-11 21:59:52 +00:00
})
2024-08-11 23:00:37 +00:00
);
2024-08-11 21:59:52 +00:00
}
2024-08-08 17:01:25 +00:00
#[test]
2024-08-09 08:56:24 +00:00
fn float_plus_integer() {
2024-08-11 23:00:37 +00:00
let source = "42.0 + 2";
assert_eq!(
2024-08-11 23:00:37 +00:00
analyze(source),
Err(DustError::AnalyzerError {
analyzer_error: AnalyzerError::TypeConflict {
actual_statement: Node::new(Statement::Constant(Value::integer(2)), (7, 8)),
actual_type: Type::Integer,
expected: Type::Float,
},
source
})
)
}
#[test]
2024-08-09 08:56:24 +00:00
fn integer_plus_boolean() {
2024-08-11 23:18:13 +00:00
let source = "42 + true";
2024-08-08 17:01:25 +00:00
assert_eq!(
2024-08-11 23:18:13 +00:00
analyze(source),
Err(DustError::AnalyzerError {
analyzer_error: AnalyzerError::TypeConflict {
actual_statement: Node::new(Statement::Constant(Value::boolean(true)), (5, 9)),
actual_type: Type::Boolean,
expected: Type::Integer,
},
source
2024-08-08 17:01:25 +00:00
})
)
}
2024-08-08 17:01:25 +00:00
#[test]
fn is_even_expects_number() {
2024-08-11 23:18:13 +00:00
let source = "is_even('hello')";
2024-08-08 17:01:25 +00:00
assert_eq!(
2024-08-11 23:18:13 +00:00
analyze(source),
Err(DustError::AnalyzerError {
analyzer_error: AnalyzerError::TypeConflict {
actual_statement: Node::new(
Statement::Constant(Value::string("hello")),
(8, 15)
),
actual_type: Type::String,
expected: Type::Number,
},
source
2024-08-08 17:01:25 +00:00
})
2024-08-11 23:18:13 +00:00
);
2024-08-08 17:01:25 +00:00
}
2024-08-11 23:18:13 +00:00
2024-08-05 03:11:04 +00:00
#[test]
fn is_odd_expects_number() {
2024-08-11 23:18:13 +00:00
let source = "is_odd('hello')";
2024-08-05 03:11:04 +00:00
assert_eq!(
2024-08-11 23:18:13 +00:00
analyze(source),
Err(DustError::AnalyzerError {
analyzer_error: AnalyzerError::TypeConflict {
actual_statement: Node::new(
Statement::Constant(Value::string("hello")),
(7, 14)
),
actual_type: Type::String,
expected: Type::Number,
},
source
2024-08-05 03:11:04 +00:00
})
2024-08-11 23:18:13 +00:00
);
2024-08-05 03:11:04 +00:00
}
2024-08-05 04:40:51 +00:00
2024-08-07 15:57:15 +00:00
#[test]
2024-08-09 22:14:46 +00:00
fn undefined_variable() {
2024-08-11 23:18:13 +00:00
let source = "foo";
2024-08-05 04:40:51 +00:00
assert_eq!(
2024-08-11 23:18:13 +00:00
analyze(source),
Err(DustError::AnalyzerError {
analyzer_error: AnalyzerError::UndefinedVariable {
identifier: Node::new(Statement::Identifier(Identifier::new("foo")), (0, 3)),
},
source
2024-08-05 04:40:51 +00:00
})
2024-08-11 23:18:13 +00:00
);
2024-08-05 04:40:51 +00:00
}
2024-08-05 03:11:04 +00:00
}