1
0
dust/dust-lang/src/chunk.rs

516 lines
15 KiB
Rust
Raw Normal View History

use std::fmt::{self, Debug, Display, Formatter};
2024-09-07 10:38:12 +00:00
use colored::Colorize;
2024-09-07 10:38:12 +00:00
use serde::{Deserialize, Serialize};
2024-09-11 07:10:12 +00:00
use crate::{AnnotatedError, Identifier, Instruction, Span, Value};
2024-09-07 10:38:12 +00:00
#[derive(Clone)]
2024-09-07 10:38:12 +00:00
pub struct Chunk {
instructions: Vec<(Instruction, Span)>,
constants: Vec<Option<Value>>,
locals: Vec<Local>,
2024-09-11 07:10:12 +00:00
scope_depth: usize,
2024-09-07 10:38:12 +00:00
}
impl Chunk {
pub fn new() -> Self {
Self {
instructions: Vec::new(),
2024-09-07 10:38:12 +00:00
constants: Vec::new(),
locals: Vec::new(),
2024-09-11 07:10:12 +00:00
scope_depth: 0,
2024-09-07 10:38:12 +00:00
}
}
2024-09-07 16:15:47 +00:00
pub fn with_data(
instructions: Vec<(Instruction, Span)>,
2024-09-07 16:15:47 +00:00
constants: Vec<Value>,
2024-09-09 23:23:49 +00:00
identifiers: Vec<Local>,
2024-09-07 16:15:47 +00:00
) -> Self {
Self {
instructions,
constants: constants.into_iter().map(Some).collect(),
locals: identifiers,
2024-09-11 07:10:12 +00:00
scope_depth: 0,
2024-09-07 16:15:47 +00:00
}
2024-09-07 10:38:12 +00:00
}
pub fn len(&self) -> usize {
self.instructions.len()
2024-09-07 10:38:12 +00:00
}
pub fn is_empty(&self) -> bool {
self.instructions.is_empty()
2024-09-07 10:38:12 +00:00
}
2024-09-10 22:19:59 +00:00
pub fn scope_depth(&self) -> usize {
2024-09-11 07:10:12 +00:00
self.scope_depth
2024-09-10 22:19:59 +00:00
}
pub fn get_instruction(
&self,
offset: usize,
position: Span,
) -> Result<&(Instruction, Span), ChunkError> {
self.instructions
2024-09-07 16:15:47 +00:00
.get(offset)
2024-09-10 22:19:59 +00:00
.ok_or(ChunkError::CodeIndexOfBounds { offset, position })
2024-09-07 10:38:12 +00:00
}
pub fn push_instruction(&mut self, instruction: Instruction, position: Span) {
self.instructions.push((instruction, position));
2024-09-07 10:38:12 +00:00
}
2024-09-13 05:10:07 +00:00
pub fn pop_instruction(&mut self, position: Span) -> Result<(Instruction, Span), ChunkError> {
self.instructions
.pop()
.ok_or(ChunkError::InstructionUnderflow { position })
}
pub fn get_constant(&self, index: usize, position: Span) -> Result<&Value, ChunkError> {
2024-09-07 10:38:12 +00:00
self.constants
.get(index)
2024-09-10 22:19:59 +00:00
.ok_or(ChunkError::ConstantIndexOutOfBounds { index, position })
.and_then(|value| {
value
.as_ref()
.ok_or(ChunkError::ConstantAlreadyUsed { index, position })
})
2024-09-07 10:38:12 +00:00
}
pub fn use_constant(&mut self, index: usize, position: Span) -> Result<Value, ChunkError> {
self.constants
.get_mut(index)
.ok_or_else(|| ChunkError::ConstantIndexOutOfBounds { index, position })?
.take()
.ok_or(ChunkError::ConstantAlreadyUsed { index, position })
}
pub fn push_constant(&mut self, value: Value, position: Span) -> Result<u16, ChunkError> {
2024-09-07 10:38:12 +00:00
let starting_length = self.constants.len();
if starting_length + 1 > (u8::MAX as usize) {
2024-09-11 07:10:12 +00:00
Err(ChunkError::ConstantOverflow { position })
2024-09-07 10:38:12 +00:00
} else {
self.constants.push(Some(value));
2024-09-07 10:38:12 +00:00
Ok(starting_length as u16)
2024-09-07 10:38:12 +00:00
}
}
2024-09-09 23:23:49 +00:00
pub fn contains_identifier(&self, identifier: &Identifier) -> bool {
self.locals
2024-09-11 07:10:12 +00:00
.iter()
.any(|local| &local.identifier == identifier)
2024-09-09 23:23:49 +00:00
}
pub fn get_local(&self, index: usize, position: Span) -> Result<&Local, ChunkError> {
self.locals
.get(index)
.ok_or(ChunkError::LocalIndexOutOfBounds { index, position })
2024-09-10 22:19:59 +00:00
}
pub fn get_identifier(&self, index: usize) -> Option<&Identifier> {
self.locals.get(index).map(|local| &local.identifier)
2024-09-07 16:15:47 +00:00
}
pub fn get_local_index(
2024-09-10 22:19:59 +00:00
&self,
identifier: &Identifier,
position: Span,
) -> Result<u16, ChunkError> {
self.locals
2024-09-11 07:10:12 +00:00
.iter()
.enumerate()
.rev()
2024-09-11 07:10:12 +00:00
.find_map(|(index, local)| {
if &local.identifier == identifier {
Some(index as u16)
2024-09-11 07:10:12 +00:00
} else {
None
}
})
2024-09-10 22:19:59 +00:00
.ok_or(ChunkError::IdentifierNotFound {
identifier: identifier.clone(),
position,
})
2024-09-09 23:23:49 +00:00
}
pub fn declare_local(
2024-09-11 07:10:12 +00:00
&mut self,
identifier: Identifier,
position: Span,
) -> Result<u16, ChunkError> {
let starting_length = self.locals.len();
2024-09-07 16:15:47 +00:00
if starting_length + 1 > (u8::MAX as usize) {
2024-09-11 07:10:12 +00:00
Err(ChunkError::IdentifierOverflow { position })
2024-09-07 16:15:47 +00:00
} else {
self.locals
.push(Local::new(identifier, self.scope_depth, None));
2024-09-07 16:15:47 +00:00
Ok(starting_length as u16)
2024-09-07 16:15:47 +00:00
}
}
pub fn define_local(
&mut self,
index: usize,
value: Value,
position: Span,
) -> Result<(), ChunkError> {
let local = self
.locals
.get_mut(index)
.ok_or_else(|| ChunkError::LocalIndexOutOfBounds { index, position })?;
let value = value.into_reference();
local.value = Some(value);
Ok(())
}
2024-09-10 14:44:15 +00:00
pub fn begin_scope(&mut self) {
2024-09-11 07:10:12 +00:00
self.scope_depth += 1;
2024-09-10 14:44:15 +00:00
}
pub fn end_scope(&mut self) {
2024-09-11 07:10:12 +00:00
self.scope_depth -= 1;
2024-09-10 14:44:15 +00:00
}
2024-09-07 10:38:12 +00:00
pub fn clear(&mut self) {
self.instructions.clear();
2024-09-07 10:38:12 +00:00
self.constants.clear();
self.locals.clear();
2024-09-07 10:38:12 +00:00
}
2024-09-11 07:10:12 +00:00
pub fn identifiers(&self) -> &[Local] {
&self.locals
2024-09-11 07:10:12 +00:00
}
pub fn pop_identifier(&mut self) -> Option<Local> {
self.locals.pop()
2024-09-11 07:10:12 +00:00
}
pub fn disassembler<'a>(&'a self, name: &'a str) -> ChunkDisassembler<'a> {
ChunkDisassembler::new(name, self)
}
}
impl Default for Chunk {
fn default() -> Self {
Self::new()
}
}
impl Display for Chunk {
fn fmt(&self, f: &mut Formatter) -> fmt::Result {
write!(
f,
"{}",
2024-09-13 05:10:07 +00:00
self.disassembler("Chunk Display").styled().disassemble()
)
}
}
impl Debug for Chunk {
    /// Writes the unstyled disassembly of the chunk under the title "Chunk Debug Display".
    fn fmt(&self, f: &mut Formatter) -> fmt::Result {
        let disassembly = self.disassembler("Chunk Debug Display").disassemble();

        f.write_str(&disassembly)
    }
}
impl Eq for Chunk {}

impl PartialEq for Chunk {
    /// Two chunks are equal when their instructions, constants and locals are equal.
    ///
    /// The current scope depth is not part of the comparison.
    fn eq(&self, other: &Self) -> bool {
        let lhs = (&self.instructions, &self.constants, &self.locals);
        let rhs = (&other.instructions, &other.constants, &other.locals);

        lhs == rhs
    }
}
/// A local variable slot belonging to a chunk.
#[derive(Debug, Clone, Eq, PartialEq, Serialize, Deserialize)]
pub struct Local {
    /// Name the local was declared with.
    pub identifier: Identifier,

    /// Scope depth recorded for the local.
    pub depth: usize,

    /// Value held by the local, or `None` if none has been assigned.
    pub value: Option<Value>,
}
impl Local {
pub fn new(identifier: Identifier, depth: usize, value: Option<Value>) -> Self {
Self {
identifier,
depth,
value,
}
}
}
/// Renders a [`Chunk`] as human-readable text.
pub struct ChunkDisassembler<'a> {
    /// Title printed at the top of the output.
    name: &'a str,

    /// Chunk being rendered.
    chunk: &'a Chunk,

    /// Width that every output line is centered within.
    width: usize,

    /// Whether header lines are rendered in bold.
    styled: bool,
}
2024-09-07 10:38:12 +00:00
impl<'a> ChunkDisassembler<'a> {
2024-09-13 05:10:07 +00:00
const INSTRUCTION_HEADER: [&'static str; 5] = [
"",
"Instructions",
"------------",
"OFFSET OPERATION INFO POSITION",
"------- -------------- -------------------- --------",
];
const CONSTANT_HEADER: [&'static str; 5] = [
"",
"Constants",
"---------",
"INDEX KIND VALUE",
"----- ----- -----",
];
const LOCAL_HEADER: [&'static str; 5] = [
"",
"Locals",
"------",
"INDEX IDENTIFIER DEPTH KIND VALUE",
"----- ---------- ----- ----- -----",
];
/// The default width of the disassembly output. To correctly align the output, this should be
/// set to the width of the longest line that the disassembler is guaranteed to produce.
const DEFAULT_WIDTH: usize = Self::INSTRUCTION_HEADER[3].len() + 1;
pub fn new(name: &'a str, chunk: &'a Chunk) -> Self {
Self {
name,
chunk,
2024-09-13 05:10:07 +00:00
width: Self::DEFAULT_WIDTH,
styled: false,
}
}
pub fn disassemble(&self) -> String {
2024-09-13 05:10:07 +00:00
let chunk_header = self.chunk_header();
let mut disassembled = String::with_capacity(self.predict_capacity());
2024-09-13 05:10:07 +00:00
println!("capactity: {}", disassembled.capacity());
2024-09-10 14:44:15 +00:00
2024-09-13 05:10:07 +00:00
let center = |line: &str| format!("{line:^width$}\n", width = self.width);
let style = |line: String| {
if self.styled {
line.bold().to_string()
} else {
2024-09-13 05:10:07 +00:00
line
}
};
2024-09-10 00:55:00 +00:00
2024-09-13 05:10:07 +00:00
for line in chunk_header.iter() {
disassembled.push_str(&style(center(line)));
}
for line in Self::INSTRUCTION_HEADER {
disassembled.push_str(&style(center(line)));
}
for (offset, (instruction, position)) in self.chunk.instructions.iter().enumerate() {
let position = position.to_string();
let operation = instruction.operation.to_string();
let info_option = instruction.disassembly_info(Some(self.chunk));
let instruction_display = if let Some(info) = info_option {
format!("{offset:<7} {operation:14} {info:20} {position:8}")
} else {
format!("{offset:<7} {operation:14} {:20} {position:8}", " ")
};
2024-09-13 05:10:07 +00:00
disassembled.push_str(&center(&instruction_display));
}
2024-09-10 00:55:00 +00:00
2024-09-13 05:10:07 +00:00
for line in Self::CONSTANT_HEADER {
disassembled.push_str(&style(center(line)));
}
for (index, value_option) in self.chunk.constants.iter().enumerate() {
2024-09-13 05:10:07 +00:00
let value_kind_display = if let Some(value) = value_option {
value.kind().to_string()
} else {
"empty".to_string()
2024-09-10 00:55:00 +00:00
};
let value_display = value_option
.as_ref()
.map(|value| value.to_string())
.unwrap_or_else(|| "EMPTY".to_string());
let constant_display = format!("{index:<5} {value_kind_display:<5} {value_display:<5}");
2024-09-10 00:55:00 +00:00
2024-09-13 05:10:07 +00:00
disassembled.push_str(&center(&constant_display));
2024-09-10 00:55:00 +00:00
}
2024-09-13 05:10:07 +00:00
for line in Self::LOCAL_HEADER {
disassembled.push_str(&style(center(line)));
}
for (
index,
Local {
identifier,
depth,
2024-09-13 05:10:07 +00:00
value: value_option,
},
) in self.chunk.locals.iter().enumerate()
{
2024-09-13 05:10:07 +00:00
let value_kind_display = if let Some(value) = value_option {
value.kind().to_string()
} else {
"empty".to_string()
};
2024-09-13 05:10:07 +00:00
let value_display = value_option
.as_ref()
.map(|value| value.to_string())
.unwrap_or_else(|| "EMPTY".to_string());
let identifier_display = identifier.as_str();
let local_display =
format!("{index:<5} {identifier_display:<10} {depth:<5} {value_kind_display:<4} {value_display:<5}");
2024-09-13 05:10:07 +00:00
disassembled.push_str(&center(&local_display));
2024-09-07 10:38:12 +00:00
}
2024-09-13 05:10:07 +00:00
println!("length: {}", disassembled.len());
disassembled
2024-09-07 10:38:12 +00:00
}
pub fn width(&mut self, width: usize) -> &mut Self {
self.width = width;
2024-09-07 10:38:12 +00:00
self
}
pub fn styled(&mut self) -> &mut Self {
self.styled = true;
self
2024-09-07 10:38:12 +00:00
}
2024-09-13 05:10:07 +00:00
fn chunk_header(&self) -> [String; 3] {
[
self.name.to_string(),
"=".repeat(self.name.len()),
format!(
"{} instructions, {} constants, {} locals",
self.chunk.instructions.len(),
self.chunk.constants.len(),
self.chunk.locals.len()
),
]
}
/// Predicts the capacity of the disassembled output. This is used to pre-allocate the string
/// buffer to avoid reallocations.
///
/// The capacity is calculated as follows:
/// - Get the number of static lines, i.e. lines that are always present in the disassembly
/// - Get the number of dynamic lines, i.e. lines that are generated from the chunk
/// - Add 1 to the width to account for the newline character
/// - Multiply the total number of lines by the width of the disassembly output
fn predict_capacity(&self) -> usize {
let chunk_header_line_count = 3; // self.chunk_header().len() is hard-coded to 3
let static_line_count = chunk_header_line_count
+ Self::INSTRUCTION_HEADER.len()
+ Self::CONSTANT_HEADER.len()
+ Self::LOCAL_HEADER.len();
let dynamic_line_count =
self.chunk.instructions.len() + self.chunk.constants.len() + self.chunk.locals.len();
let total_line_count = static_line_count + dynamic_line_count;
total_line_count * (self.width + 1)
}
}
2024-09-09 23:23:49 +00:00
#[derive(Debug, Clone, PartialEq)]
2024-09-07 10:38:12 +00:00
pub enum ChunkError {
2024-09-10 22:19:59 +00:00
CodeIndexOfBounds {
offset: usize,
position: Span,
},
ConstantAlreadyUsed {
index: usize,
position: Span,
},
2024-09-11 07:10:12 +00:00
ConstantOverflow {
position: Span,
},
2024-09-10 22:19:59 +00:00
ConstantIndexOutOfBounds {
index: usize,
2024-09-10 22:19:59 +00:00
position: Span,
},
2024-09-13 05:10:07 +00:00
InstructionUnderflow {
position: Span,
},
LocalIndexOutOfBounds {
index: usize,
2024-09-11 07:10:12 +00:00
position: Span,
},
IdentifierOverflow {
position: Span,
},
2024-09-10 22:19:59 +00:00
IdentifierNotFound {
identifier: Identifier,
position: Span,
},
}
impl AnnotatedError for ChunkError {
    /// Title shared by every chunk error.
    fn title() -> &'static str {
        "Chunk Error"
    }

    /// Short, fixed description of the error kind.
    fn description(&self) -> &'static str {
        match self {
            ChunkError::CodeIndexOfBounds { .. } => "Code index out of bounds",
            ChunkError::ConstantAlreadyUsed { .. } => "Constant already used",
            ChunkError::ConstantOverflow { .. } => "Constant overflow",
            ChunkError::ConstantIndexOutOfBounds { .. } => "Constant index out of bounds",
            ChunkError::InstructionUnderflow { .. } => "Instruction underflow",
            ChunkError::LocalIndexOutOfBounds { .. } => "Identifier index out of bounds",
            ChunkError::IdentifierOverflow { .. } => "Identifier overflow",
            ChunkError::IdentifierNotFound { .. } => "Identifier not found",
        }
    }

    /// Extra detail (the offending offset, index or identifier) for the variants that carry
    /// one; `None` for the others.
    fn details(&self) -> Option<String> {
        // Exhaustive on purpose: adding a variant must force a decision here.
        match self {
            ChunkError::CodeIndexOfBounds { offset, .. } => Some(format!("Code index: {}", offset)),
            ChunkError::ConstantAlreadyUsed { index, .. }
            | ChunkError::ConstantIndexOutOfBounds { index, .. } => {
                Some(format!("Constant index: {}", index))
            }
            ChunkError::LocalIndexOutOfBounds { index, .. } => {
                Some(format!("Identifier index: {}", index))
            }
            ChunkError::IdentifierNotFound { identifier, .. } => {
                Some(format!("Identifier: {}", identifier))
            }
            ChunkError::ConstantOverflow { .. }
            | ChunkError::InstructionUnderflow { .. }
            | ChunkError::IdentifierOverflow { .. } => None,
        }
    }

    /// Source span the error refers to.
    ///
    /// Every variant stores a position, so this never panics.
    fn position(&self) -> Span {
        match self {
            ChunkError::CodeIndexOfBounds { position, .. }
            | ChunkError::ConstantAlreadyUsed { position, .. }
            | ChunkError::ConstantOverflow { position }
            | ChunkError::ConstantIndexOutOfBounds { position, .. }
            | ChunkError::InstructionUnderflow { position }
            | ChunkError::LocalIndexOutOfBounds { position, .. }
            | ChunkError::IdentifierOverflow { position }
            | ChunkError::IdentifierNotFound { position, .. } => *position,
        }
    }
}