683281363d
Optimizing Forth 2012 compiler targeting WebAssembly with IR-based compilation pipeline, multi-typed stack inference, subroutine threading, and JIT/consolidation modes. Rust kernel with ~35 primitives and Forth standard library for core/core-ext word sets.
135 lines
4.7 KiB
Rust
135 lines
4.7 KiB
Rust
//! Linear memory layout and stack operations for WAFER.
|
|
//!
|
|
//! WAFER uses WASM linear memory for the dictionary, return stack,
|
|
//! and as a fallback for the data and float stacks when types are unknown.
|
|
//! When type inference succeeds, values stay in WASM locals/operand stack instead.
|
|
|
|
/// Size of one memory page in WASM (64 KiB).
|
|
pub const PAGE_SIZE: u32 = 65536;
|
|
|
|
/// Initial number of memory pages.
|
|
pub const INITIAL_PAGES: u32 = 16; // 1 MiB
|
|
|
|
/// Maximum number of memory pages.
|
|
pub const MAX_PAGES: u32 = 256; // 16 MiB
|
|
|
|
// Memory region layout
|
|
// All offsets are byte addresses in linear memory.
|
|
|
|
/// System variables region (STATE, BASE, >IN, HLD, etc.)
|
|
pub const SYSVAR_BASE: u32 = 0x0000;
|
|
/// Size of system variables region.
|
|
pub const SYSVAR_SIZE: u32 = 64;
|
|
|
|
/// Input buffer for source parsing.
|
|
pub const INPUT_BUFFER_BASE: u32 = SYSVAR_BASE + SYSVAR_SIZE; // 0x0040
|
|
/// Size of input buffer.
|
|
pub const INPUT_BUFFER_SIZE: u32 = 1024;
|
|
|
|
/// PAD - scratch area for string formatting.
|
|
pub const PAD_BASE: u32 = INPUT_BUFFER_BASE + INPUT_BUFFER_SIZE; // 0x0440
|
|
/// Size of PAD.
|
|
pub const PAD_SIZE: u32 = 256;
|
|
|
|
/// Data stack region (fallback when types are unknown).
|
|
/// Grows downward from the top of this region.
|
|
pub const DATA_STACK_BASE: u32 = PAD_BASE + PAD_SIZE; // 0x0540
|
|
/// Size of data stack region.
|
|
pub const DATA_STACK_SIZE: u32 = 4096; // 1024 cells
|
|
|
|
/// Return stack region. Grows downward.
|
|
pub const RETURN_STACK_BASE: u32 = DATA_STACK_BASE + DATA_STACK_SIZE; // 0x1540
|
|
/// Size of return stack region.
|
|
pub const RETURN_STACK_SIZE: u32 = 4096;
|
|
|
|
/// Floating-point stack region (fallback). Grows downward.
|
|
pub const FLOAT_STACK_BASE: u32 = RETURN_STACK_BASE + RETURN_STACK_SIZE; // 0x2540
|
|
/// Size of float stack region.
|
|
pub const FLOAT_STACK_SIZE: u32 = 2048; // 256 doubles
|
|
|
|
/// Dictionary region start. Grows upward.
|
|
pub const DICTIONARY_BASE: u32 = FLOAT_STACK_BASE + FLOAT_STACK_SIZE; // 0x2D40
|
|
|
|
/// Initial top of data stack (grows down from here).
|
|
pub const DATA_STACK_TOP: u32 = DATA_STACK_BASE + DATA_STACK_SIZE;
|
|
|
|
/// Initial top of return stack (grows down from here).
|
|
pub const RETURN_STACK_TOP: u32 = RETURN_STACK_BASE + RETURN_STACK_SIZE;
|
|
|
|
/// Initial top of float stack (grows down from here).
|
|
pub const FLOAT_STACK_TOP: u32 = FLOAT_STACK_BASE + FLOAT_STACK_SIZE;
|
|
|
|
/// Size of one cell (4 bytes for i32).
|
|
pub const CELL_SIZE: u32 = 4;
|
|
|
|
/// Size of one double-cell (8 bytes).
|
|
pub const DOUBLE_CELL_SIZE: u32 = 8;
|
|
|
|
/// Size of one float (8 bytes for f64).
|
|
pub const FLOAT_SIZE: u32 = 8;
|
|
|
|
// System variable offsets within SYSVAR region
|
|
|
|
/// STATE: 0 = interpreting, -1 (0xFFFFFFFF) = compiling.
|
|
pub const SYSVAR_STATE: u32 = SYSVAR_BASE;
|
|
/// BASE: current number base (default 10).
|
|
pub const SYSVAR_BASE_VAR: u32 = SYSVAR_BASE + 4;
|
|
/// >IN: offset into the input buffer.
|
|
pub const SYSVAR_TO_IN: u32 = SYSVAR_BASE + 8;
|
|
/// HERE: next free dictionary address.
|
|
pub const SYSVAR_HERE: u32 = SYSVAR_BASE + 12;
|
|
/// LATEST: pointer to the most recent dictionary entry.
|
|
pub const SYSVAR_LATEST: u32 = SYSVAR_BASE + 16;
|
|
/// SOURCE-ID: current input source (0 = user input, -1 = string).
|
|
pub const SYSVAR_SOURCE_ID: u32 = SYSVAR_BASE + 20;
|
|
/// #TIB: length of current input.
|
|
pub const SYSVAR_NUM_TIB: u32 = SYSVAR_BASE + 24;
|
|
/// HLD: pointer for pictured numeric output.
|
|
pub const SYSVAR_HLD: u32 = SYSVAR_BASE + 28;
|
|
|
|
#[cfg(test)]
|
|
mod tests {
|
|
use super::*;
|
|
|
|
#[test]
|
|
fn memory_regions_dont_overlap() {
|
|
// Each region should start after the previous one ends
|
|
assert!(INPUT_BUFFER_BASE >= SYSVAR_BASE + SYSVAR_SIZE);
|
|
assert!(PAD_BASE >= INPUT_BUFFER_BASE + INPUT_BUFFER_SIZE);
|
|
assert!(DATA_STACK_BASE >= PAD_BASE + PAD_SIZE);
|
|
assert!(RETURN_STACK_BASE >= DATA_STACK_BASE + DATA_STACK_SIZE);
|
|
assert!(FLOAT_STACK_BASE >= RETURN_STACK_BASE + RETURN_STACK_SIZE);
|
|
assert!(DICTIONARY_BASE >= FLOAT_STACK_BASE + FLOAT_STACK_SIZE);
|
|
}
|
|
|
|
#[test]
|
|
fn dictionary_starts_within_first_page() {
|
|
assert!(DICTIONARY_BASE < PAGE_SIZE);
|
|
}
|
|
|
|
#[test]
|
|
fn stack_tops_are_correct() {
|
|
assert_eq!(DATA_STACK_TOP, DATA_STACK_BASE + DATA_STACK_SIZE);
|
|
assert_eq!(RETURN_STACK_TOP, RETURN_STACK_BASE + RETURN_STACK_SIZE);
|
|
assert_eq!(FLOAT_STACK_TOP, FLOAT_STACK_BASE + FLOAT_STACK_SIZE);
|
|
}
|
|
|
|
#[test]
|
|
fn sysvar_offsets_are_within_region() {
|
|
let all_offsets = [
|
|
SYSVAR_STATE,
|
|
SYSVAR_BASE_VAR,
|
|
SYSVAR_TO_IN,
|
|
SYSVAR_HERE,
|
|
SYSVAR_LATEST,
|
|
SYSVAR_SOURCE_ID,
|
|
SYSVAR_NUM_TIB,
|
|
SYSVAR_HLD,
|
|
];
|
|
for offset in all_offsets {
|
|
assert!(offset >= SYSVAR_BASE);
|
|
assert!(offset + CELL_SIZE <= SYSVAR_BASE + SYSVAR_SIZE);
|
|
}
|
|
}
|
|
}
|