Compare commits
20 Commits
elf
..
05a25447b2
| Author | SHA1 | Date | |
|---|---|---|---|
| 05a25447b2 | |||
| 56d2abe17f | |||
| eaaefd1b07 | |||
| 5302ad3876 | |||
| 2280f1e5d9 | |||
| ae92510fb8 | |||
| 7c63340888 | |||
| e9f04824ea | |||
| 620584488b | |||
| 1101331f70 | |||
| c171b0db89 | |||
| 82b99c127c | |||
| 92c4660a4d | |||
| 2a6991fe4a | |||
| 0fdd28aad1 | |||
| f639240b6c | |||
| d2c1492dca | |||
| 4ef8bbdf46 | |||
| 76197fac8f | |||
| bc5ddef311 |
@@ -5,7 +5,3 @@ rustc-wrapper = "sccache"
|
|||||||
|
|
||||||
[future-incompat-report]
|
[future-incompat-report]
|
||||||
frequency = "always"
|
frequency = "always"
|
||||||
|
|
||||||
[profile.profiling]
|
|
||||||
inherits = "release"
|
|
||||||
debug = true
|
|
||||||
|
|||||||
+2
-1
@@ -1,2 +1,3 @@
|
|||||||
/target
|
/target
|
||||||
**/*.env
|
**/*.env
|
||||||
|
book
|
||||||
|
|||||||
Vendored
+7
-1
@@ -5,5 +5,11 @@
|
|||||||
"files.eol": "\n",
|
"files.eol": "\n",
|
||||||
"files.insertFinalNewline": true,
|
"files.insertFinalNewline": true,
|
||||||
"files.trimFinalNewlines": true,
|
"files.trimFinalNewlines": true,
|
||||||
"files.trimTrailingWhitespace": true
|
"files.trimTrailingWhitespace": true,
|
||||||
|
"gitea.owner": "LowLevelDevs",
|
||||||
|
"gitea.repo": "damn_simple_architecture",
|
||||||
|
"[markdown]": {
|
||||||
|
"editor.formatOnSave": true,
|
||||||
|
"editor.formatOnPaste": true
|
||||||
|
}
|
||||||
}
|
}
|
||||||
|
|||||||
Generated
+3
-185
@@ -129,15 +129,6 @@ dependencies = [
|
|||||||
"zerocopy",
|
"zerocopy",
|
||||||
]
|
]
|
||||||
|
|
||||||
[[package]]
|
|
||||||
name = "aho-corasick"
|
|
||||||
version = "1.1.3"
|
|
||||||
source = "registry+https://github.com/rust-lang/crates.io-index"
|
|
||||||
checksum = "8e60d3430d3a69478ad0993f19238d2df97c507009a52b3c10addcd7f6bcb916"
|
|
||||||
dependencies = [
|
|
||||||
"memchr",
|
|
||||||
]
|
|
||||||
|
|
||||||
[[package]]
|
[[package]]
|
||||||
name = "android-activity"
|
name = "android-activity"
|
||||||
version = "0.6.0"
|
version = "0.6.0"
|
||||||
@@ -174,56 +165,6 @@ dependencies = [
|
|||||||
"libc",
|
"libc",
|
||||||
]
|
]
|
||||||
|
|
||||||
[[package]]
|
|
||||||
name = "anstream"
|
|
||||||
version = "0.6.19"
|
|
||||||
source = "registry+https://github.com/rust-lang/crates.io-index"
|
|
||||||
checksum = "301af1932e46185686725e0fad2f8f2aa7da69dd70bf6ecc44d6b703844a3933"
|
|
||||||
dependencies = [
|
|
||||||
"anstyle",
|
|
||||||
"anstyle-parse",
|
|
||||||
"anstyle-query",
|
|
||||||
"anstyle-wincon",
|
|
||||||
"colorchoice",
|
|
||||||
"is_terminal_polyfill",
|
|
||||||
"utf8parse",
|
|
||||||
]
|
|
||||||
|
|
||||||
[[package]]
|
|
||||||
name = "anstyle"
|
|
||||||
version = "1.0.11"
|
|
||||||
source = "registry+https://github.com/rust-lang/crates.io-index"
|
|
||||||
checksum = "862ed96ca487e809f1c8e5a8447f6ee2cf102f846893800b20cebdf541fc6bbd"
|
|
||||||
|
|
||||||
[[package]]
|
|
||||||
name = "anstyle-parse"
|
|
||||||
version = "0.2.7"
|
|
||||||
source = "registry+https://github.com/rust-lang/crates.io-index"
|
|
||||||
checksum = "4e7644824f0aa2c7b9384579234ef10eb7efb6a0deb83f9630a49594dd9c15c2"
|
|
||||||
dependencies = [
|
|
||||||
"utf8parse",
|
|
||||||
]
|
|
||||||
|
|
||||||
[[package]]
|
|
||||||
name = "anstyle-query"
|
|
||||||
version = "1.1.3"
|
|
||||||
source = "registry+https://github.com/rust-lang/crates.io-index"
|
|
||||||
checksum = "6c8bdeb6047d8983be085bab0ba1472e6dc604e7041dbf6fcd5e71523014fae9"
|
|
||||||
dependencies = [
|
|
||||||
"windows-sys 0.59.0",
|
|
||||||
]
|
|
||||||
|
|
||||||
[[package]]
|
|
||||||
name = "anstyle-wincon"
|
|
||||||
version = "3.0.9"
|
|
||||||
source = "registry+https://github.com/rust-lang/crates.io-index"
|
|
||||||
checksum = "403f75924867bb1033c59fbf0797484329750cfbe3c4325cd33127941fabc882"
|
|
||||||
dependencies = [
|
|
||||||
"anstyle",
|
|
||||||
"once_cell_polyfill",
|
|
||||||
"windows-sys 0.59.0",
|
|
||||||
]
|
|
||||||
|
|
||||||
[[package]]
|
[[package]]
|
||||||
name = "arboard"
|
name = "arboard"
|
||||||
version = "3.5.0"
|
version = "3.5.0"
|
||||||
@@ -275,12 +216,9 @@ dependencies = [
|
|||||||
name = "assembler"
|
name = "assembler"
|
||||||
version = "0.2.0"
|
version = "0.2.0"
|
||||||
dependencies = [
|
dependencies = [
|
||||||
"clap",
|
|
||||||
"common",
|
"common",
|
||||||
"num_cpus",
|
"num_cpus",
|
||||||
"regex",
|
|
||||||
"threadpool",
|
"threadpool",
|
||||||
"uuid",
|
|
||||||
]
|
]
|
||||||
|
|
||||||
[[package]]
|
[[package]]
|
||||||
@@ -665,46 +603,6 @@ dependencies = [
|
|||||||
"libc",
|
"libc",
|
||||||
]
|
]
|
||||||
|
|
||||||
[[package]]
|
|
||||||
name = "clap"
|
|
||||||
version = "4.5.40"
|
|
||||||
source = "registry+https://github.com/rust-lang/crates.io-index"
|
|
||||||
checksum = "40b6887a1d8685cebccf115538db5c0efe625ccac9696ad45c409d96566e910f"
|
|
||||||
dependencies = [
|
|
||||||
"clap_builder",
|
|
||||||
"clap_derive",
|
|
||||||
]
|
|
||||||
|
|
||||||
[[package]]
|
|
||||||
name = "clap_builder"
|
|
||||||
version = "4.5.40"
|
|
||||||
source = "registry+https://github.com/rust-lang/crates.io-index"
|
|
||||||
checksum = "e0c66c08ce9f0c698cbce5c0279d0bb6ac936d8674174fe48f736533b964f59e"
|
|
||||||
dependencies = [
|
|
||||||
"anstream",
|
|
||||||
"anstyle",
|
|
||||||
"clap_lex",
|
|
||||||
"strsim",
|
|
||||||
]
|
|
||||||
|
|
||||||
[[package]]
|
|
||||||
name = "clap_derive"
|
|
||||||
version = "4.5.40"
|
|
||||||
source = "registry+https://github.com/rust-lang/crates.io-index"
|
|
||||||
checksum = "d2c7947ae4cc3d851207c1adb5b5e260ff0cca11446b1d6d1423788e442257ce"
|
|
||||||
dependencies = [
|
|
||||||
"heck",
|
|
||||||
"proc-macro2",
|
|
||||||
"quote",
|
|
||||||
"syn",
|
|
||||||
]
|
|
||||||
|
|
||||||
[[package]]
|
|
||||||
name = "clap_lex"
|
|
||||||
version = "0.7.5"
|
|
||||||
source = "registry+https://github.com/rust-lang/crates.io-index"
|
|
||||||
checksum = "b94f61472cee1439c0b966b47e3aca9ae07e45d070759512cd390ea2bebc6675"
|
|
||||||
|
|
||||||
[[package]]
|
[[package]]
|
||||||
name = "clipboard-win"
|
name = "clipboard-win"
|
||||||
version = "5.4.0"
|
version = "5.4.0"
|
||||||
@@ -724,12 +622,6 @@ dependencies = [
|
|||||||
"unicode-width",
|
"unicode-width",
|
||||||
]
|
]
|
||||||
|
|
||||||
[[package]]
|
|
||||||
name = "colorchoice"
|
|
||||||
version = "1.0.4"
|
|
||||||
source = "registry+https://github.com/rust-lang/crates.io-index"
|
|
||||||
checksum = "b05b61dc5112cbb17e4b6cd61790d9845d13888356391624cbe7e41efeac1e75"
|
|
||||||
|
|
||||||
[[package]]
|
[[package]]
|
||||||
name = "colorful"
|
name = "colorful"
|
||||||
version = "0.3.2"
|
version = "0.3.2"
|
||||||
@@ -749,9 +641,6 @@ dependencies = [
|
|||||||
[[package]]
|
[[package]]
|
||||||
name = "common"
|
name = "common"
|
||||||
version = "0.2.0"
|
version = "0.2.0"
|
||||||
dependencies = [
|
|
||||||
"object",
|
|
||||||
]
|
|
||||||
|
|
||||||
[[package]]
|
[[package]]
|
||||||
name = "concurrent-queue"
|
name = "concurrent-queue"
|
||||||
@@ -894,9 +783,9 @@ dependencies = [
|
|||||||
|
|
||||||
[[package]]
|
[[package]]
|
||||||
name = "discord-presence"
|
name = "discord-presence"
|
||||||
version = "1.6.0"
|
version = "2.0.0"
|
||||||
source = "registry+https://github.com/rust-lang/crates.io-index"
|
source = "registry+https://github.com/rust-lang/crates.io-index"
|
||||||
checksum = "f91d7c2fc01ffdc327e2b66d65dd59b8bd3f31a17e88811ce0540412fa0b84c1"
|
checksum = "91948dab8ccaaefeb7be5f21714ed774411df66830def1f99dd74e7a85f5f111"
|
||||||
dependencies = [
|
dependencies = [
|
||||||
"byteorder",
|
"byteorder",
|
||||||
"bytes",
|
"bytes",
|
||||||
@@ -1138,6 +1027,7 @@ dependencies = [
|
|||||||
"eframe",
|
"eframe",
|
||||||
"egui",
|
"egui",
|
||||||
"egui_file",
|
"egui_file",
|
||||||
|
"rustc-hash 2.1.1",
|
||||||
"serde",
|
"serde",
|
||||||
"toml",
|
"toml",
|
||||||
"winit",
|
"winit",
|
||||||
@@ -1712,12 +1602,6 @@ dependencies = [
|
|||||||
"hashbrown",
|
"hashbrown",
|
||||||
]
|
]
|
||||||
|
|
||||||
[[package]]
|
|
||||||
name = "is_terminal_polyfill"
|
|
||||||
version = "1.70.1"
|
|
||||||
source = "registry+https://github.com/rust-lang/crates.io-index"
|
|
||||||
checksum = "7943c866cc5cd64cbc25b2e01621d07fa8eb2a1a23160ee81ce38704e97b8ecf"
|
|
||||||
|
|
||||||
[[package]]
|
[[package]]
|
||||||
name = "itoa"
|
name = "itoa"
|
||||||
version = "1.0.15"
|
version = "1.0.15"
|
||||||
@@ -2326,31 +2210,12 @@ dependencies = [
|
|||||||
"objc2-foundation 0.2.2",
|
"objc2-foundation 0.2.2",
|
||||||
]
|
]
|
||||||
|
|
||||||
[[package]]
|
|
||||||
name = "object"
|
|
||||||
version = "0.37.1"
|
|
||||||
source = "registry+https://github.com/rust-lang/crates.io-index"
|
|
||||||
checksum = "03fd943161069e1768b4b3d050890ba48730e590f57e56d4aa04e7e090e61b4a"
|
|
||||||
dependencies = [
|
|
||||||
"crc32fast",
|
|
||||||
"hashbrown",
|
|
||||||
"indexmap",
|
|
||||||
"memchr",
|
|
||||||
"rustc-std-workspace-alloc",
|
|
||||||
]
|
|
||||||
|
|
||||||
[[package]]
|
[[package]]
|
||||||
name = "once_cell"
|
name = "once_cell"
|
||||||
version = "1.21.3"
|
version = "1.21.3"
|
||||||
source = "registry+https://github.com/rust-lang/crates.io-index"
|
source = "registry+https://github.com/rust-lang/crates.io-index"
|
||||||
checksum = "42f5e15c9953c5e4ccceeb2e7382a716482c34515315f7b03532b8b4e8393d2d"
|
checksum = "42f5e15c9953c5e4ccceeb2e7382a716482c34515315f7b03532b8b4e8393d2d"
|
||||||
|
|
||||||
[[package]]
|
|
||||||
name = "once_cell_polyfill"
|
|
||||||
version = "1.70.1"
|
|
||||||
source = "registry+https://github.com/rust-lang/crates.io-index"
|
|
||||||
checksum = "a4895175b425cb1f87721b59f0f286c2092bd4af812243672510e1ac53e2e0ad"
|
|
||||||
|
|
||||||
[[package]]
|
[[package]]
|
||||||
name = "option-ext"
|
name = "option-ext"
|
||||||
version = "0.2.0"
|
version = "0.2.0"
|
||||||
@@ -2701,35 +2566,6 @@ dependencies = [
|
|||||||
"thiserror 2.0.12",
|
"thiserror 2.0.12",
|
||||||
]
|
]
|
||||||
|
|
||||||
[[package]]
|
|
||||||
name = "regex"
|
|
||||||
version = "1.11.1"
|
|
||||||
source = "registry+https://github.com/rust-lang/crates.io-index"
|
|
||||||
checksum = "b544ef1b4eac5dc2db33ea63606ae9ffcfac26c1416a2806ae0bf5f56b201191"
|
|
||||||
dependencies = [
|
|
||||||
"aho-corasick",
|
|
||||||
"memchr",
|
|
||||||
"regex-automata",
|
|
||||||
"regex-syntax",
|
|
||||||
]
|
|
||||||
|
|
||||||
[[package]]
|
|
||||||
name = "regex-automata"
|
|
||||||
version = "0.4.9"
|
|
||||||
source = "registry+https://github.com/rust-lang/crates.io-index"
|
|
||||||
checksum = "809e8dc61f6de73b46c85f4c96486310fe304c434cfa43669d7b40f711150908"
|
|
||||||
dependencies = [
|
|
||||||
"aho-corasick",
|
|
||||||
"memchr",
|
|
||||||
"regex-syntax",
|
|
||||||
]
|
|
||||||
|
|
||||||
[[package]]
|
|
||||||
name = "regex-syntax"
|
|
||||||
version = "0.8.5"
|
|
||||||
source = "registry+https://github.com/rust-lang/crates.io-index"
|
|
||||||
checksum = "2b15c43186be67a4fd63bee50d0303afffcef381492ebe2c5d87f324e1b8815c"
|
|
||||||
|
|
||||||
[[package]]
|
[[package]]
|
||||||
name = "renderdoc-sys"
|
name = "renderdoc-sys"
|
||||||
version = "1.1.0"
|
version = "1.1.0"
|
||||||
@@ -2748,12 +2584,6 @@ version = "2.1.1"
|
|||||||
source = "registry+https://github.com/rust-lang/crates.io-index"
|
source = "registry+https://github.com/rust-lang/crates.io-index"
|
||||||
checksum = "357703d41365b4b27c590e3ed91eabb1b663f07c4c084095e60cbed4362dff0d"
|
checksum = "357703d41365b4b27c590e3ed91eabb1b663f07c4c084095e60cbed4362dff0d"
|
||||||
|
|
||||||
[[package]]
|
|
||||||
name = "rustc-std-workspace-alloc"
|
|
||||||
version = "1.0.1"
|
|
||||||
source = "registry+https://github.com/rust-lang/crates.io-index"
|
|
||||||
checksum = "f9d441c3b2ebf55cebf796bfdc265d67fa09db17b7bb6bd4be75c509e1e8fec3"
|
|
||||||
|
|
||||||
[[package]]
|
[[package]]
|
||||||
name = "rustix"
|
name = "rustix"
|
||||||
version = "0.38.44"
|
version = "0.38.44"
|
||||||
@@ -3003,12 +2833,6 @@ version = "0.1.1"
|
|||||||
source = "registry+https://github.com/rust-lang/crates.io-index"
|
source = "registry+https://github.com/rust-lang/crates.io-index"
|
||||||
checksum = "6637bab7722d379c8b41ba849228d680cc12d0a45ba1fa2b48f2a30577a06731"
|
checksum = "6637bab7722d379c8b41ba849228d680cc12d0a45ba1fa2b48f2a30577a06731"
|
||||||
|
|
||||||
[[package]]
|
|
||||||
name = "strsim"
|
|
||||||
version = "0.11.1"
|
|
||||||
source = "registry+https://github.com/rust-lang/crates.io-index"
|
|
||||||
checksum = "7da8b5736845d9f2fcb837ea5d9e2628564b3b043a70948a3f0b778838c5fb4f"
|
|
||||||
|
|
||||||
[[package]]
|
[[package]]
|
||||||
name = "strum"
|
name = "strum"
|
||||||
version = "0.26.3"
|
version = "0.26.3"
|
||||||
@@ -3315,12 +3139,6 @@ version = "1.0.4"
|
|||||||
source = "registry+https://github.com/rust-lang/crates.io-index"
|
source = "registry+https://github.com/rust-lang/crates.io-index"
|
||||||
checksum = "b6c140620e7ffbb22c2dee59cafe6084a59b5ffc27a8859a5f0d494b5d52b6be"
|
checksum = "b6c140620e7ffbb22c2dee59cafe6084a59b5ffc27a8859a5f0d494b5d52b6be"
|
||||||
|
|
||||||
[[package]]
|
|
||||||
name = "utf8parse"
|
|
||||||
version = "0.2.2"
|
|
||||||
source = "registry+https://github.com/rust-lang/crates.io-index"
|
|
||||||
checksum = "06abde3611657adf66d383f00b093d7faecc7fa57071cce2578660c9f1010821"
|
|
||||||
|
|
||||||
[[package]]
|
[[package]]
|
||||||
name = "uuid"
|
name = "uuid"
|
||||||
version = "1.17.0"
|
version = "1.17.0"
|
||||||
|
|||||||
+1
-1
@@ -17,5 +17,5 @@ debug = true
|
|||||||
incremental = false # sccache does not support caching incremental crates.
|
incremental = false # sccache does not support caching incremental crates.
|
||||||
|
|
||||||
[profile.release]
|
[profile.release]
|
||||||
incremental = true
|
debug = true
|
||||||
lto = "fat"
|
lto = "fat"
|
||||||
|
|||||||
@@ -13,9 +13,6 @@ name = "assembler"
|
|||||||
path = "src/lib.rs"
|
path = "src/lib.rs"
|
||||||
|
|
||||||
[dependencies]
|
[dependencies]
|
||||||
clap = { version = "4.5.40", features = ["derive"] }
|
|
||||||
common = { path = "../common" }
|
common = { path = "../common" }
|
||||||
num_cpus = "1.17.0"
|
num_cpus = "1.17.0"
|
||||||
regex = "1.11.1"
|
|
||||||
threadpool = "1.8.1"
|
threadpool = "1.8.1"
|
||||||
uuid = { version = "1.17.0", features = ["v4"] }
|
|
||||||
|
|||||||
@@ -1,21 +0,0 @@
|
|||||||
use clap::{Parser, ValueEnum};
|
|
||||||
|
|
||||||
#[derive(Debug, Parser, Default)]
|
|
||||||
pub struct Args {
|
|
||||||
/// The output format to assemble to. Currently just ELF or a flat binary.
|
|
||||||
#[arg(value_enum)]
|
|
||||||
output_format: Option<OutputFormat>,
|
|
||||||
/// Whether the relocatable object files should be statically linked into a single
|
|
||||||
/// executable or library.
|
|
||||||
link: bool,
|
|
||||||
}
|
|
||||||
|
|
||||||
#[derive(Debug, Clone, Copy, ValueEnum, Default)]
|
|
||||||
/// The executable format the output should take.
|
|
||||||
pub enum OutputFormat {
|
|
||||||
/// An ELF file.
|
|
||||||
#[default]
|
|
||||||
Elf,
|
|
||||||
/// A flat binary file.
|
|
||||||
Flat,
|
|
||||||
}
|
|
||||||
@@ -0,0 +1,264 @@
|
|||||||
|
use std::{
|
||||||
|
collections::HashSet,
|
||||||
|
fs,
|
||||||
|
path::{self, Path, PathBuf},
|
||||||
|
sync::{Arc, Mutex},
|
||||||
|
thread::{self, JoinHandle},
|
||||||
|
};
|
||||||
|
|
||||||
|
use crate::assembler::{AssembleError, Token, expand_pseudo_ops, lexer, quick_hash};
|
||||||
|
use crate::assembler::{Node, Parser, resolve_dependencies};
|
||||||
|
use crate::util::logging::Logger;
|
||||||
|
|
||||||
|
// pub fn new_assemble(path: &Path) {
|
||||||
|
// let program = Program::new();
|
||||||
|
// let program_ref = ProgramRef::new(program);
|
||||||
|
|
||||||
|
// let task = Module::build(path.to_path_buf(), program_ref.clone());
|
||||||
|
// program_ref.add_task(task);
|
||||||
|
|
||||||
|
// // wait on all tasks to finish
|
||||||
|
// for task in program_ref.get_tasks() {
|
||||||
|
// let module = task.module.join().unwrap();
|
||||||
|
// program_ref.add_module(module);
|
||||||
|
// }
|
||||||
|
// }
|
||||||
|
|
||||||
|
pub struct Program {
|
||||||
|
pub main_path: PathBuf,
|
||||||
|
registry: HashSet<u64>,
|
||||||
|
modules: Vec<Module>,
|
||||||
|
tasks: Vec<Task>,
|
||||||
|
logger: Logger,
|
||||||
|
}
|
||||||
|
|
||||||
|
impl Program {
|
||||||
|
#[must_use]
|
||||||
|
pub fn new() -> Self {
|
||||||
|
Self {
|
||||||
|
registry: HashSet::new(),
|
||||||
|
modules: Vec::new(),
|
||||||
|
tasks: Vec::new(),
|
||||||
|
main_path: PathBuf::new(),
|
||||||
|
logger: Logger::new(),
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
pub fn add_task(&mut self, task: Task) {
|
||||||
|
self.tasks.push(task);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
impl Default for Program {
|
||||||
|
fn default() -> Self {
|
||||||
|
Self::new()
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
pub struct ProgramRef {
|
||||||
|
program: Arc<Mutex<Program>>,
|
||||||
|
}
|
||||||
|
|
||||||
|
impl ProgramRef {
|
||||||
|
#[must_use]
|
||||||
|
pub fn new(program: Program) -> Self {
|
||||||
|
Self {
|
||||||
|
program: Arc::new(Mutex::new(program)),
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
pub fn register(&self, path: &Path) {
|
||||||
|
self.program
|
||||||
|
.lock()
|
||||||
|
.expect("Failed to acquire program lock")
|
||||||
|
.registry
|
||||||
|
.insert(quick_hash(path));
|
||||||
|
}
|
||||||
|
|
||||||
|
#[must_use]
|
||||||
|
pub fn is_registered(&self, path: &Path) -> bool {
|
||||||
|
self.program
|
||||||
|
.lock()
|
||||||
|
.expect("Failed to acquire program lock")
|
||||||
|
.registry
|
||||||
|
.contains(&quick_hash(path))
|
||||||
|
}
|
||||||
|
|
||||||
|
// pub fn get_tasks(&self) -> Vec<&Task> {
|
||||||
|
// self.program.lock().unwrap().tasks.iter().collect()
|
||||||
|
// }
|
||||||
|
|
||||||
|
pub fn add_task(&self, task: Task) {
|
||||||
|
self.program
|
||||||
|
.lock()
|
||||||
|
.expect("Failed to acquire program lock")
|
||||||
|
.add_task(task);
|
||||||
|
}
|
||||||
|
|
||||||
|
pub fn add_module(&self, module: Module) {
|
||||||
|
self.program
|
||||||
|
.lock()
|
||||||
|
.expect("Failed to acquire program lock")
|
||||||
|
.modules
|
||||||
|
.push(module);
|
||||||
|
}
|
||||||
|
|
||||||
|
pub fn log(&self, message: &str) {
|
||||||
|
self.program
|
||||||
|
.lock()
|
||||||
|
.expect("Failed to acquire program lock")
|
||||||
|
.logger
|
||||||
|
.log(message);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
impl Clone for ProgramRef {
|
||||||
|
fn clone(&self) -> Self {
|
||||||
|
Self {
|
||||||
|
program: self.program.clone(),
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
pub struct Module {
|
||||||
|
pub path: PathBuf,
|
||||||
|
pub hash: u64,
|
||||||
|
pub nodes: Vec<Node>,
|
||||||
|
program: ProgramRef,
|
||||||
|
}
|
||||||
|
|
||||||
|
impl Module {
|
||||||
|
#[must_use]
|
||||||
|
pub const fn new(
|
||||||
|
path: PathBuf,
|
||||||
|
hash: u64,
|
||||||
|
nodes: Vec<Node>,
|
||||||
|
program: ProgramRef,
|
||||||
|
) -> Self {
|
||||||
|
Self {
|
||||||
|
path,
|
||||||
|
hash,
|
||||||
|
nodes,
|
||||||
|
program,
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
pub fn build(path: PathBuf, program: ProgramRef) -> Result<Task, AssembleError> {
|
||||||
|
// Spawn a thread that creates the main function and executes the lexer and parser.
|
||||||
|
let handle = thread::spawn(move || {
|
||||||
|
let mut module =
|
||||||
|
Self::new(path.clone(), quick_hash(&path), Vec::new(), program.clone());
|
||||||
|
|
||||||
|
match module.lex() {
|
||||||
|
Ok(tokens) => {
|
||||||
|
module.parse(tokens);
|
||||||
|
module.expand();
|
||||||
|
module.prepare_dependencies();
|
||||||
|
module
|
||||||
|
}
|
||||||
|
Err(why) => {
|
||||||
|
eprintln!(
|
||||||
|
"Error building program at path `{}`: {why}",
|
||||||
|
path.display()
|
||||||
|
);
|
||||||
|
|
||||||
|
// TODO: Find a way to make this work without panicking.
|
||||||
|
unreachable!()
|
||||||
|
}
|
||||||
|
}
|
||||||
|
});
|
||||||
|
|
||||||
|
Ok(Task { module: handle })
|
||||||
|
}
|
||||||
|
|
||||||
|
fn lex(&self) -> Result<Vec<Token>, AssembleError> {
|
||||||
|
if let Ok(path) = self.path.canonicalize() {
|
||||||
|
self.program.log(&format!(
|
||||||
|
"{:20} {:20} [{}]",
|
||||||
|
"Building",
|
||||||
|
self.get_filename(),
|
||||||
|
path.display()
|
||||||
|
));
|
||||||
|
}
|
||||||
|
|
||||||
|
let src = fs::read_to_string(&self.path)
|
||||||
|
.map_err(|_| AssembleError::InvalidFile(self.path.clone()))?;
|
||||||
|
|
||||||
|
let file_hash = quick_hash(&self.path);
|
||||||
|
|
||||||
|
self.program
|
||||||
|
.log(&format!("{:20} {:20}", "Tokenising", self.get_filename()));
|
||||||
|
|
||||||
|
lexer::lexer(src, file_hash)
|
||||||
|
}
|
||||||
|
|
||||||
|
fn parse(&mut self, tokens: Vec<Token>) -> Result<(), AssembleError> {
|
||||||
|
self.program
|
||||||
|
.log(&format!("{:20} {:20}", "Parsing", self.get_filename()));
|
||||||
|
|
||||||
|
let parsed = Parser::parse_nodes(tokens)?;
|
||||||
|
self.nodes = parsed;
|
||||||
|
|
||||||
|
Ok(())
|
||||||
|
}
|
||||||
|
|
||||||
|
fn expand(&mut self) -> Result<(), AssembleError> {
|
||||||
|
self.program
|
||||||
|
.log(&format!("{:20} {:20}", "Expanding", self.get_filename()));
|
||||||
|
|
||||||
|
let expanded = expand_pseudo_ops(self.nodes.clone(), self.hash)?;
|
||||||
|
self.nodes = expanded;
|
||||||
|
|
||||||
|
Ok(())
|
||||||
|
}
|
||||||
|
|
||||||
|
fn prepare_dependencies(&self) -> Result<(), AssembleError> {
|
||||||
|
let nodes = resolve_dependencies(
|
||||||
|
self.nodes.clone(),
|
||||||
|
self.path.parent().expect("File should have a parent path!"),
|
||||||
|
)?;
|
||||||
|
|
||||||
|
let dependencies = Parser::get_dependencies(&nodes, &self.path)?;
|
||||||
|
|
||||||
|
for dep in dependencies {
|
||||||
|
if self.program.is_registered(&dep) {
|
||||||
|
// we have already built this module!
|
||||||
|
continue;
|
||||||
|
}
|
||||||
|
|
||||||
|
self.program.register(&dep);
|
||||||
|
|
||||||
|
// create new module
|
||||||
|
// add the task to the program
|
||||||
|
|
||||||
|
match Self::build(dep, self.program.clone()) {
|
||||||
|
Ok(task) => self.program.add_task(task),
|
||||||
|
Err(why) => {
|
||||||
|
eprintln!("Error building program: {why}");
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
Ok(())
|
||||||
|
}
|
||||||
|
|
||||||
|
/// Gets the filename from a [`PathBuf`].
|
||||||
|
fn get_filename(&self) -> &str {
|
||||||
|
self.path
|
||||||
|
.file_name()
|
||||||
|
.and_then(|f| f.to_str())
|
||||||
|
.unwrap_or_default()
|
||||||
|
}
|
||||||
|
|
||||||
|
/// Gets the parent filepath from a [`PathBuf`].
|
||||||
|
fn get_parent(&self) -> &str {
|
||||||
|
self.path
|
||||||
|
.parent()
|
||||||
|
.and_then(|f| f.to_str())
|
||||||
|
.unwrap_or_default()
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
pub struct Task {
|
||||||
|
module: JoinHandle<Module>,
|
||||||
|
}
|
||||||
@@ -0,0 +1,348 @@
|
|||||||
|
use common::{args, prelude::*};
|
||||||
|
|
||||||
|
use crate::assembler::model::{Node, Opcode};
|
||||||
|
use crate::{assembler::AssembleError, expect_token};
|
||||||
|
|
||||||
|
fn log(message: &str) {
|
||||||
|
println!("\x1b[32mINFO:\x1b[0m {message}");
|
||||||
|
}
|
||||||
|
|
||||||
|
pub fn codegen(nodes: Vec<Node>) -> Result<Vec<Instruction>, AssembleError> {
|
||||||
|
let mut instructions = vec![];
|
||||||
|
|
||||||
|
for node in nodes {
|
||||||
|
instructions.push(build_instruction(&node)?);
|
||||||
|
}
|
||||||
|
|
||||||
|
println!("------------------------");
|
||||||
|
log("Compilation Success ✅");
|
||||||
|
|
||||||
|
Ok(instructions)
|
||||||
|
}
|
||||||
|
|
||||||
|
fn build_instruction(node: &Node) -> Result<Instruction, AssembleError> {
|
||||||
|
let opcode = node.opcode();
|
||||||
|
let args = node.args();
|
||||||
|
|
||||||
|
match opcode {
|
||||||
|
Opcode::Nop => Ok(Instruction::Nop),
|
||||||
|
Opcode::Mov | Opcode::Movs => build_mov_instruction(opcode, &args),
|
||||||
|
Opcode::Ldb
|
||||||
|
| Opcode::Ldw
|
||||||
|
| Opcode::Ldh
|
||||||
|
| Opcode::Ldbs
|
||||||
|
| Opcode::Ldhs
|
||||||
|
| Opcode::Stb
|
||||||
|
| Opcode::Stw
|
||||||
|
| Opcode::Sth => build_memory_instruction(opcode, &args),
|
||||||
|
Opcode::Lli | Opcode::Lui => build_load_immediate_instruction(opcode, &args),
|
||||||
|
Opcode::Jmp
|
||||||
|
| Opcode::Jeq
|
||||||
|
| Opcode::Jne
|
||||||
|
| Opcode::Jgt
|
||||||
|
| Opcode::Jge
|
||||||
|
| Opcode::Jlt
|
||||||
|
| Opcode::Jle => build_jump_instruction(opcode, &args),
|
||||||
|
Opcode::Cmp => build_compare_instruction(&args),
|
||||||
|
Opcode::Inc | Opcode::Dec => build_inc_dec_instruction(opcode, &args),
|
||||||
|
Opcode::Shl | Opcode::Shr => build_shift_instruction(opcode, &args),
|
||||||
|
Opcode::Add
|
||||||
|
| Opcode::Sub
|
||||||
|
| Opcode::And
|
||||||
|
| Opcode::Or
|
||||||
|
| Opcode::Xor
|
||||||
|
| Opcode::Nand
|
||||||
|
| Opcode::Nor
|
||||||
|
| Opcode::Xnor => build_arithmetic_instruction(opcode, &args),
|
||||||
|
Opcode::AddI | Opcode::SubI => {
|
||||||
|
build_arithmetic_immediate_instruction(opcode, &args)
|
||||||
|
}
|
||||||
|
Opcode::Not => build_not_instruction(&args),
|
||||||
|
Opcode::Int => build_interrupt_instruction(&args),
|
||||||
|
Opcode::Irt => Ok(Instruction::IntReturn),
|
||||||
|
Opcode::Hlt => Ok(Instruction::Halt),
|
||||||
|
Opcode::Data => build_data_instruction(&args),
|
||||||
|
Opcode::Segment => build_segment_instruction(&args),
|
||||||
|
// These pseudo-instructions should have been expanded!
|
||||||
|
Opcode::Db
|
||||||
|
| Opcode::Dh
|
||||||
|
| Opcode::Dw
|
||||||
|
| Opcode::Resb
|
||||||
|
| Opcode::Resh
|
||||||
|
| Opcode::Resw
|
||||||
|
| Opcode::Push
|
||||||
|
| Opcode::Pop
|
||||||
|
| Opcode::Lwi
|
||||||
|
| Opcode::Include
|
||||||
|
| Opcode::Call
|
||||||
|
| Opcode::Return
|
||||||
|
| Opcode::Pusha
|
||||||
|
| Opcode::Popa => Err(AssembleError::InvalidArg),
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
fn build_mov_instruction(
|
||||||
|
opcode: Opcode,
|
||||||
|
args: &[crate::assembler::model::Token],
|
||||||
|
) -> Result<Instruction, AssembleError> {
|
||||||
|
let Some(src_token) = args.first() else {
|
||||||
|
return Err(AssembleError::MissingArgument(0));
|
||||||
|
};
|
||||||
|
let Some(dest_token) = args.get(1) else {
|
||||||
|
return Err(AssembleError::MissingArgument(1));
|
||||||
|
};
|
||||||
|
|
||||||
|
let src = expect_token!(src_token, Register)?;
|
||||||
|
let dest = expect_token!(dest_token, Register)?;
|
||||||
|
|
||||||
|
match opcode {
|
||||||
|
Opcode::Mov => Ok(Instruction::Mov(args!(R, sr1: src, dr: dest))),
|
||||||
|
Opcode::Movs => Ok(Instruction::MovSigned(args!(R, sr1: src, dr: dest))),
|
||||||
|
_ => unreachable!(),
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
fn build_memory_instruction(
|
||||||
|
opcode: Opcode,
|
||||||
|
args: &[crate::assembler::model::Token],
|
||||||
|
) -> Result<Instruction, AssembleError> {
|
||||||
|
let Some(base_token) = args.first() else {
|
||||||
|
return Err(AssembleError::MissingArgument(0));
|
||||||
|
};
|
||||||
|
let Some(dest_token) = args.get(1) else {
|
||||||
|
return Err(AssembleError::MissingArgument(1));
|
||||||
|
};
|
||||||
|
let Some(offset_token) = args.get(2) else {
|
||||||
|
return Err(AssembleError::MissingArgument(2));
|
||||||
|
};
|
||||||
|
|
||||||
|
let base = expect_token!(base_token, Register)?;
|
||||||
|
let dest = expect_token!(dest_token, Register)?;
|
||||||
|
let offset = expect_token!(offset_token, Immediate)?;
|
||||||
|
let instruction_args = args!(I, immediate: offset as u16, r1: base, r2: dest);
|
||||||
|
|
||||||
|
match opcode {
|
||||||
|
Opcode::Ldb => Ok(Instruction::LoadByte(instruction_args)),
|
||||||
|
Opcode::Ldw => Ok(Instruction::LoadWord(instruction_args)),
|
||||||
|
Opcode::Ldh => Ok(Instruction::LoadHalfword(instruction_args)),
|
||||||
|
Opcode::Ldbs => Ok(Instruction::LoadByteSigned(instruction_args)),
|
||||||
|
Opcode::Ldhs => Ok(Instruction::LoadHalfwordSigned(instruction_args)),
|
||||||
|
Opcode::Stb => Ok(Instruction::StoreByte(instruction_args)),
|
||||||
|
Opcode::Stw => Ok(Instruction::StoreWord(instruction_args)),
|
||||||
|
Opcode::Sth => Ok(Instruction::StoreHalfword(instruction_args)),
|
||||||
|
_ => unreachable!(),
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
fn build_load_immediate_instruction(
|
||||||
|
opcode: Opcode,
|
||||||
|
args: &[crate::assembler::model::Token],
|
||||||
|
) -> Result<Instruction, AssembleError> {
|
||||||
|
let Some(value_token) = args.first() else {
|
||||||
|
return Err(AssembleError::MissingArgument(0));
|
||||||
|
};
|
||||||
|
let Some(dest_token) = args.get(1) else {
|
||||||
|
return Err(AssembleError::MissingArgument(1));
|
||||||
|
};
|
||||||
|
|
||||||
|
let value = expect_token!(value_token, Immediate)?;
|
||||||
|
let dest = expect_token!(dest_token, Register)?;
|
||||||
|
|
||||||
|
match opcode {
|
||||||
|
Opcode::Lli => {
|
||||||
|
let instruction_args = args!(I, immediate: value as u16, r1: dest);
|
||||||
|
Ok(Instruction::LoadLowerImmediate(instruction_args))
|
||||||
|
}
|
||||||
|
Opcode::Lui => {
|
||||||
|
let upper_value = value >> 16;
|
||||||
|
let instruction_args = args!(I, immediate: upper_value as u16, r1: dest);
|
||||||
|
Ok(Instruction::LoadUpperImmediate(instruction_args))
|
||||||
|
}
|
||||||
|
_ => unreachable!(),
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
fn build_jump_instruction(
|
||||||
|
opcode: Opcode,
|
||||||
|
args: &[crate::assembler::model::Token],
|
||||||
|
) -> Result<Instruction, AssembleError> {
|
||||||
|
let Some(address_token) = args.first() else {
|
||||||
|
return Err(AssembleError::MissingArgument(0));
|
||||||
|
};
|
||||||
|
let Some(offset_token) = args.get(1) else {
|
||||||
|
return Err(AssembleError::MissingArgument(1));
|
||||||
|
};
|
||||||
|
|
||||||
|
let address = expect_token!(address_token, Immediate)?;
|
||||||
|
let offset = expect_token!(offset_token, Register)?;
|
||||||
|
let instruction_args = args!(I, immediate: address as u16, r1: offset);
|
||||||
|
|
||||||
|
match opcode {
|
||||||
|
Opcode::Jmp => Ok(Instruction::Jump(instruction_args)),
|
||||||
|
Opcode::Jeq => Ok(Instruction::JumpEq(instruction_args)),
|
||||||
|
Opcode::Jne => Ok(Instruction::JumpNeq(instruction_args)),
|
||||||
|
Opcode::Jgt => Ok(Instruction::JumpGt(instruction_args)),
|
||||||
|
Opcode::Jge => Ok(Instruction::JumpGe(instruction_args)),
|
||||||
|
Opcode::Jlt => Ok(Instruction::JumpLt(instruction_args)),
|
||||||
|
Opcode::Jle => Ok(Instruction::JumpLe(instruction_args)),
|
||||||
|
_ => unreachable!(),
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
fn build_compare_instruction(
|
||||||
|
args: &[crate::assembler::model::Token],
|
||||||
|
) -> Result<Instruction, AssembleError> {
|
||||||
|
let Some(left_token) = args.first() else {
|
||||||
|
return Err(AssembleError::MissingArgument(0));
|
||||||
|
};
|
||||||
|
let Some(right_token) = args.get(1) else {
|
||||||
|
return Err(AssembleError::MissingArgument(1));
|
||||||
|
};
|
||||||
|
|
||||||
|
let left = expect_token!(left_token, Register)?;
|
||||||
|
let right = expect_token!(right_token, Register)?;
|
||||||
|
Ok(Instruction::Compare(args!(R, sr1: left, sr2: right)))
|
||||||
|
}
|
||||||
|
|
||||||
|
fn build_inc_dec_instruction(
|
||||||
|
opcode: Opcode,
|
||||||
|
args: &[crate::assembler::model::Token],
|
||||||
|
) -> Result<Instruction, AssembleError> {
|
||||||
|
let Some(reg_token) = args.first() else {
|
||||||
|
return Err(AssembleError::MissingArgument(0));
|
||||||
|
};
|
||||||
|
|
||||||
|
let reg = expect_token!(reg_token, Register)?;
|
||||||
|
match opcode {
|
||||||
|
Opcode::Inc => Ok(Instruction::Increment(args!(R, sr1: reg))),
|
||||||
|
Opcode::Dec => Ok(Instruction::Decrement(args!(R, sr1: reg))),
|
||||||
|
_ => unreachable!(),
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
fn build_shift_instruction(
|
||||||
|
opcode: Opcode,
|
||||||
|
args: &[crate::assembler::model::Token],
|
||||||
|
) -> Result<Instruction, AssembleError> {
|
||||||
|
let Some(reg_token) = args.first() else {
|
||||||
|
return Err(AssembleError::MissingArgument(0));
|
||||||
|
};
|
||||||
|
let Some(amount_token) = args.get(1) else {
|
||||||
|
return Err(AssembleError::MissingArgument(1));
|
||||||
|
};
|
||||||
|
|
||||||
|
let reg = expect_token!(reg_token, Register)?;
|
||||||
|
let amount = expect_token!(amount_token, Immediate)? as u8;
|
||||||
|
|
||||||
|
match opcode {
|
||||||
|
Opcode::Shl => Ok(Instruction::ShiftLeft(args!(R, sr1: reg, shamt: amount))),
|
||||||
|
Opcode::Shr => Ok(Instruction::ShiftRight(args!(R, sr1: reg, shamt: amount))),
|
||||||
|
_ => unreachable!(),
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
fn build_arithmetic_instruction(
|
||||||
|
opcode: Opcode,
|
||||||
|
args: &[crate::assembler::model::Token],
|
||||||
|
) -> Result<Instruction, AssembleError> {
|
||||||
|
let Some(left_token) = args.first() else {
|
||||||
|
return Err(AssembleError::MissingArgument(0));
|
||||||
|
};
|
||||||
|
let Some(right_token) = args.get(1) else {
|
||||||
|
return Err(AssembleError::MissingArgument(1));
|
||||||
|
};
|
||||||
|
let Some(dest_token) = args.get(2) else {
|
||||||
|
return Err(AssembleError::MissingArgument(2));
|
||||||
|
};
|
||||||
|
|
||||||
|
let left = expect_token!(left_token, Register)?;
|
||||||
|
let right = expect_token!(right_token, Register)?;
|
||||||
|
let dest = expect_token!(dest_token, Register)?;
|
||||||
|
let instruction_args = args!(R, sr1: left, sr2: right, dr: dest);
|
||||||
|
|
||||||
|
match opcode {
|
||||||
|
Opcode::Add => Ok(Instruction::Add(instruction_args)),
|
||||||
|
Opcode::Sub => Ok(Instruction::Sub(instruction_args)),
|
||||||
|
Opcode::And => Ok(Instruction::And(instruction_args)),
|
||||||
|
Opcode::Or => Ok(Instruction::Or(instruction_args)),
|
||||||
|
Opcode::Xor => Ok(Instruction::Xor(instruction_args)),
|
||||||
|
Opcode::Nand => Ok(Instruction::Nand(instruction_args)),
|
||||||
|
Opcode::Nor => Ok(Instruction::Nor(instruction_args)),
|
||||||
|
Opcode::Xnor => Ok(Instruction::Xnor(instruction_args)),
|
||||||
|
_ => unreachable!(),
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
fn build_arithmetic_immediate_instruction(
|
||||||
|
opcode: Opcode,
|
||||||
|
args: &[crate::assembler::model::Token],
|
||||||
|
) -> Result<Instruction, AssembleError> {
|
||||||
|
let Some(reg_token) = args.first() else {
|
||||||
|
return Err(AssembleError::MissingArgument(0));
|
||||||
|
};
|
||||||
|
let Some(immediate_token) = args.get(1) else {
|
||||||
|
return Err(AssembleError::MissingArgument(1));
|
||||||
|
};
|
||||||
|
let Some(dest_token) = args.get(2) else {
|
||||||
|
return Err(AssembleError::MissingArgument(2));
|
||||||
|
};
|
||||||
|
|
||||||
|
let reg = expect_token!(reg_token, Register)?;
|
||||||
|
let immediate = expect_token!(immediate_token, Immediate)? as u16;
|
||||||
|
let dest = expect_token!(dest_token, Register)?;
|
||||||
|
let instruction_args = args!(I, immediate: immediate, r1: reg, r2: dest);
|
||||||
|
|
||||||
|
match opcode {
|
||||||
|
Opcode::AddI => Ok(Instruction::AddImmediate(instruction_args)),
|
||||||
|
Opcode::SubI => Ok(Instruction::SubImmediate(instruction_args)),
|
||||||
|
_ => unreachable!(),
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
fn build_not_instruction(
|
||||||
|
args: &[crate::assembler::model::Token],
|
||||||
|
) -> Result<Instruction, AssembleError> {
|
||||||
|
let Some(reg_token) = args.first() else {
|
||||||
|
return Err(AssembleError::MissingArgument(0));
|
||||||
|
};
|
||||||
|
let Some(dest_token) = args.get(1) else {
|
||||||
|
return Err(AssembleError::MissingArgument(1));
|
||||||
|
};
|
||||||
|
|
||||||
|
let reg = expect_token!(reg_token, Register)?;
|
||||||
|
let dest = expect_token!(dest_token, Register)?;
|
||||||
|
Ok(Instruction::Not(args!(R, sr1: reg, dr: dest)))
|
||||||
|
}
|
||||||
|
|
||||||
|
fn build_interrupt_instruction(
|
||||||
|
args: &[crate::assembler::model::Token],
|
||||||
|
) -> Result<Instruction, AssembleError> {
|
||||||
|
let Some(code_token) = args.first() else {
|
||||||
|
return Err(AssembleError::MissingArgument(0));
|
||||||
|
};
|
||||||
|
|
||||||
|
let code = expect_token!(code_token, Immediate)? as u8;
|
||||||
|
Ok(Instruction::Interrupt(Interrupt::Software(code)))
|
||||||
|
}
|
||||||
|
|
||||||
|
fn build_data_instruction(
|
||||||
|
args: &[crate::assembler::model::Token],
|
||||||
|
) -> Result<Instruction, AssembleError> {
|
||||||
|
let Some(immediate_token) = args.first() else {
|
||||||
|
return Err(AssembleError::MissingArgument(0));
|
||||||
|
};
|
||||||
|
|
||||||
|
let immediate = expect_token!(immediate_token, Immediate)?;
|
||||||
|
Ok(Instruction::Data(immediate))
|
||||||
|
}
|
||||||
|
|
||||||
|
fn build_segment_instruction(
|
||||||
|
args: &[crate::assembler::model::Token],
|
||||||
|
) -> Result<Instruction, AssembleError> {
|
||||||
|
let Some(immediate_token) = args.first() else {
|
||||||
|
return Err(AssembleError::MissingArgument(0));
|
||||||
|
};
|
||||||
|
|
||||||
|
let immediate = expect_token!(immediate_token, Immediate)?;
|
||||||
|
Ok(Instruction::Segment(immediate))
|
||||||
|
}
|
||||||
@@ -0,0 +1,368 @@
|
|||||||
|
use common::prelude::Register;
|
||||||
|
|
||||||
|
use crate::assembler::model::{Node, Opcode, Token};
|
||||||
|
use crate::{assembler::AssembleError, expect_token, expect_type, node};
|
||||||
|
|
||||||
|
pub fn expand_pseudo_ops(
|
||||||
|
mut nodes: Vec<Node>,
|
||||||
|
module: u64,
|
||||||
|
) -> Result<Vec<Node>, AssembleError> {
|
||||||
|
let mut result = Vec::<Node>::with_capacity(nodes.len());
|
||||||
|
|
||||||
|
for node in &mut nodes {
|
||||||
|
if try_expand(node.clone(), &mut result, module).is_err() {
|
||||||
|
result.push(node.clone());
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
Ok(result)
|
||||||
|
}
|
||||||
|
|
||||||
|
fn try_expand(
|
||||||
|
node: Node,
|
||||||
|
result: &mut Vec<Node>,
|
||||||
|
_module: u64,
|
||||||
|
) -> Result<(), AssembleError> {
|
||||||
|
match node.opcode() {
|
||||||
|
Opcode::Push => expand_push(&node, result)?,
|
||||||
|
Opcode::Pop => expand_pop(&node, result)?,
|
||||||
|
Opcode::Pusha => expand_pusha(&node, result)?,
|
||||||
|
Opcode::Popa => expand_popa(&node, result)?,
|
||||||
|
Opcode::Call => expand_call(&node, result)?,
|
||||||
|
Opcode::Return => expand_return(&node, result),
|
||||||
|
Opcode::Ldb | Opcode::Ldbs | Opcode::Ldh | Opcode::Ldhs | Opcode::Ldw => {
|
||||||
|
expand_ldx(&node, result)?;
|
||||||
|
}
|
||||||
|
Opcode::Stb | Opcode::Sth | Opcode::Stw => expand_stx(&node, result)?,
|
||||||
|
|
||||||
|
Opcode::Lwi => expand_lwi(&node, result)?,
|
||||||
|
Opcode::Resb | Opcode::Resh | Opcode::Resw => expand_resx(&node, result)?,
|
||||||
|
Opcode::Db | Opcode::Dh | Opcode::Dw => expand_dx(&node, result)?,
|
||||||
|
_ => result.push(node),
|
||||||
|
}
|
||||||
|
Ok(())
|
||||||
|
}
|
||||||
|
|
||||||
|
fn expand_push(current: &Node, nodes: &mut Vec<Node>) -> Result<(), AssembleError> {
|
||||||
|
let label = current.label();
|
||||||
|
let Ok(arg0) = current.arg(0) else {
|
||||||
|
return Err(AssembleError::Generic);
|
||||||
|
};
|
||||||
|
|
||||||
|
let reg = expect_type!(arg0, Register)?;
|
||||||
|
let spr = Token::Register(Register::Spr);
|
||||||
|
|
||||||
|
nodes.extend(vec![
|
||||||
|
node!(label, Opcode::SubI, spr, 4, spr),
|
||||||
|
node!(None, Opcode::Stw, reg, spr, 0),
|
||||||
|
]);
|
||||||
|
|
||||||
|
Ok(())
|
||||||
|
}
|
||||||
|
|
||||||
|
fn expand_pusha(current: &Node, nodes: &mut Vec<Node>) -> Result<(), AssembleError> {
|
||||||
|
let label = current.label();
|
||||||
|
let Ok(arg0) = current.arg(0) else {
|
||||||
|
return Err(AssembleError::Generic);
|
||||||
|
};
|
||||||
|
|
||||||
|
let count = expect_token!(arg0, Immediate)?;
|
||||||
|
let spr = Token::Register(Register::Spr);
|
||||||
|
let registers: Vec<Register> = Register::general();
|
||||||
|
|
||||||
|
nodes.push(node!(
|
||||||
|
label,
|
||||||
|
Opcode::SubI,
|
||||||
|
spr,
|
||||||
|
Token::Immediate(count * 4),
|
||||||
|
spr
|
||||||
|
));
|
||||||
|
|
||||||
|
nodes.extend((0..count).rev().map(|i| {
|
||||||
|
node!(
|
||||||
|
None,
|
||||||
|
Opcode::Stw,
|
||||||
|
Token::Register(registers[i as usize]),
|
||||||
|
spr,
|
||||||
|
Token::Immediate(i * 4)
|
||||||
|
)
|
||||||
|
}));
|
||||||
|
|
||||||
|
Ok(())
|
||||||
|
}
|
||||||
|
|
||||||
|
fn expand_popa(current: &Node, nodes: &mut Vec<Node>) -> Result<(), AssembleError> {
|
||||||
|
let label = current.label();
|
||||||
|
|
||||||
|
let Ok(arg0) = current.arg(0) else {
|
||||||
|
return Err(AssembleError::Generic);
|
||||||
|
};
|
||||||
|
|
||||||
|
let count = expect_token!(arg0, Immediate)?;
|
||||||
|
let spr = Token::Register(Register::Spr);
|
||||||
|
let registers: Vec<Register> = Register::general();
|
||||||
|
|
||||||
|
nodes.extend((0..count).rev().map(|i| {
|
||||||
|
node!(
|
||||||
|
{ if i == 0 { label.clone() } else { None } },
|
||||||
|
Opcode::Ldw,
|
||||||
|
spr,
|
||||||
|
Token::Register(registers[i as usize]),
|
||||||
|
Token::Immediate(i * 4)
|
||||||
|
)
|
||||||
|
}));
|
||||||
|
|
||||||
|
nodes.push(node!(
|
||||||
|
None,
|
||||||
|
Opcode::AddI,
|
||||||
|
spr,
|
||||||
|
Token::Immediate(count * 4),
|
||||||
|
spr
|
||||||
|
));
|
||||||
|
|
||||||
|
Ok(())
|
||||||
|
}
|
||||||
|
|
||||||
|
fn expand_call(current: &Node, nodes: &mut Vec<Node>) -> Result<(), AssembleError> {
|
||||||
|
let label = current.label();
|
||||||
|
|
||||||
|
let Ok(arg0) = current.arg(0) else {
|
||||||
|
return Err(AssembleError::Generic);
|
||||||
|
};
|
||||||
|
|
||||||
|
let addr = expect_type!(arg0, Symbol)?;
|
||||||
|
let spr = Token::Register(Register::Spr);
|
||||||
|
let pcx = Token::Register(Register::Pcx);
|
||||||
|
let zero = Token::Register(Register::Zero);
|
||||||
|
|
||||||
|
nodes.extend(vec![
|
||||||
|
node!(label, Opcode::SubI, spr, 4, spr),
|
||||||
|
node!(None, Opcode::Stw, pcx, spr, 0),
|
||||||
|
node!(None, Opcode::Jmp, addr, zero),
|
||||||
|
]);
|
||||||
|
|
||||||
|
Ok(())
|
||||||
|
}
|
||||||
|
|
||||||
|
fn expand_return(current: &Node, nodes: &mut Vec<Node>) {
|
||||||
|
let label = current.label();
|
||||||
|
let spr = Token::Register(Register::Spr);
|
||||||
|
let ret = Token::Register(Register::Ret);
|
||||||
|
|
||||||
|
nodes.extend(vec![
|
||||||
|
node!(label, Opcode::Ldw, spr, ret, 0),
|
||||||
|
node!(None, Opcode::AddI, spr, 4, spr),
|
||||||
|
node!(None, Opcode::Jmp, 4, ret),
|
||||||
|
]);
|
||||||
|
}
|
||||||
|
|
||||||
|
fn expand_pop(current: &Node, nodes: &mut Vec<Node>) -> Result<(), AssembleError> {
|
||||||
|
let label = current.label();
|
||||||
|
|
||||||
|
let Ok(arg0) = current.arg(0) else {
|
||||||
|
return Err(AssembleError::Generic);
|
||||||
|
};
|
||||||
|
|
||||||
|
let reg = expect_type!(arg0, Register)?;
|
||||||
|
let spr = Token::Register(Register::Spr);
|
||||||
|
|
||||||
|
nodes.extend(vec![
|
||||||
|
node!(label, Opcode::Ldw, spr, reg, 0),
|
||||||
|
node!(None, Opcode::AddI, spr, 4, spr),
|
||||||
|
]);
|
||||||
|
|
||||||
|
Ok(())
|
||||||
|
}
|
||||||
|
|
||||||
|
fn expand_ldx(current: &Node, nodes: &mut Vec<Node>) -> Result<(), AssembleError> {
|
||||||
|
let opcode = current.opcode();
|
||||||
|
let args: Vec<Token> = current.args().into_iter().take(3).collect();
|
||||||
|
|
||||||
|
let Some(name) = args.first() else {
|
||||||
|
return Err(AssembleError::MissingArgument(0));
|
||||||
|
};
|
||||||
|
|
||||||
|
let Some(reg) = args.get(1) else {
|
||||||
|
return Err(AssembleError::MissingArgument(1));
|
||||||
|
};
|
||||||
|
|
||||||
|
let Some(offset) = args.get(2) else {
|
||||||
|
return Err(AssembleError::MissingArgument(2));
|
||||||
|
};
|
||||||
|
|
||||||
|
let name = expect_type!(name, Symbol)?;
|
||||||
|
let reg = expect_type!(reg, Register)?;
|
||||||
|
let offset = expect_type!(offset, Immediate)?;
|
||||||
|
|
||||||
|
nodes.extend(vec![
|
||||||
|
node!(current.label(), Opcode::Lli, name, reg),
|
||||||
|
node!(None, Opcode::Lui, name, reg),
|
||||||
|
node!(None, opcode, reg, reg, offset),
|
||||||
|
]);
|
||||||
|
|
||||||
|
Ok(())
|
||||||
|
}
|
||||||
|
|
||||||
|
fn expand_stx(current: &Node, nodes: &mut Vec<Node>) -> Result<(), AssembleError> {
|
||||||
|
let opcode = current.opcode();
|
||||||
|
|
||||||
|
let args: Vec<Token> = current.args().into_iter().take(3).collect();
|
||||||
|
|
||||||
|
let Some(base) = args.first() else {
|
||||||
|
return Err(AssembleError::MissingArgument(0));
|
||||||
|
};
|
||||||
|
|
||||||
|
let Some(dest) = args.get(1) else {
|
||||||
|
return Err(AssembleError::MissingArgument(1));
|
||||||
|
};
|
||||||
|
|
||||||
|
let Some(offset) = args.get(2) else {
|
||||||
|
return Err(AssembleError::MissingArgument(2));
|
||||||
|
};
|
||||||
|
|
||||||
|
let base = expect_type!(base, Register)?;
|
||||||
|
let dest = expect_type!(dest, Symbol)?;
|
||||||
|
let offset = expect_type!(offset, Immediate)?;
|
||||||
|
let temp = Token::Register(Register::Acc);
|
||||||
|
|
||||||
|
nodes.extend(vec![
|
||||||
|
node!(current.label(), Opcode::Lli, dest, temp),
|
||||||
|
node!(None, Opcode::Lui, dest, temp),
|
||||||
|
node!(None, opcode, base, temp, offset),
|
||||||
|
]);
|
||||||
|
|
||||||
|
Ok(())
|
||||||
|
}
|
||||||
|
|
||||||
|
fn expand_lwi(current: &Node, nodes: &mut Vec<Node>) -> Result<(), AssembleError> {
|
||||||
|
let Ok(val) = current.arg(0) else {
|
||||||
|
return Err(AssembleError::MissingArgument(0));
|
||||||
|
};
|
||||||
|
|
||||||
|
let Ok(reg) = current.arg(1) else {
|
||||||
|
return Err(AssembleError::MissingArgument(1));
|
||||||
|
};
|
||||||
|
|
||||||
|
let val = expect_type!(val, Symbol, Immediate)?;
|
||||||
|
let reg = expect_type!(reg, Register)?;
|
||||||
|
|
||||||
|
nodes.extend(vec![
|
||||||
|
node!(current.label(), Opcode::Lli, val, reg),
|
||||||
|
node!(None, Opcode::Lui, val, reg),
|
||||||
|
]);
|
||||||
|
|
||||||
|
Ok(())
|
||||||
|
}
|
||||||
|
|
||||||
|
fn expand_resx(current: &Node, nodes: &mut Vec<Node>) -> Result<(), AssembleError> {
|
||||||
|
let Ok(region_label) = current.arg(0) else {
|
||||||
|
return Err(AssembleError::MissingArgument(0));
|
||||||
|
};
|
||||||
|
|
||||||
|
let Ok(size) = current.arg(1) else {
|
||||||
|
return Err(AssembleError::MissingArgument(1));
|
||||||
|
};
|
||||||
|
|
||||||
|
let region_label = expect_token!(region_label, Symbol)?;
|
||||||
|
let size = expect_token!(size, Immediate)?;
|
||||||
|
|
||||||
|
let units_per = match current.opcode() {
|
||||||
|
Opcode::Resb => 4,
|
||||||
|
Opcode::Resh => 2,
|
||||||
|
Opcode::Resw => 1,
|
||||||
|
_ => unreachable!(),
|
||||||
|
};
|
||||||
|
|
||||||
|
let mut buffer = vec![];
|
||||||
|
// push the inital node with the label
|
||||||
|
for _ in 0..size.div_ceil(units_per) {
|
||||||
|
// push the rest of the nodes
|
||||||
|
buffer.push(node!(None, Opcode::Data, 0));
|
||||||
|
}
|
||||||
|
buffer[0].symbol = Some(region_label);
|
||||||
|
nodes.extend(buffer);
|
||||||
|
|
||||||
|
Ok(())
|
||||||
|
}
|
||||||
|
|
||||||
|
fn expand_dx(current: &Node, nodes: &mut Vec<Node>) -> Result<(), AssembleError> {
|
||||||
|
let Ok(region_label) = current.arg(0) else {
|
||||||
|
return Err(AssembleError::MissingArgument(0));
|
||||||
|
};
|
||||||
|
|
||||||
|
let region_label = expect_token!(region_label, Symbol)?;
|
||||||
|
let size = match current.opcode() {
|
||||||
|
Opcode::Db => 4,
|
||||||
|
Opcode::Dh => 2,
|
||||||
|
Opcode::Dw => 1,
|
||||||
|
_ => unreachable!(),
|
||||||
|
};
|
||||||
|
|
||||||
|
let mut buffer = vec![];
|
||||||
|
|
||||||
|
let mut args = current.args();
|
||||||
|
let _label = args.remove(0);
|
||||||
|
|
||||||
|
for word in process_dx_data(args, size)? {
|
||||||
|
buffer.push(node!(None, Opcode::Data, Token::Immediate(word)));
|
||||||
|
}
|
||||||
|
buffer[0].symbol = Some(region_label);
|
||||||
|
|
||||||
|
nodes.extend(buffer);
|
||||||
|
Ok(())
|
||||||
|
}
|
||||||
|
|
||||||
|
fn process_dx_data(args: Vec<Token>, size: usize) -> Result<Vec<u32>, AssembleError> {
|
||||||
|
assert!(matches!(size, 1 | 2 | 4));
|
||||||
|
|
||||||
|
let mut buffer = Vec::<u8>::new();
|
||||||
|
|
||||||
|
// Process each token
|
||||||
|
for token in args {
|
||||||
|
match token {
|
||||||
|
Token::StringLit(mut s) => {
|
||||||
|
s.push('\0');
|
||||||
|
// Split string into chars and write as bytes
|
||||||
|
for ch in s.chars() {
|
||||||
|
// Convert char to bytes (UTF-8 encoding)
|
||||||
|
let mut char_buf = [0u8; 4];
|
||||||
|
let char_bytes = ch.encode_utf8(&mut char_buf);
|
||||||
|
buffer.extend_from_slice(char_bytes.as_bytes());
|
||||||
|
}
|
||||||
|
}
|
||||||
|
Token::Immediate(value) => {
|
||||||
|
// Split u32 into bytes (little-endian)
|
||||||
|
buffer.extend_from_slice(&value.to_be_bytes());
|
||||||
|
}
|
||||||
|
_ => {
|
||||||
|
return Err(AssembleError::Generic);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
// Pad buffer to alignment boundary with zeros
|
||||||
|
let remainder = buffer.len() % size;
|
||||||
|
if remainder != 0 {
|
||||||
|
let padding = size - remainder;
|
||||||
|
buffer.resize(buffer.len() + padding, 0);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
// Convert byte buffer to u32 chunks
|
||||||
|
// Pad final buffer to u32 boundary if needed
|
||||||
|
let remainder = buffer.len() % 4;
|
||||||
|
if remainder != 0 {
|
||||||
|
let padding = 4 - remainder;
|
||||||
|
buffer.resize(buffer.len() + padding, 0);
|
||||||
|
}
|
||||||
|
|
||||||
|
// Convert bytes to u32s efficiently using chunks_exact
|
||||||
|
let result = buffer
|
||||||
|
.chunks_exact(4)
|
||||||
|
.map(|chunk| {
|
||||||
|
// Convert 4 bytes to u32 (little-endian)
|
||||||
|
u32::from_be_bytes([chunk[0], chunk[1], chunk[2], chunk[3]])
|
||||||
|
})
|
||||||
|
.collect();
|
||||||
|
|
||||||
|
Ok(result)
|
||||||
|
}
|
||||||
@@ -0,0 +1,173 @@
|
|||||||
|
use std::str::FromStr;
|
||||||
|
|
||||||
|
use crate::assembler::AssembleError;
|
||||||
|
use crate::assembler::model::{Module, Opcode, Symbol, Token};
|
||||||
|
use common::prelude::Register;
|
||||||
|
|
||||||
|
pub fn lexer(mut program: String, module: u64) -> Result<Vec<Token>, AssembleError> {
|
||||||
|
let mut tokens = Vec::new();
|
||||||
|
|
||||||
|
let lines = program.lines();
|
||||||
|
let mut literal = String::new();
|
||||||
|
|
||||||
|
for line in lines {
|
||||||
|
for (i, token) in line.split_whitespace().enumerate() {
|
||||||
|
if token.starts_with("//") {
|
||||||
|
break;
|
||||||
|
}
|
||||||
|
|
||||||
|
if let Some(stripped) = token.strip_prefix('"') {
|
||||||
|
literal.push_str(stripped);
|
||||||
|
}
|
||||||
|
|
||||||
|
if !literal.is_empty() {
|
||||||
|
if !token.starts_with('"') {
|
||||||
|
if i > 0 {
|
||||||
|
literal.push(' ');
|
||||||
|
}
|
||||||
|
literal.push_str(token);
|
||||||
|
}
|
||||||
|
|
||||||
|
if token.ends_with('"') {
|
||||||
|
literal.pop(); // remove the closing quote
|
||||||
|
|
||||||
|
tokens.push(Token::StringLit(literal));
|
||||||
|
literal = String::new();
|
||||||
|
}
|
||||||
|
|
||||||
|
continue;
|
||||||
|
}
|
||||||
|
|
||||||
|
let token = token.trim_end_matches(',');
|
||||||
|
if token.is_empty() {
|
||||||
|
continue;
|
||||||
|
}
|
||||||
|
|
||||||
|
if let Some(token) = parse_register(token)? {
|
||||||
|
tokens.push(token);
|
||||||
|
} else if let Some(token) = parse_opcode(token)? {
|
||||||
|
tokens.push(token);
|
||||||
|
} else if let Some(token) = parse_hex(token)? {
|
||||||
|
tokens.push(token);
|
||||||
|
} else if let Some(token) = parse_octal(token)? {
|
||||||
|
tokens.push(token);
|
||||||
|
} else if let Some(token) = parse_binary(token)? {
|
||||||
|
tokens.push(token);
|
||||||
|
} else if let Some(token) = parse_decimal(token)? {
|
||||||
|
tokens.push(token);
|
||||||
|
} else if let Some(token) = parse_label(token, module)? {
|
||||||
|
tokens.push(token);
|
||||||
|
} else if let Some(token) = parse_symbol(token, module)? {
|
||||||
|
tokens.push(token);
|
||||||
|
} else {
|
||||||
|
return Err(AssembleError::Generic);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
println!("{:#?}", tokens);
|
||||||
|
|
||||||
|
Ok(tokens)
|
||||||
|
}
|
||||||
|
pub fn parse_register(token: &str) -> Result<Option<Token>, AssembleError> {
|
||||||
|
Ok(Register::try_from(token).map(Token::Register).ok())
|
||||||
|
}
|
||||||
|
|
||||||
|
pub fn parse_opcode(token: &str) -> Result<Option<Token>, AssembleError> {
|
||||||
|
if Opcode::OPCODES.contains(&token) {
|
||||||
|
Ok(Some(Token::Opcode(Opcode::from_str(token).expect(
|
||||||
|
"Opcode::from_str failed for a valid opcode token",
|
||||||
|
))))
|
||||||
|
} else {
|
||||||
|
Ok(None)
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
pub fn parse_hex(token: &str) -> Result<Option<Token>, AssembleError> {
|
||||||
|
if (token.len() < 3) | !token.starts_with("0x") {
|
||||||
|
return Ok(None);
|
||||||
|
}
|
||||||
|
|
||||||
|
let Some(lit) = &token.get(2..) else {
|
||||||
|
return Err(AssembleError::InvalidArg);
|
||||||
|
};
|
||||||
|
|
||||||
|
u32::from_str_radix(lit, 16).map_or(Err(AssembleError::Generic), |value| {
|
||||||
|
Ok(Some(Token::Immediate(value)))
|
||||||
|
})
|
||||||
|
}
|
||||||
|
|
||||||
|
pub fn parse_octal(token: &str) -> Result<Option<Token>, AssembleError> {
|
||||||
|
if (token.len() < 3) | !token.starts_with("0o") {
|
||||||
|
return Ok(None);
|
||||||
|
}
|
||||||
|
|
||||||
|
let Some(lit) = &token.get(2..) else {
|
||||||
|
return Err(AssembleError::InvalidArg);
|
||||||
|
};
|
||||||
|
|
||||||
|
u32::from_str_radix(lit, 8).map_or(Err(AssembleError::Generic), |value| {
|
||||||
|
Ok(Some(Token::Immediate(value)))
|
||||||
|
})
|
||||||
|
}
|
||||||
|
|
||||||
|
pub fn parse_binary(token: &str) -> Result<Option<Token>, AssembleError> {
|
||||||
|
if (token.len() < 3) | !token.starts_with("0b") {
|
||||||
|
return Ok(None);
|
||||||
|
}
|
||||||
|
|
||||||
|
let Some(lit) = &token.get(2..) else {
|
||||||
|
return Err(AssembleError::InvalidArg);
|
||||||
|
};
|
||||||
|
|
||||||
|
u32::from_str_radix(lit, 2).map_or(Err(AssembleError::Generic), |value| {
|
||||||
|
Ok(Some(Token::Immediate(value)))
|
||||||
|
})
|
||||||
|
}
|
||||||
|
|
||||||
|
pub fn parse_decimal(token: &str) -> Result<Option<Token>, AssembleError> {
|
||||||
|
let Ok(tok) = token.parse::<u32>() else {
|
||||||
|
return Ok(None);
|
||||||
|
};
|
||||||
|
|
||||||
|
Ok(Some(Token::Immediate(tok)))
|
||||||
|
}
|
||||||
|
|
||||||
|
pub fn parse_label(token: &str, module: u64) -> Result<Option<Token>, AssembleError> {
|
||||||
|
if token.ends_with(':') {
|
||||||
|
Ok(Some(Token::Symbol(Symbol {
|
||||||
|
name: token[0..token.len() - 1].to_string(),
|
||||||
|
module: Module::Resolved(module),
|
||||||
|
})))
|
||||||
|
} else {
|
||||||
|
Ok(None)
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
pub fn parse_symbol(token: &str, module: u64) -> Result<Option<Token>, AssembleError> {
|
||||||
|
let Some(tokc) = token.chars().next() else {
|
||||||
|
return Err(AssembleError::Generic); // TODO: What is this error?
|
||||||
|
};
|
||||||
|
|
||||||
|
if tokc.is_numeric() {
|
||||||
|
return Ok(None);
|
||||||
|
}
|
||||||
|
|
||||||
|
let mut split = token.splitn(2, "::");
|
||||||
|
let Some(symbol1) = split.next() else {
|
||||||
|
return Err(AssembleError::InvalidArg);
|
||||||
|
};
|
||||||
|
let symbol1 = symbol1.to_string();
|
||||||
|
|
||||||
|
if let Some(symbol2) = split.next() {
|
||||||
|
Ok(Some(Token::Symbol(Symbol {
|
||||||
|
name: symbol2.to_string(),
|
||||||
|
module: Module::Unresolved(symbol1),
|
||||||
|
})))
|
||||||
|
} else {
|
||||||
|
Ok(Some(Token::Symbol(Symbol {
|
||||||
|
name: symbol1,
|
||||||
|
module: Module::Resolved(module),
|
||||||
|
})))
|
||||||
|
}
|
||||||
|
}
|
||||||
@@ -0,0 +1,138 @@
|
|||||||
|
//! Macros used throughout the assembler
|
||||||
|
|
||||||
|
use crate::assembler::model::{Node, Opcode, Symbol, Token};
|
||||||
|
/// Parse DSA assembly code with optional formatting
|
||||||
|
///
|
||||||
|
/// # Examples
|
||||||
|
/// ```
|
||||||
|
/// // With formatting:
|
||||||
|
/// let nodes = dsa!(hash, "mov r1, {}", 42)?;
|
||||||
|
///
|
||||||
|
/// // Without formatting:
|
||||||
|
/// let nodes = dsa!(hash, "mov r1, 42")?;
|
||||||
|
/// ```
|
||||||
|
#[macro_export]
|
||||||
|
macro_rules! dsa {
|
||||||
|
// Version with formatting arguments
|
||||||
|
($hash:expr, $input:expr, $($args:expr),+) => {{
|
||||||
|
let input = format!($input, $($args),+);
|
||||||
|
let tokens = $crate::lexer::lexer(input, $hash)?;
|
||||||
|
let parsed = $crate::parser::Parser::parse_nodes(tokens)?;
|
||||||
|
parsed
|
||||||
|
}};
|
||||||
|
// Version without formatting
|
||||||
|
($hash:expr, $input:expr) => {{
|
||||||
|
let input = String::from($input);
|
||||||
|
let tokens = $crate::lexer::lexer(input, $hash)?;
|
||||||
|
let parsed = $crate::parser::Parser::parse_nodes(tokens)?;
|
||||||
|
parsed
|
||||||
|
}};
|
||||||
|
}
|
||||||
|
|
||||||
|
/// Creates a new Node with the given symbol, opcode, and tokens
|
||||||
|
#[macro_export]
|
||||||
|
macro_rules! node {
|
||||||
|
($symbol: expr, $opcode: expr, args: $tokens: expr) => {
|
||||||
|
$crate::assembler::model::Node::new($symbol.clone(), $opcode.clone(), $tokens.clone())
|
||||||
|
};
|
||||||
|
|
||||||
|
($symbol: expr, $opcode: expr, $($tokens: expr),+) => {
|
||||||
|
$crate::assembler::model::Node::new(
|
||||||
|
$symbol.clone(),
|
||||||
|
$opcode.clone(),
|
||||||
|
vec![$(node!(@convert_token $tokens)),+]
|
||||||
|
)
|
||||||
|
};
|
||||||
|
|
||||||
|
($symbol: expr, $opcode: expr) => {
|
||||||
|
$crate::assembler::model::Node::new(
|
||||||
|
$symbol.clone(),
|
||||||
|
$opcode.clone(),
|
||||||
|
Vec::new()
|
||||||
|
)
|
||||||
|
};
|
||||||
|
|
||||||
|
(@convert_token $token: literal) => {
|
||||||
|
$crate::assembler::model::Token::Immediate($token)
|
||||||
|
};
|
||||||
|
|
||||||
|
(@convert_token $token: expr) => {
|
||||||
|
$token.clone()
|
||||||
|
};
|
||||||
|
}
|
||||||
|
|
||||||
|
/// Extracts a specific token type from a token
|
||||||
|
#[macro_export]
|
||||||
|
macro_rules! expect_token {
|
||||||
|
($token:expr, Symbol) => {
|
||||||
|
match $token {
|
||||||
|
$crate::assembler::model::Token::Symbol(value) => Ok(value.clone()),
|
||||||
|
other => Err($crate::assembler::AssembleError::UnexpectedToken(
|
||||||
|
other.clone(),
|
||||||
|
$crate::assembler::model::TokenType::Symbol,
|
||||||
|
)),
|
||||||
|
}
|
||||||
|
};
|
||||||
|
($token:expr, Register) => {
|
||||||
|
match $token {
|
||||||
|
$crate::assembler::model::Token::Register(value) => Ok(value.clone()),
|
||||||
|
other => Err($crate::assembler::AssembleError::UnexpectedToken(
|
||||||
|
other.clone(),
|
||||||
|
$crate::assembler::model::TokenType::Register,
|
||||||
|
)),
|
||||||
|
}
|
||||||
|
};
|
||||||
|
($token:expr, Immediate) => {
|
||||||
|
match $token {
|
||||||
|
$crate::assembler::model::Token::Immediate(value) => Ok(value.clone()),
|
||||||
|
other => Err($crate::assembler::AssembleError::UnexpectedToken(
|
||||||
|
other.clone(),
|
||||||
|
$crate::assembler::model::TokenType::Immediate,
|
||||||
|
)),
|
||||||
|
}
|
||||||
|
};
|
||||||
|
($token:expr, StringLit) => {
|
||||||
|
match $token {
|
||||||
|
$crate::assembler::model::Token::StringLit(value) => Ok(value.clone()),
|
||||||
|
other => Err($crate::assembler::AssembleError::UnexpectedToken(
|
||||||
|
other.clone(),
|
||||||
|
$crate::assembler::model::TokenType::StringLit,
|
||||||
|
)),
|
||||||
|
}
|
||||||
|
};
|
||||||
|
($token:expr, Opcode) => {
|
||||||
|
match $token {
|
||||||
|
$crate::assembler::model::Token::Opcode(value) => Ok(value.clone()),
|
||||||
|
other => Err($crate::assembler::AssembleError::UnexpectedToken(
|
||||||
|
other.clone(),
|
||||||
|
$crate::assembler::model::TokenType::Opcode,
|
||||||
|
)),
|
||||||
|
}
|
||||||
|
};
|
||||||
|
}
|
||||||
|
|
||||||
|
/// Checks if a token matches any of the specified types
|
||||||
|
#[macro_export]
|
||||||
|
macro_rules! expect_type {
|
||||||
|
($token:expr, $($variant:ident),+) => {{
|
||||||
|
let token = $token;
|
||||||
|
match &token {
|
||||||
|
$(
|
||||||
|
$crate::assembler::model::Token::$variant(_) => Ok(token.clone()),
|
||||||
|
)+
|
||||||
|
other => {
|
||||||
|
let expected_type = expect_type!(@get_first_type $($variant),+);
|
||||||
|
Err($crate::assembler::AssembleError::UnexpectedToken(
|
||||||
|
other.clone().clone(),
|
||||||
|
expected_type,
|
||||||
|
))
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}};
|
||||||
|
|
||||||
|
(@get_first_type Symbol $(, $rest:ident)*) => { $crate::assembler::model::TokenType::Symbol };
|
||||||
|
(@get_first_type Register $(, $rest:ident)*) => { $crate::assembler::model::TokenType::Register };
|
||||||
|
(@get_first_type Immediate $(, $rest:ident)*) => { $crate::assembler::model::TokenType::Immediate };
|
||||||
|
(@get_first_type StringLit $(, $rest:ident)*) => { $crate::assembler::model::TokenType::StringLit };
|
||||||
|
(@get_first_type Opcode $(, $rest:ident)*) => { $crate::assembler::model::TokenType::Opcode };
|
||||||
|
}
|
||||||
@@ -0,0 +1,266 @@
|
|||||||
|
#![allow(dead_code, unused)]
|
||||||
|
|
||||||
|
use std::{
|
||||||
|
collections::HashSet,
|
||||||
|
fmt, fs,
|
||||||
|
hash::{DefaultHasher, Hash, Hasher},
|
||||||
|
path::{Path, PathBuf},
|
||||||
|
sync::{Arc, Mutex, mpsc},
|
||||||
|
thread,
|
||||||
|
};
|
||||||
|
|
||||||
|
use common::prelude::Instruction;
|
||||||
|
|
||||||
|
// TODO: Use an actual logging or tracing library for pretty (scoped) output.
|
||||||
|
fn log(message: &str) {
|
||||||
|
println!("\x1b[32mINFO:\x1b[0m {message}");
|
||||||
|
}
|
||||||
|
|
||||||
|
// Module declarations
|
||||||
|
#[macro_use]
|
||||||
|
pub mod macros;
|
||||||
|
|
||||||
|
#[allow(clippy::module_inception)]
|
||||||
|
pub mod assembler;
|
||||||
|
pub mod codegen;
|
||||||
|
pub mod expand;
|
||||||
|
pub mod lexer;
|
||||||
|
pub mod model;
|
||||||
|
pub mod parser;
|
||||||
|
pub mod resolver;
|
||||||
|
|
||||||
|
// Re-exports
|
||||||
|
pub use self::{
|
||||||
|
codegen::codegen,
|
||||||
|
expand::expand_pseudo_ops,
|
||||||
|
lexer::lexer,
|
||||||
|
model::{Module, Node, Opcode, Symbol, Token, TokenType},
|
||||||
|
parser::{Parser, Program},
|
||||||
|
resolver::{create_sections, resolve_dependencies, resolve_symbols},
|
||||||
|
};
|
||||||
|
|
||||||
|
use crate::util::logging::{Entry, Logger};
|
||||||
|
|
||||||
|
pub struct CompilerEngine {
|
||||||
|
result_tx: mpsc::Sender<Result<Vec<Instruction>, AssembleError>>,
|
||||||
|
result_rx: Option<mpsc::Receiver<Result<Vec<Instruction>, AssembleError>>>,
|
||||||
|
is_running: bool,
|
||||||
|
}
|
||||||
|
|
||||||
|
impl CompilerEngine {
|
||||||
|
#[must_use]
|
||||||
|
pub fn new() -> Self {
|
||||||
|
let (tx, rx) = mpsc::channel();
|
||||||
|
Self {
|
||||||
|
result_tx: tx,
|
||||||
|
result_rx: Some(rx),
|
||||||
|
is_running: false,
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
/// Start the compilation process in a separate thread
|
||||||
|
pub fn start_compilation(&mut self, src: &Path) {
|
||||||
|
if self.is_running {
|
||||||
|
return;
|
||||||
|
}
|
||||||
|
|
||||||
|
let src = src.to_path_buf();
|
||||||
|
let tx = self.result_tx.clone();
|
||||||
|
|
||||||
|
thread::spawn(move || {
|
||||||
|
let result = assemble(&src);
|
||||||
|
tx.send(result)
|
||||||
|
.expect("Failed to send compilation result from worker thread");
|
||||||
|
});
|
||||||
|
|
||||||
|
self.is_running = true;
|
||||||
|
}
|
||||||
|
|
||||||
|
/// Check if compilation is complete and get the result
|
||||||
|
pub fn try_get_result(&mut self) -> Option<Result<Vec<Instruction>, AssembleError>> {
|
||||||
|
if !self.is_running {
|
||||||
|
return None;
|
||||||
|
}
|
||||||
|
|
||||||
|
match self
|
||||||
|
.result_rx
|
||||||
|
.as_ref()
|
||||||
|
.expect("result_rx should be Some while compilation is running")
|
||||||
|
.try_recv()
|
||||||
|
{
|
||||||
|
Ok(result) => {
|
||||||
|
self.is_running = false;
|
||||||
|
Some(result)
|
||||||
|
}
|
||||||
|
Err(mpsc::TryRecvError::Empty) => None,
|
||||||
|
Err(mpsc::TryRecvError::Disconnected) => {
|
||||||
|
self.is_running = false;
|
||||||
|
Some(Err(AssembleError::Generic))
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
/// Block until compilation is complete and return the result
|
||||||
|
pub fn wait_for_result(&mut self) -> Result<Vec<Instruction>, AssembleError> {
|
||||||
|
if !self.is_running {
|
||||||
|
return Err(AssembleError::Generic);
|
||||||
|
}
|
||||||
|
|
||||||
|
if let Ok(result) = self
|
||||||
|
.result_rx
|
||||||
|
.take()
|
||||||
|
.expect("result_rx should be Some while waiting for compilation result")
|
||||||
|
.recv()
|
||||||
|
{
|
||||||
|
self.is_running = false;
|
||||||
|
result
|
||||||
|
} else {
|
||||||
|
self.is_running = false;
|
||||||
|
Err(AssembleError::Generic)
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
fn assemble(src: &Path) -> Result<Vec<Instruction>, AssembleError> {
|
||||||
|
let mut modules = HashSet::new();
|
||||||
|
let mut program = Program::new();
|
||||||
|
|
||||||
|
let hash = quick_hash(src);
|
||||||
|
|
||||||
|
if modules.contains(&hash) {
|
||||||
|
return Ok(vec![]);
|
||||||
|
}
|
||||||
|
|
||||||
|
prepare_dependency(src, &mut modules, &mut program)?;
|
||||||
|
|
||||||
|
let mut nodes = program.nodes.clone();
|
||||||
|
|
||||||
|
create_sections(&mut nodes)?;
|
||||||
|
resolve_symbols(&mut nodes)?;
|
||||||
|
|
||||||
|
let instructions = codegen(nodes)?;
|
||||||
|
Ok(instructions)
|
||||||
|
}
|
||||||
|
|
||||||
|
impl Default for CompilerEngine {
|
||||||
|
fn default() -> Self {
|
||||||
|
Self::new()
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
fn prepare_dependency(
|
||||||
|
path: &Path,
|
||||||
|
modules: &mut HashSet<u64>,
|
||||||
|
program: &mut Program,
|
||||||
|
) -> Result<(), AssembleError> {
|
||||||
|
let filename = path
|
||||||
|
.file_name()
|
||||||
|
.and_then(|n| n.to_str())
|
||||||
|
.expect("Failed to get file name from path");
|
||||||
|
|
||||||
|
if let Ok(path) = path.canonicalize() {
|
||||||
|
log(&format!(
|
||||||
|
"{:20} {:20} [{}]",
|
||||||
|
"Building",
|
||||||
|
filename,
|
||||||
|
path.display()
|
||||||
|
));
|
||||||
|
}
|
||||||
|
|
||||||
|
let src = fs::read_to_string(path)
|
||||||
|
.map_err(|_| AssembleError::InvalidFile(path.to_path_buf()))?;
|
||||||
|
let file_hash = quick_hash(path);
|
||||||
|
|
||||||
|
log(&format!("{:20} {:20}", "Tokenising", filename));
|
||||||
|
let tokens = lexer::lexer(src, file_hash)?;
|
||||||
|
|
||||||
|
log(&format!("{:20} {:20}", "Parsing", filename));
|
||||||
|
let parsed = Parser::parse_nodes(tokens)?;
|
||||||
|
|
||||||
|
log(&format!("{:20} {:20}", "Resolving Deps", filename));
|
||||||
|
// Get the parent directory of the source file to use as the base directory
|
||||||
|
let base_dir = path
|
||||||
|
.parent()
|
||||||
|
.ok_or_else(|| AssembleError::InvalidFile(path.to_path_buf()))?;
|
||||||
|
let mut nodes = expand_pseudo_ops(parsed, file_hash)?;
|
||||||
|
nodes = resolve_dependencies(nodes, base_dir)?;
|
||||||
|
|
||||||
|
let deps = Parser::get_dependencies(&nodes, path)?;
|
||||||
|
|
||||||
|
log(&format!(
|
||||||
|
"{:20} {:20}",
|
||||||
|
"Expanding PseudoInstructions", filename
|
||||||
|
));
|
||||||
|
|
||||||
|
// add a section instruction
|
||||||
|
nodes.insert(
|
||||||
|
0,
|
||||||
|
node!(None, Opcode::Segment, Token::Immediate(file_hash as u32)),
|
||||||
|
);
|
||||||
|
|
||||||
|
for n in &nodes {
|
||||||
|
println!("{n}");
|
||||||
|
}
|
||||||
|
|
||||||
|
program.add_module(nodes);
|
||||||
|
|
||||||
|
for dep in deps {
|
||||||
|
log(&format!(
|
||||||
|
"{:20} {:20}",
|
||||||
|
"Including",
|
||||||
|
dep.file_name()
|
||||||
|
.and_then(|f| f.to_str())
|
||||||
|
.expect("Dependency path has no file name or is not valid UTF-8")
|
||||||
|
));
|
||||||
|
|
||||||
|
let dep_hash = quick_hash(&dep);
|
||||||
|
if modules.insert(dep_hash) {
|
||||||
|
prepare_dependency(dep.as_path(), modules, program)?;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
Ok(())
|
||||||
|
}
|
||||||
|
|
||||||
|
#[derive(Debug, Clone)]
|
||||||
|
pub enum AssembleError {
|
||||||
|
Generic,
|
||||||
|
UnexpectedEof,
|
||||||
|
InvalidFile(PathBuf),
|
||||||
|
UnexpectedToken(Token, TokenType),
|
||||||
|
InvalidArg,
|
||||||
|
UndefinedSymbol(Symbol),
|
||||||
|
/// Contains the nth element missing from the instruction.
|
||||||
|
MissingArgument(u8),
|
||||||
|
}
|
||||||
|
|
||||||
|
impl fmt::Display for AssembleError {
|
||||||
|
fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
|
||||||
|
match self {
|
||||||
|
Self::Generic => write!(f, "Generic error"),
|
||||||
|
Self::UnexpectedToken(tok, expected) => {
|
||||||
|
write!(f, "Unexpected token {tok:?}, expected {expected:?}")
|
||||||
|
}
|
||||||
|
Self::UnexpectedEof => write!(f, "Unexpected end of file"),
|
||||||
|
Self::InvalidFile(path) => write!(f, "Invalid file `{}`", path.display()),
|
||||||
|
Self::InvalidArg => write!(f, "Invalid argument"),
|
||||||
|
Self::UndefinedSymbol(symbol) => {
|
||||||
|
write!(f, "Undefined symbol {symbol}")
|
||||||
|
}
|
||||||
|
Self::MissingArgument(n) => {
|
||||||
|
write!(f, "Missing argument #{n} from instruction arguments.")
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
fn quick_hash(value: &Path) -> u64 {
|
||||||
|
let mut hasher = DefaultHasher::new();
|
||||||
|
value
|
||||||
|
.canonicalize()
|
||||||
|
.expect("Failed to canonicalize path for quick_hash")
|
||||||
|
.to_str()
|
||||||
|
.hash(&mut hasher);
|
||||||
|
|
||||||
|
hasher.finish()
|
||||||
|
}
|
||||||
@@ -1,285 +1,84 @@
|
|||||||
//! This module contains instructions for tokenisation.
|
|
||||||
|
|
||||||
use std::{fmt, str::FromStr};
|
use std::{fmt, str::FromStr};
|
||||||
|
|
||||||
use common::prelude::{ITypeArgs, Instruction, Interrupt, RTypeArgs};
|
use common::prelude::Register;
|
||||||
|
|
||||||
use crate::{
|
use crate::assembler::AssembleError;
|
||||||
error::{AssembleError, AssembleErrorKind},
|
|
||||||
source::source_info::SourceInfo,
|
|
||||||
};
|
|
||||||
|
|
||||||
#[derive(Debug, Clone, Copy, PartialEq, Eq, Hash)]
|
#[derive(Debug, Clone)]
|
||||||
pub enum Opcode {
|
pub struct Node {
|
||||||
Nop,
|
pub symbol: Option<Symbol>,
|
||||||
Mov,
|
pub opcode: Opcode,
|
||||||
Movs,
|
pub tokens: Vec<Token>,
|
||||||
Ldb,
|
|
||||||
Ldbs,
|
|
||||||
Ldh,
|
|
||||||
Ldhs,
|
|
||||||
Ldw,
|
|
||||||
Stb,
|
|
||||||
Sth,
|
|
||||||
Stw,
|
|
||||||
Lli,
|
|
||||||
Lui,
|
|
||||||
Jmp,
|
|
||||||
Jeq,
|
|
||||||
Jne,
|
|
||||||
Jgt,
|
|
||||||
Jge,
|
|
||||||
Jlt,
|
|
||||||
Jle,
|
|
||||||
Cmp,
|
|
||||||
Inc,
|
|
||||||
Dec,
|
|
||||||
Shl,
|
|
||||||
Shr,
|
|
||||||
Add,
|
|
||||||
Sub,
|
|
||||||
And,
|
|
||||||
Or,
|
|
||||||
Not,
|
|
||||||
Xor,
|
|
||||||
Nand,
|
|
||||||
Nor,
|
|
||||||
Xnor,
|
|
||||||
Int,
|
|
||||||
Irt,
|
|
||||||
Hlt,
|
|
||||||
AddI,
|
|
||||||
SubI,
|
|
||||||
|
|
||||||
// Pseudo-instructions
|
|
||||||
Db,
|
|
||||||
Dh,
|
|
||||||
Dw,
|
|
||||||
Resb,
|
|
||||||
Resh,
|
|
||||||
Resw,
|
|
||||||
Push,
|
|
||||||
Pop,
|
|
||||||
Pusha,
|
|
||||||
Popa,
|
|
||||||
Lwi,
|
|
||||||
Call,
|
|
||||||
Return,
|
|
||||||
|
|
||||||
// Meta instructions (these aren't present in the binary as instructions)
|
|
||||||
Include,
|
|
||||||
Data,
|
|
||||||
Segment,
|
|
||||||
}
|
}
|
||||||
|
|
||||||
#[derive(Debug)]
|
impl Node {
|
||||||
pub enum OpcodeFromStrError {
|
#[must_use]
|
||||||
InvalidRegister(&'static str),
|
pub const fn new(symbol: Option<Symbol>, opcode: Opcode, tokens: Vec<Token>) -> Self {
|
||||||
InvalidOpcode(String),
|
Self {
|
||||||
}
|
symbol,
|
||||||
|
opcode,
|
||||||
impl std::fmt::Display for OpcodeFromStrError {
|
tokens,
|
||||||
fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
|
|
||||||
match self {
|
|
||||||
Self::InvalidRegister(reg) => write!(f, "register does not exist: {reg}"),
|
|
||||||
Self::InvalidOpcode(op) => write!(f, "instruction does not exist: {op}"),
|
|
||||||
}
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
impl std::error::Error for OpcodeFromStrError {}
|
|
||||||
|
|
||||||
impl Opcode {
|
|
||||||
pub const OPCODES: &[&str] = &[
|
|
||||||
// Real instructions (0x00-0x26)
|
|
||||||
"nop", "mov", "movs", "ldb", "ldbs", "ldh", "ldhs", "ldw", "stb", "sth", "stw",
|
|
||||||
"lli", "lui", "jmp", "jeq", "jne", "jgt", "jge", "jlt", "jle", "cmp", "inc",
|
|
||||||
"dec", "shl", "shr", "add", "sub", "and", "or", "not", "xor", "nand", "nor",
|
|
||||||
"xnor", "int", "irt", "hlt", "addi", "subi", // Pseudo-instructions
|
|
||||||
"db", "dh", "dw", "resb", "resh", "resw", "push", "pop", "lwi", "call", "return",
|
|
||||||
"pusha", "popa", // meta instructions
|
|
||||||
"include",
|
|
||||||
];
|
|
||||||
|
|
||||||
pub fn to_instruction(
|
|
||||||
&self,
|
|
||||||
source_info: SourceInfo,
|
|
||||||
) -> Result<Instruction, AssembleError> {
|
|
||||||
match self {
|
|
||||||
Self::Nop => Ok(Instruction::Nop),
|
|
||||||
Self::Mov => Ok(Instruction::Mov(RTypeArgs::default())),
|
|
||||||
Self::Movs => Ok(Instruction::MovSigned(RTypeArgs::default())),
|
|
||||||
Self::Ldb => Ok(Instruction::LoadByte(ITypeArgs::default())),
|
|
||||||
Self::Ldbs => Ok(Instruction::LoadByteSigned(ITypeArgs::default())),
|
|
||||||
Self::Ldh => Ok(Instruction::LoadHalfword(ITypeArgs::default())),
|
|
||||||
Self::Ldhs => Ok(Instruction::LoadHalfwordSigned(ITypeArgs::default())),
|
|
||||||
Self::Ldw => Ok(Instruction::LoadWord(ITypeArgs::default())),
|
|
||||||
Self::Stb => Ok(Instruction::StoreByte(ITypeArgs::default())),
|
|
||||||
Self::Sth => Ok(Instruction::StoreHalfword(ITypeArgs::default())),
|
|
||||||
Self::Stw => Ok(Instruction::StoreWord(ITypeArgs::default())),
|
|
||||||
Self::Lli => Ok(Instruction::LoadLowerImmediate(ITypeArgs::default())),
|
|
||||||
Self::Lui => Ok(Instruction::LoadUpperImmediate(ITypeArgs::default())),
|
|
||||||
Self::Jmp => Ok(Instruction::Jump(ITypeArgs::default())),
|
|
||||||
Self::Jeq => Ok(Instruction::JumpEq(ITypeArgs::default())),
|
|
||||||
Self::Jne => Ok(Instruction::JumpNeq(ITypeArgs::default())),
|
|
||||||
Self::Jgt => Ok(Instruction::JumpGt(ITypeArgs::default())),
|
|
||||||
Self::Jge => Ok(Instruction::JumpGe(ITypeArgs::default())),
|
|
||||||
Self::Jlt => Ok(Instruction::JumpLt(ITypeArgs::default())),
|
|
||||||
Self::Jle => Ok(Instruction::JumpLe(ITypeArgs::default())),
|
|
||||||
Self::Cmp => Ok(Instruction::Compare(RTypeArgs::default())),
|
|
||||||
Self::Inc => Ok(Instruction::Increment(RTypeArgs::default())),
|
|
||||||
Self::Dec => Ok(Instruction::Decrement(RTypeArgs::default())),
|
|
||||||
Self::Shl => Ok(Instruction::ShiftLeft(RTypeArgs::default())),
|
|
||||||
Self::Shr => Ok(Instruction::ShiftRight(RTypeArgs::default())),
|
|
||||||
Self::Add => Ok(Instruction::Add(RTypeArgs::default())),
|
|
||||||
Self::Sub => Ok(Instruction::Sub(RTypeArgs::default())),
|
|
||||||
Self::And => Ok(Instruction::And(RTypeArgs::default())),
|
|
||||||
Self::Or => Ok(Instruction::Or(RTypeArgs::default())),
|
|
||||||
Self::Not => Ok(Instruction::Not(RTypeArgs::default())),
|
|
||||||
Self::Xor => Ok(Instruction::Xor(RTypeArgs::default())),
|
|
||||||
Self::Nand => Ok(Instruction::Nand(RTypeArgs::default())),
|
|
||||||
Self::Nor => Ok(Instruction::Nor(RTypeArgs::default())),
|
|
||||||
Self::Xnor => Ok(Instruction::Xnor(RTypeArgs::default())),
|
|
||||||
Self::Int => Ok(Instruction::Interrupt(Interrupt::default())),
|
|
||||||
Self::Irt => Ok(Instruction::IntReturn),
|
|
||||||
Self::Hlt => Ok(Instruction::Halt),
|
|
||||||
Self::AddI => Ok(Instruction::AddImmediate(ITypeArgs::default())),
|
|
||||||
Self::SubI => Ok(Instruction::SubImmediate(ITypeArgs::default())),
|
|
||||||
Self::Segment => Ok(Instruction::Segment(0)),
|
|
||||||
_ => Err(AssembleError::new_source_error(
|
|
||||||
source_info,
|
|
||||||
AssembleErrorKind::Unimplemented(
|
|
||||||
"Opcode::to_instruction called on an instruction that does not exist in common.",
|
|
||||||
),
|
|
||||||
)),
|
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
#[must_use]
|
#[must_use]
|
||||||
pub const fn to_opcode_value(&self) -> Option<u8> {
|
pub fn label(&self) -> Option<Symbol> {
|
||||||
match self {
|
self.symbol.clone()
|
||||||
Self::Nop => Some(0x00),
|
|
||||||
Self::Mov => Some(0x01),
|
|
||||||
Self::Movs => Some(0x02),
|
|
||||||
Self::Ldb => Some(0x03),
|
|
||||||
Self::Ldbs => Some(0x04),
|
|
||||||
Self::Ldh => Some(0x05),
|
|
||||||
Self::Ldhs => Some(0x06),
|
|
||||||
Self::Ldw => Some(0x07),
|
|
||||||
Self::Stb => Some(0x08),
|
|
||||||
Self::Sth => Some(0x09),
|
|
||||||
Self::Stw => Some(0x0A),
|
|
||||||
Self::Lli => Some(0x0B),
|
|
||||||
Self::Lui => Some(0x0C),
|
|
||||||
Self::Jmp => Some(0x0D),
|
|
||||||
Self::Jeq => Some(0x0E),
|
|
||||||
Self::Jne => Some(0x0F),
|
|
||||||
Self::Jgt => Some(0x10),
|
|
||||||
Self::Jge => Some(0x11),
|
|
||||||
Self::Jlt => Some(0x12),
|
|
||||||
Self::Jle => Some(0x13),
|
|
||||||
Self::Cmp => Some(0x14),
|
|
||||||
Self::Inc => Some(0x15),
|
|
||||||
Self::Dec => Some(0x16),
|
|
||||||
Self::Shl => Some(0x17),
|
|
||||||
Self::Shr => Some(0x18),
|
|
||||||
Self::Add => Some(0x19),
|
|
||||||
Self::Sub => Some(0x1A),
|
|
||||||
Self::And => Some(0x1B),
|
|
||||||
Self::Or => Some(0x1C),
|
|
||||||
Self::Not => Some(0x1D),
|
|
||||||
Self::Xor => Some(0x1E),
|
|
||||||
Self::Nand => Some(0x1F),
|
|
||||||
Self::Nor => Some(0x20),
|
|
||||||
Self::Xnor => Some(0x21),
|
|
||||||
Self::Int => Some(0x22),
|
|
||||||
Self::Irt => Some(0x23),
|
|
||||||
Self::Hlt => Some(0x24),
|
|
||||||
Self::AddI => Some(0x25),
|
|
||||||
Self::SubI => Some(0x26),
|
|
||||||
// TODO: Maybe recombine pseudos?
|
|
||||||
Self::Segment => Some(0x27),
|
|
||||||
// Pseudo-instructions don't have opcode values
|
|
||||||
_ => None,
|
|
||||||
}
|
|
||||||
}
|
}
|
||||||
|
|
||||||
#[must_use]
|
#[must_use]
|
||||||
pub const fn is_pseudo_instruction(&self) -> bool {
|
pub const fn opcode(&self) -> Opcode {
|
||||||
matches!(
|
self.opcode
|
||||||
self,
|
}
|
||||||
Self::Db
|
|
||||||
| Self::Dh
|
#[must_use]
|
||||||
| Self::Dw
|
pub fn args(&self) -> Vec<Token> {
|
||||||
| Self::Resb
|
self.tokens.clone()
|
||||||
| Self::Resh
|
}
|
||||||
| Self::Resw
|
|
||||||
| Self::Push
|
pub fn arg(&self, index: usize) -> Result<Token, AssembleError> {
|
||||||
| Self::Pop
|
self.args()
|
||||||
| Self::Lwi
|
.get(index)
|
||||||
|
.cloned()
|
||||||
|
.ok_or(AssembleError::InvalidArg)
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
impl fmt::Display for Node {
|
||||||
|
fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
|
||||||
|
let symbol = self
|
||||||
|
.label()
|
||||||
|
.as_ref()
|
||||||
|
.map_or_else(String::new, |symbol| format!("{symbol}:\n"));
|
||||||
|
|
||||||
|
let args = self
|
||||||
|
.args()
|
||||||
|
.into_iter()
|
||||||
|
.map(|arg| arg.to_string())
|
||||||
|
.collect::<Vec<_>>()
|
||||||
|
.join(" ");
|
||||||
|
|
||||||
|
write!(
|
||||||
|
f,
|
||||||
|
"\x1b[93m{} \t\x1b[94m{} \x1b[37m{} \x1b[0m",
|
||||||
|
symbol,
|
||||||
|
self.opcode(),
|
||||||
|
args,
|
||||||
)
|
)
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
impl FromStr for Opcode {
|
impl fmt::Display for Symbol {
|
||||||
type Err = OpcodeFromStrError;
|
fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
|
||||||
|
write!(f, "{} [ID:{}]", self.name, self.module)
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
fn from_str(s: &str) -> Result<Self, Self::Err> {
|
impl fmt::Display for Module {
|
||||||
match s.to_lowercase().as_str() {
|
fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
|
||||||
"nop" => Ok(Self::Nop),
|
match self {
|
||||||
"mov" => Ok(Self::Mov),
|
Self::Unresolved(name) => write!(f, "{name}"),
|
||||||
"movs" => Ok(Self::Movs),
|
Self::Resolved(name) => write!(f, "{name}"),
|
||||||
"ldb" => Ok(Self::Ldb),
|
|
||||||
"ldbs" => Ok(Self::Ldbs),
|
|
||||||
"ldh" => Ok(Self::Ldh),
|
|
||||||
"ldhs" => Ok(Self::Ldhs),
|
|
||||||
"ldw" => Ok(Self::Ldw),
|
|
||||||
"stb" => Ok(Self::Stb),
|
|
||||||
"sth" => Ok(Self::Sth),
|
|
||||||
"stw" => Ok(Self::Stw),
|
|
||||||
"lli" => Ok(Self::Lli),
|
|
||||||
"lui" => Ok(Self::Lui),
|
|
||||||
"jmp" => Ok(Self::Jmp),
|
|
||||||
"jeq" => Ok(Self::Jeq),
|
|
||||||
"jne" => Ok(Self::Jne),
|
|
||||||
"jgt" => Ok(Self::Jgt),
|
|
||||||
"jge" => Ok(Self::Jge),
|
|
||||||
"jlt" => Ok(Self::Jlt),
|
|
||||||
"jle" => Ok(Self::Jle),
|
|
||||||
"cmp" => Ok(Self::Cmp),
|
|
||||||
"inc" => Ok(Self::Inc),
|
|
||||||
"dec" => Ok(Self::Dec),
|
|
||||||
"shl" => Ok(Self::Shl),
|
|
||||||
"shr" => Ok(Self::Shr),
|
|
||||||
"add" => Ok(Self::Add),
|
|
||||||
"sub" => Ok(Self::Sub),
|
|
||||||
"and" => Ok(Self::And),
|
|
||||||
"or" => Ok(Self::Or),
|
|
||||||
"not" => Ok(Self::Not),
|
|
||||||
"xor" => Ok(Self::Xor),
|
|
||||||
"nand" => Ok(Self::Nand),
|
|
||||||
"nor" => Ok(Self::Nor),
|
|
||||||
"xnor" => Ok(Self::Xnor),
|
|
||||||
"int" => Ok(Self::Int),
|
|
||||||
"irt" => Ok(Self::Irt),
|
|
||||||
"hlt" => Ok(Self::Hlt),
|
|
||||||
"addi" => Ok(Self::AddI),
|
|
||||||
"subi" => Ok(Self::SubI),
|
|
||||||
"db" => Ok(Self::Db),
|
|
||||||
"dh" => Ok(Self::Dh),
|
|
||||||
"dw" => Ok(Self::Dw),
|
|
||||||
"resb" => Ok(Self::Resb),
|
|
||||||
"resh" => Ok(Self::Resh),
|
|
||||||
"resw" => Ok(Self::Resw),
|
|
||||||
"push" => Ok(Self::Push),
|
|
||||||
"pop" => Ok(Self::Pop),
|
|
||||||
"lwi" => Ok(Self::Lwi),
|
|
||||||
"include" => Ok(Self::Include),
|
|
||||||
"call" => Ok(Self::Call),
|
|
||||||
"return" => Ok(Self::Return),
|
|
||||||
"pusha" => Ok(Self::Pusha),
|
|
||||||
"popa" => Ok(Self::Popa),
|
|
||||||
_ => Err(OpcodeFromStrError::InvalidOpcode(s.to_string())),
|
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
@@ -347,3 +146,293 @@ impl fmt::Display for Opcode {
|
|||||||
}
|
}
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
|
#[derive(Debug, Clone, Eq)]
|
||||||
|
pub struct Symbol {
|
||||||
|
pub name: String,
|
||||||
|
pub module: Module,
|
||||||
|
}
|
||||||
|
|
||||||
|
impl std::hash::Hash for Symbol {
|
||||||
|
fn hash<H: std::hash::Hasher>(&self, state: &mut H) {
|
||||||
|
self.name.hash(state);
|
||||||
|
self.module.hash(state);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
impl PartialEq for Symbol {
|
||||||
|
fn eq(&self, other: &Self) -> bool {
|
||||||
|
self.name == other.name && self.module == other.module
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
#[derive(Debug, Clone, PartialEq, Eq, Hash)]
|
||||||
|
pub enum Module {
|
||||||
|
Resolved(u64),
|
||||||
|
Unresolved(String),
|
||||||
|
}
|
||||||
|
|
||||||
|
#[derive(Debug, Clone)]
|
||||||
|
pub enum Token {
|
||||||
|
Symbol(Symbol),
|
||||||
|
Register(Register),
|
||||||
|
Immediate(u32),
|
||||||
|
StringLit(String),
|
||||||
|
Opcode(Opcode),
|
||||||
|
}
|
||||||
|
|
||||||
|
impl fmt::Display for Token {
|
||||||
|
fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
|
||||||
|
match self {
|
||||||
|
Self::Symbol(symbol) => write!(f, "{}", symbol),
|
||||||
|
Self::Register(register) => write!(f, "{}", register),
|
||||||
|
Self::Immediate(immediate) => write!(f, "{}", immediate),
|
||||||
|
Self::StringLit(string_lit) => write!(f, "{}", string_lit),
|
||||||
|
Self::Opcode(opcode) => write!(f, "{}", opcode),
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
#[derive(Debug, PartialEq, Eq, Copy, Clone)]
|
||||||
|
pub enum TokenType {
|
||||||
|
Symbol,
|
||||||
|
Register,
|
||||||
|
Immediate,
|
||||||
|
StringLit,
|
||||||
|
Opcode,
|
||||||
|
}
|
||||||
|
|
||||||
|
impl TokenType {
|
||||||
|
#[must_use]
|
||||||
|
pub const fn from_token(token: &Token) -> Self {
|
||||||
|
match token {
|
||||||
|
Token::Symbol(_) => Self::Symbol,
|
||||||
|
Token::Register(_) => Self::Register,
|
||||||
|
Token::Immediate(_) => Self::Immediate,
|
||||||
|
Token::StringLit(_) => Self::StringLit,
|
||||||
|
Token::Opcode(_) => Self::Opcode,
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
#[derive(Debug, Clone, Copy, PartialEq, Eq)]
|
||||||
|
pub enum Opcode {
|
||||||
|
// Real instructions (0x00-0x26)
|
||||||
|
Nop,
|
||||||
|
Mov,
|
||||||
|
Movs,
|
||||||
|
Ldb,
|
||||||
|
Ldbs,
|
||||||
|
Ldh,
|
||||||
|
Ldhs,
|
||||||
|
Ldw,
|
||||||
|
Stb,
|
||||||
|
Sth,
|
||||||
|
Stw,
|
||||||
|
Lli,
|
||||||
|
Lui,
|
||||||
|
Jmp,
|
||||||
|
Jeq,
|
||||||
|
Jne,
|
||||||
|
Jgt,
|
||||||
|
Jge,
|
||||||
|
Jlt,
|
||||||
|
Jle,
|
||||||
|
Cmp,
|
||||||
|
Inc,
|
||||||
|
Dec,
|
||||||
|
Shl,
|
||||||
|
Shr,
|
||||||
|
Add,
|
||||||
|
Sub,
|
||||||
|
And,
|
||||||
|
Or,
|
||||||
|
Not,
|
||||||
|
Xor,
|
||||||
|
Nand,
|
||||||
|
Nor,
|
||||||
|
Xnor,
|
||||||
|
Int,
|
||||||
|
Irt,
|
||||||
|
Hlt,
|
||||||
|
AddI,
|
||||||
|
SubI,
|
||||||
|
|
||||||
|
// Pseudo-instructions
|
||||||
|
Db,
|
||||||
|
Dh,
|
||||||
|
Dw,
|
||||||
|
Resb,
|
||||||
|
Resh,
|
||||||
|
Resw,
|
||||||
|
Push,
|
||||||
|
Pop,
|
||||||
|
Pusha,
|
||||||
|
Popa,
|
||||||
|
Lwi,
|
||||||
|
Call,
|
||||||
|
Return,
|
||||||
|
|
||||||
|
// meta instructions (these aren't present in the binary as instructions)
|
||||||
|
Include,
|
||||||
|
Data,
|
||||||
|
Segment,
|
||||||
|
}
|
||||||
|
|
||||||
|
#[derive(Debug)]
|
||||||
|
pub enum OpcodeFromStrError {
|
||||||
|
InvalidRegister(&'static str),
|
||||||
|
InvalidOpcode(String),
|
||||||
|
}
|
||||||
|
|
||||||
|
impl std::fmt::Display for OpcodeFromStrError {
|
||||||
|
fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
|
||||||
|
match self {
|
||||||
|
Self::InvalidRegister(reg) => write!(f, "register does not exist: {reg}"),
|
||||||
|
Self::InvalidOpcode(op) => write!(f, "instruction does not exist: {op}"),
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
impl std::error::Error for OpcodeFromStrError {}
|
||||||
|
|
||||||
|
impl FromStr for Opcode {
|
||||||
|
type Err = OpcodeFromStrError;
|
||||||
|
|
||||||
|
fn from_str(s: &str) -> Result<Self, Self::Err> {
|
||||||
|
match s.to_lowercase().as_str() {
|
||||||
|
"nop" => Ok(Self::Nop),
|
||||||
|
"mov" => Ok(Self::Mov),
|
||||||
|
"movs" => Ok(Self::Movs),
|
||||||
|
"ldb" => Ok(Self::Ldb),
|
||||||
|
"ldbs" => Ok(Self::Ldbs),
|
||||||
|
"ldh" => Ok(Self::Ldh),
|
||||||
|
"ldhs" => Ok(Self::Ldhs),
|
||||||
|
"ldw" => Ok(Self::Ldw),
|
||||||
|
"stb" => Ok(Self::Stb),
|
||||||
|
"sth" => Ok(Self::Sth),
|
||||||
|
"stw" => Ok(Self::Stw),
|
||||||
|
"lli" => Ok(Self::Lli),
|
||||||
|
"lui" => Ok(Self::Lui),
|
||||||
|
"jmp" => Ok(Self::Jmp),
|
||||||
|
"jeq" => Ok(Self::Jeq),
|
||||||
|
"jne" => Ok(Self::Jne),
|
||||||
|
"jgt" => Ok(Self::Jgt),
|
||||||
|
"jge" => Ok(Self::Jge),
|
||||||
|
"jlt" => Ok(Self::Jlt),
|
||||||
|
"jle" => Ok(Self::Jle),
|
||||||
|
"cmp" => Ok(Self::Cmp),
|
||||||
|
"inc" => Ok(Self::Inc),
|
||||||
|
"dec" => Ok(Self::Dec),
|
||||||
|
"shl" => Ok(Self::Shl),
|
||||||
|
"shr" => Ok(Self::Shr),
|
||||||
|
"add" => Ok(Self::Add),
|
||||||
|
"sub" => Ok(Self::Sub),
|
||||||
|
"and" => Ok(Self::And),
|
||||||
|
"or" => Ok(Self::Or),
|
||||||
|
"not" => Ok(Self::Not),
|
||||||
|
"xor" => Ok(Self::Xor),
|
||||||
|
"nand" => Ok(Self::Nand),
|
||||||
|
"nor" => Ok(Self::Nor),
|
||||||
|
"xnor" => Ok(Self::Xnor),
|
||||||
|
"int" => Ok(Self::Int),
|
||||||
|
"irt" => Ok(Self::Irt),
|
||||||
|
"hlt" => Ok(Self::Hlt),
|
||||||
|
"addi" => Ok(Self::AddI),
|
||||||
|
"subi" => Ok(Self::SubI),
|
||||||
|
"db" => Ok(Self::Db),
|
||||||
|
"dh" => Ok(Self::Dh),
|
||||||
|
"dw" => Ok(Self::Dw),
|
||||||
|
"resb" => Ok(Self::Resb),
|
||||||
|
"resh" => Ok(Self::Resh),
|
||||||
|
"resw" => Ok(Self::Resw),
|
||||||
|
"push" => Ok(Self::Push),
|
||||||
|
"pop" => Ok(Self::Pop),
|
||||||
|
"lwi" => Ok(Self::Lwi),
|
||||||
|
"include" => Ok(Self::Include),
|
||||||
|
"call" => Ok(Self::Call),
|
||||||
|
"return" => Ok(Self::Return),
|
||||||
|
"pusha" => Ok(Self::Pusha),
|
||||||
|
"popa" => Ok(Self::Popa),
|
||||||
|
_ => Err(OpcodeFromStrError::InvalidOpcode(s.to_string())),
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
impl Opcode {
|
||||||
|
pub const OPCODES: &[&str] = &[
|
||||||
|
// Real instructions (0x00-0x26)
|
||||||
|
"nop", "mov", "movs", "ldb", "ldbs", "ldh", "ldhs", "ldw", "stb", "sth", "stw",
|
||||||
|
"lli", "lui", "jmp", "jeq", "jne", "jgt", "jge", "jlt", "jle", "cmp", "inc",
|
||||||
|
"dec", "shl", "shr", "add", "sub", "and", "or", "not", "xor", "nand", "nor",
|
||||||
|
"xnor", "int", "irt", "hlt", "addi", "subi", // Pseudo-instructions
|
||||||
|
"db", "dh", "dw", "resb", "resh", "resw", "push", "pop", "lwi", "call", "return",
|
||||||
|
"pusha", "popa", // meta instructions
|
||||||
|
"include",
|
||||||
|
];
|
||||||
|
|
||||||
|
#[must_use]
|
||||||
|
pub const fn to_opcode_value(&self) -> Option<u8> {
|
||||||
|
match self {
|
||||||
|
Self::Nop => Some(0x00),
|
||||||
|
Self::Mov => Some(0x01),
|
||||||
|
Self::Movs => Some(0x02),
|
||||||
|
Self::Ldb => Some(0x03),
|
||||||
|
Self::Ldbs => Some(0x04),
|
||||||
|
Self::Ldh => Some(0x05),
|
||||||
|
Self::Ldhs => Some(0x06),
|
||||||
|
Self::Ldw => Some(0x07),
|
||||||
|
Self::Stb => Some(0x08),
|
||||||
|
Self::Sth => Some(0x09),
|
||||||
|
Self::Stw => Some(0x0A),
|
||||||
|
Self::Lli => Some(0x0B),
|
||||||
|
Self::Lui => Some(0x0C),
|
||||||
|
Self::Jmp => Some(0x0D),
|
||||||
|
Self::Jeq => Some(0x0E),
|
||||||
|
Self::Jne => Some(0x0F),
|
||||||
|
Self::Jgt => Some(0x10),
|
||||||
|
Self::Jge => Some(0x11),
|
||||||
|
Self::Jlt => Some(0x12),
|
||||||
|
Self::Jle => Some(0x13),
|
||||||
|
Self::Cmp => Some(0x14),
|
||||||
|
Self::Inc => Some(0x15),
|
||||||
|
Self::Dec => Some(0x16),
|
||||||
|
Self::Shl => Some(0x17),
|
||||||
|
Self::Shr => Some(0x18),
|
||||||
|
Self::Add => Some(0x19),
|
||||||
|
Self::Sub => Some(0x1A),
|
||||||
|
Self::And => Some(0x1B),
|
||||||
|
Self::Or => Some(0x1C),
|
||||||
|
Self::Not => Some(0x1D),
|
||||||
|
Self::Xor => Some(0x1E),
|
||||||
|
Self::Nand => Some(0x1F),
|
||||||
|
Self::Nor => Some(0x20),
|
||||||
|
Self::Xnor => Some(0x21),
|
||||||
|
Self::Int => Some(0x22),
|
||||||
|
Self::Irt => Some(0x23),
|
||||||
|
Self::Hlt => Some(0x24),
|
||||||
|
Self::AddI => Some(0x25),
|
||||||
|
Self::SubI => Some(0x26),
|
||||||
|
Self::Segment => Some(0x27),
|
||||||
|
|
||||||
|
// Pseudo-instructions don't have opcode values
|
||||||
|
_ => None,
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
#[must_use]
|
||||||
|
pub const fn is_pseudo_instruction(&self) -> bool {
|
||||||
|
matches!(
|
||||||
|
self,
|
||||||
|
Self::Db
|
||||||
|
| Self::Dh
|
||||||
|
| Self::Dw
|
||||||
|
| Self::Resb
|
||||||
|
| Self::Resh
|
||||||
|
| Self::Resw
|
||||||
|
| Self::Push
|
||||||
|
| Self::Pop
|
||||||
|
| Self::Lwi
|
||||||
|
)
|
||||||
|
}
|
||||||
|
}
|
||||||
@@ -0,0 +1,368 @@
|
|||||||
|
use std::path::{Path, PathBuf};
|
||||||
|
|
||||||
|
use crate::{assembler::AssembleError, expect_token, expect_type, node};
|
||||||
|
|
||||||
|
use crate::assembler::model::{Node, Opcode, Token};
|
||||||
|
use common::prelude::*;
|
||||||
|
|
||||||
|
pub struct Parser {
|
||||||
|
tokens: Vec<Token>,
|
||||||
|
nodes: Vec<Node>,
|
||||||
|
}
|
||||||
|
|
||||||
|
#[derive(Debug)]
|
||||||
|
pub struct Program {
|
||||||
|
pub nodes: Vec<Node>,
|
||||||
|
}
|
||||||
|
|
||||||
|
impl Program {
|
||||||
|
#[must_use]
|
||||||
|
pub const fn new() -> Self {
|
||||||
|
Self { nodes: vec![] }
|
||||||
|
}
|
||||||
|
|
||||||
|
pub fn add_module(&mut self, module: Vec<Node>) {
|
||||||
|
self.nodes.extend(module);
|
||||||
|
}
|
||||||
|
|
||||||
|
pub fn parser(&mut self) -> Parser {
|
||||||
|
Parser {
|
||||||
|
tokens: vec![],
|
||||||
|
nodes: self.nodes.clone(),
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
impl Default for Program {
|
||||||
|
fn default() -> Self {
|
||||||
|
Self::new()
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
impl Parser {
|
||||||
|
pub fn parse_nodes(tokens: Vec<Token>) -> Result<Vec<Node>, AssembleError> {
|
||||||
|
let mut self_ = Self {
|
||||||
|
tokens: tokens.into_iter().rev().collect(),
|
||||||
|
nodes: vec![],
|
||||||
|
};
|
||||||
|
|
||||||
|
while !self_.tokens.is_empty() {
|
||||||
|
let ins = self_.parse_instruction()?;
|
||||||
|
self_.nodes.push(ins);
|
||||||
|
}
|
||||||
|
|
||||||
|
Ok(self_.nodes.clone())
|
||||||
|
}
|
||||||
|
|
||||||
|
pub fn get_dependencies(
|
||||||
|
nodes: &Vec<Node>,
|
||||||
|
source_path: &Path,
|
||||||
|
) -> Result<Vec<PathBuf>, AssembleError> {
|
||||||
|
let mut dependencies = Vec::new();
|
||||||
|
// Get the parent directory of the source file to use as the base directory
|
||||||
|
let base_dir = source_path
|
||||||
|
.parent()
|
||||||
|
.ok_or_else(|| AssembleError::InvalidFile(source_path.to_path_buf()))?;
|
||||||
|
|
||||||
|
for node in nodes {
|
||||||
|
if node.opcode() == Opcode::Include {
|
||||||
|
let path_str = expect_token!(
|
||||||
|
node.args().get(1).ok_or(AssembleError::Generic)?,
|
||||||
|
StringLit
|
||||||
|
)?;
|
||||||
|
let path = PathBuf::from(path_str);
|
||||||
|
|
||||||
|
// If the path is not absolute, make it relative to the base directory
|
||||||
|
let full_path = if path.is_absolute() {
|
||||||
|
path
|
||||||
|
} else {
|
||||||
|
base_dir.join(path)
|
||||||
|
};
|
||||||
|
|
||||||
|
dependencies.push(full_path);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
Ok(dependencies)
|
||||||
|
}
|
||||||
|
|
||||||
|
#[expect(clippy::too_many_lines, clippy::cognitive_complexity)]
|
||||||
|
fn parse_instruction(&mut self) -> Result<Node, AssembleError> {
|
||||||
|
if self.tokens.is_empty() {
|
||||||
|
unreachable!();
|
||||||
|
}
|
||||||
|
|
||||||
|
// check if the Node starts with a label
|
||||||
|
let label = expect_token!(self.peek_next()?, Symbol).ok();
|
||||||
|
if label.is_some() {
|
||||||
|
self.tokens.pop();
|
||||||
|
}
|
||||||
|
|
||||||
|
let opcode = expect_token!(self.next()?, Opcode)?;
|
||||||
|
let args: Vec<Token>;
|
||||||
|
|
||||||
|
match opcode {
|
||||||
|
// R-type instructions
|
||||||
|
Opcode::Mov | Opcode::Movs => {
|
||||||
|
let reg1 = expect_type!(self.next()?, Register, Symbol)?;
|
||||||
|
let reg2 = expect_type!(self.next()?, Register, Symbol)?;
|
||||||
|
args = vec![reg1, reg2];
|
||||||
|
}
|
||||||
|
|
||||||
|
Opcode::Ldb | Opcode::Ldbs | Opcode::Ldh | Opcode::Ldhs | Opcode::Ldw => {
|
||||||
|
let base = expect_type!(self.next()?, Register, Symbol)?;
|
||||||
|
let dest = expect_type!(self.next()?, Register)?;
|
||||||
|
|
||||||
|
let mut offset = Token::Immediate(0);
|
||||||
|
if let Ok(next) = self.peek_next()
|
||||||
|
&& expect_type!(next, Immediate).is_ok() {
|
||||||
|
offset = self.next()?;
|
||||||
|
}
|
||||||
|
|
||||||
|
args = vec![base, dest, offset];
|
||||||
|
}
|
||||||
|
Opcode::Stb | Opcode::Sth | Opcode::Stw => {
|
||||||
|
let base = expect_type!(self.next()?, Register)?;
|
||||||
|
let dest = expect_type!(self.next()?, Register, Symbol)?;
|
||||||
|
let mut offset = Token::Immediate(0);
|
||||||
|
if let Ok(next) = self.peek_next()
|
||||||
|
&& expect_type!(next, Immediate).is_ok() {
|
||||||
|
offset = self.next()?;
|
||||||
|
}
|
||||||
|
args = vec![base, dest, offset];
|
||||||
|
}
|
||||||
|
|
||||||
|
Opcode::Add
|
||||||
|
| Opcode::Sub
|
||||||
|
| Opcode::And
|
||||||
|
| Opcode::Or
|
||||||
|
| Opcode::Xor
|
||||||
|
| Opcode::Nand
|
||||||
|
| Opcode::Nor
|
||||||
|
| Opcode::Xnor => {
|
||||||
|
let src1 = expect_type!(self.next()?, Register, Symbol)?;
|
||||||
|
let src2 = expect_type!(self.next()?, Register, Symbol)?;
|
||||||
|
let dest = expect_type!(self.next()?, Register, Symbol)?;
|
||||||
|
args = vec![src1, src2, dest];
|
||||||
|
}
|
||||||
|
|
||||||
|
Opcode::Not | Opcode::Cmp => {
|
||||||
|
let reg1 = expect_type!(self.next()?, Register, Symbol)?;
|
||||||
|
let reg2 = expect_type!(self.next()?, Register, Symbol)?;
|
||||||
|
args = vec![reg1, reg2];
|
||||||
|
}
|
||||||
|
|
||||||
|
Opcode::Shl | Opcode::Shr => {
|
||||||
|
let reg = expect_type!(self.next()?, Register, Symbol)?;
|
||||||
|
let num = expect_type!(self.next()?, Immediate)?;
|
||||||
|
args = vec![reg, num];
|
||||||
|
}
|
||||||
|
|
||||||
|
Opcode::Inc | Opcode::Dec => {
|
||||||
|
let reg = expect_type!(self.next()?, Register, Symbol)?;
|
||||||
|
args = vec![reg];
|
||||||
|
}
|
||||||
|
|
||||||
|
Opcode::Include => {
|
||||||
|
let mod_name = expect_type!(self.next()?, Symbol)?;
|
||||||
|
let path = expect_type!(self.next()?, StringLit)?;
|
||||||
|
args = vec![mod_name, path];
|
||||||
|
}
|
||||||
|
|
||||||
|
// J-type instructions
|
||||||
|
Opcode::Jmp
|
||||||
|
| Opcode::Jeq
|
||||||
|
| Opcode::Jne
|
||||||
|
| Opcode::Jgt
|
||||||
|
| Opcode::Jge
|
||||||
|
| Opcode::Jlt
|
||||||
|
| Opcode::Jle => {
|
||||||
|
let imm = expect_type!(self.next()?, Immediate, Symbol)?;
|
||||||
|
let offset = match self.peek_next() {
|
||||||
|
Ok(token) => {
|
||||||
|
if expect_type!(token, Register).is_ok() {
|
||||||
|
self.next()?
|
||||||
|
} else {
|
||||||
|
Token::Register(Register::Zero)
|
||||||
|
}
|
||||||
|
}
|
||||||
|
Err(_) => Token::Register(Register::Zero),
|
||||||
|
};
|
||||||
|
args = vec![imm, offset];
|
||||||
|
}
|
||||||
|
|
||||||
|
Opcode::Call => {
|
||||||
|
let addr = expect_type!(self.next()?, Symbol)?;
|
||||||
|
args = vec![addr];
|
||||||
|
}
|
||||||
|
|
||||||
|
// I-type instructions
|
||||||
|
Opcode::Lui | Opcode::Lli | Opcode::Lwi => {
|
||||||
|
let imm = expect_type!(self.next()?, Immediate, Symbol)?;
|
||||||
|
let reg = expect_type!(self.next()?, Register)?;
|
||||||
|
args = vec![imm, reg];
|
||||||
|
}
|
||||||
|
|
||||||
|
// Immediate Arithmetic
|
||||||
|
Opcode::AddI | Opcode::SubI => {
|
||||||
|
let reg = expect_type!(self.next()?, Register)?;
|
||||||
|
let imm = expect_type!(self.next()?, Immediate)?;
|
||||||
|
let reg2 = if expect_type!(self.peek_next()?, Register).is_ok() {
|
||||||
|
self.next()?
|
||||||
|
} else {
|
||||||
|
reg.clone()
|
||||||
|
};
|
||||||
|
args = vec![reg, imm, reg2];
|
||||||
|
}
|
||||||
|
|
||||||
|
// D-type pseudoinstructions (data definition)
|
||||||
|
Opcode::Resb | Opcode::Resh | Opcode::Resw => {
|
||||||
|
let name = expect_type!(self.next()?, Symbol)?;
|
||||||
|
let num = expect_type!(self.next()?, Immediate)?;
|
||||||
|
args = vec![name, num];
|
||||||
|
}
|
||||||
|
|
||||||
|
Opcode::Db | Opcode::Dh | Opcode::Dw => {
|
||||||
|
args = self.parse_data_definition(opcode)?;
|
||||||
|
}
|
||||||
|
|
||||||
|
// E-type pseudoinstructions (stack operations)
|
||||||
|
Opcode::Push | Opcode::Pop => {
|
||||||
|
let reg = expect_type!(self.next()?, Register, Symbol)?;
|
||||||
|
args = vec![reg];
|
||||||
|
}
|
||||||
|
|
||||||
|
Opcode::Pusha | Opcode::Popa => {
|
||||||
|
let count =
|
||||||
|
expect_type!(self.next()?, Immediate).unwrap_or(Token::Immediate(8));
|
||||||
|
args = vec![count];
|
||||||
|
}
|
||||||
|
|
||||||
|
// Special instructions
|
||||||
|
Opcode::Int => {
|
||||||
|
let val = expect_type!(self.next()?, Immediate)?;
|
||||||
|
args = vec![val];
|
||||||
|
}
|
||||||
|
|
||||||
|
// Instructions with no arguments
|
||||||
|
Opcode::Hlt | Opcode::Nop | Opcode::Irt | Opcode::Return => {
|
||||||
|
args = vec![];
|
||||||
|
}
|
||||||
|
|
||||||
|
Opcode::Data | Opcode::Segment => {
|
||||||
|
return Err(AssembleError::Generic);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
Ok(node!(label, opcode, args: args))
|
||||||
|
}
|
||||||
|
|
||||||
|
fn parse_data_definition(
|
||||||
|
&mut self,
|
||||||
|
opcode: Opcode,
|
||||||
|
) -> Result<Vec<Token>, AssembleError> {
|
||||||
|
let mut values = Vec::new();
|
||||||
|
|
||||||
|
let name = expect_type!(self.next()?, Symbol)?;
|
||||||
|
values.push(name);
|
||||||
|
|
||||||
|
match opcode {
|
||||||
|
Opcode::Db => {
|
||||||
|
// db can take string literals or u8 immediates
|
||||||
|
while !self.tokens.is_empty() {
|
||||||
|
let token = self
|
||||||
|
.tokens
|
||||||
|
.last()
|
||||||
|
.expect("Expected a token for data definition, but found none");
|
||||||
|
|
||||||
|
match token {
|
||||||
|
Token::StringLit(_) => {
|
||||||
|
values.push(self.tokens.pop().expect(
|
||||||
|
"Expected a token for data definition, but found none",
|
||||||
|
));
|
||||||
|
}
|
||||||
|
Token::Immediate(val) if u8::try_from(*val).is_ok() => {
|
||||||
|
values.push(self.tokens.pop().expect(
|
||||||
|
"Expected a token for data definition, but found none",
|
||||||
|
));
|
||||||
|
}
|
||||||
|
_ => break,
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
Opcode::Dh => {
|
||||||
|
// dh can take u16 immediates
|
||||||
|
while !self.tokens.is_empty() {
|
||||||
|
let token = self
|
||||||
|
.tokens
|
||||||
|
.last()
|
||||||
|
.expect("Expected a token for data definition, but found none");
|
||||||
|
|
||||||
|
match token {
|
||||||
|
Token::StringLit(_) => {
|
||||||
|
values.push(self.tokens.pop().expect(
|
||||||
|
"Expected a token for data definition, but found none",
|
||||||
|
));
|
||||||
|
}
|
||||||
|
Token::Immediate(val) if u16::try_from(*val).is_ok() => {
|
||||||
|
values.push(self.tokens.pop().expect(
|
||||||
|
"Expected a token for data definition, but found none",
|
||||||
|
));
|
||||||
|
}
|
||||||
|
_ => break,
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
Opcode::Dw => {
|
||||||
|
// dw can take u32 immediates
|
||||||
|
while !self.tokens.is_empty() {
|
||||||
|
match self
|
||||||
|
.tokens
|
||||||
|
.last()
|
||||||
|
.expect("Expected a token for data definition, but found none")
|
||||||
|
{
|
||||||
|
Token::StringLit(_) => {
|
||||||
|
values.push(self.tokens.pop().expect(
|
||||||
|
"Expected a token for data definition, but found none",
|
||||||
|
));
|
||||||
|
}
|
||||||
|
Token::Immediate(val) => {
|
||||||
|
values.push(self.tokens.pop().expect(
|
||||||
|
"Expected a token for data definition, but found none",
|
||||||
|
));
|
||||||
|
}
|
||||||
|
_ => break,
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
_ => unreachable!(),
|
||||||
|
}
|
||||||
|
|
||||||
|
Ok(values)
|
||||||
|
}
|
||||||
|
|
||||||
|
fn next(&mut self) -> Result<Token, AssembleError> {
|
||||||
|
if self.tokens.is_empty() {
|
||||||
|
Err(AssembleError::UnexpectedEof)
|
||||||
|
} else {
|
||||||
|
Ok(self
|
||||||
|
.tokens
|
||||||
|
.pop()
|
||||||
|
.expect("tokens vector was unexpectedly empty in next()"))
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
fn peek_next(&self) -> Result<Token, AssembleError> {
|
||||||
|
if self.tokens.is_empty() {
|
||||||
|
Err(AssembleError::UnexpectedEof)
|
||||||
|
} else {
|
||||||
|
Ok(self
|
||||||
|
.tokens
|
||||||
|
.last()
|
||||||
|
.expect("peek_next called on empty tokens vector")
|
||||||
|
.clone())
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
@@ -0,0 +1,156 @@
|
|||||||
|
use std::{
|
||||||
|
collections::HashMap,
|
||||||
|
fs::canonicalize,
|
||||||
|
path::{Path, PathBuf},
|
||||||
|
};
|
||||||
|
|
||||||
|
use common::prelude::Register;
|
||||||
|
|
||||||
|
use crate::assembler::quick_hash;
|
||||||
|
use crate::assembler::{
|
||||||
|
log,
|
||||||
|
model::{Module, Node, Opcode, Symbol, Token},
|
||||||
|
};
|
||||||
|
use crate::{assembler::AssembleError, node};
|
||||||
|
|
||||||
|
pub fn resolve_symbols(nodes: &mut [Node]) -> Result<(), AssembleError> {
|
||||||
|
let symbol_table = generate_symbol_table(nodes);
|
||||||
|
|
||||||
|
for node in nodes.iter_mut() {
|
||||||
|
match node.opcode() {
|
||||||
|
Opcode::Jmp
|
||||||
|
| Opcode::Jeq
|
||||||
|
| Opcode::Jne
|
||||||
|
| Opcode::Jgt
|
||||||
|
| Opcode::Jge
|
||||||
|
| Opcode::Jlt
|
||||||
|
| Opcode::Jle
|
||||||
|
| Opcode::Lli
|
||||||
|
| Opcode::Lui => {
|
||||||
|
if let Token::Symbol(symbol) = node
|
||||||
|
.arg(0)
|
||||||
|
.expect("Expected argument 0 for jump-like opcode")
|
||||||
|
{
|
||||||
|
if let Some(address) = symbol_table.get(&symbol) {
|
||||||
|
node.tokens[0] = Token::Immediate(*address);
|
||||||
|
} else {
|
||||||
|
return Err(AssembleError::UndefinedSymbol(symbol));
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
_ => (),
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
Ok(())
|
||||||
|
}
|
||||||
|
|
||||||
|
fn generate_symbol_table(nodes: &[Node]) -> HashMap<Symbol, u32> {
|
||||||
|
let mut table = HashMap::new();
|
||||||
|
|
||||||
|
for (i, node) in nodes.iter().enumerate() {
|
||||||
|
if let Some(symbol) = node.label() {
|
||||||
|
table.insert(symbol, 4 * i as u32);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
table
|
||||||
|
}
|
||||||
|
|
||||||
|
pub fn resolve_dependencies(
|
||||||
|
mut nodes: Vec<Node>,
|
||||||
|
base_dir: &Path,
|
||||||
|
) -> Result<Vec<Node>, AssembleError> {
|
||||||
|
// First we get a list of imports.
|
||||||
|
let mut dependencies = Vec::new();
|
||||||
|
for node in &nodes {
|
||||||
|
if node.opcode() == Opcode::Include {
|
||||||
|
// we want the path, and the name
|
||||||
|
let name = if let Token::Symbol(name) = node
|
||||||
|
.arg(0)
|
||||||
|
.expect("Expected argument #0 for Include directive.")
|
||||||
|
{
|
||||||
|
name.name.clone()
|
||||||
|
} else {
|
||||||
|
unreachable!()
|
||||||
|
}; //node.2.get(0).unwrap()
|
||||||
|
|
||||||
|
let Ok(Token::StringLit(path)) = node.arg(1) else {
|
||||||
|
unreachable!()
|
||||||
|
};
|
||||||
|
|
||||||
|
let full_path = base_dir.join(path);
|
||||||
|
let canonical_path = full_path
|
||||||
|
.canonicalize()
|
||||||
|
.map_err(|_| AssembleError::InvalidFile(full_path.clone()))?;
|
||||||
|
|
||||||
|
let hash = quick_hash(&canonical_path);
|
||||||
|
|
||||||
|
dependencies.push((name, hash));
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
let mut changes = Vec::<(u32, u32, Symbol)>::new();
|
||||||
|
// now we resolve the symbols on all the nodes
|
||||||
|
// we need to check all operands for unresolved signals
|
||||||
|
for (i, node) in nodes.clone().iter().enumerate() {
|
||||||
|
let Node {
|
||||||
|
tokens: operands, ..
|
||||||
|
} = node;
|
||||||
|
for (j, token) in operands.iter().enumerate() {
|
||||||
|
if let Token::Symbol(symbol) = token {
|
||||||
|
for d in &dependencies {
|
||||||
|
if let Module::Unresolved(name) = symbol.module.clone() {
|
||||||
|
if name != d.0 {
|
||||||
|
continue;
|
||||||
|
}
|
||||||
|
|
||||||
|
let symbol = Symbol {
|
||||||
|
name: symbol.name.clone(),
|
||||||
|
module: Module::Resolved(d.1),
|
||||||
|
};
|
||||||
|
changes.push((i as u32, j as u32, symbol));
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
for (i, j, symbol) in changes {
|
||||||
|
nodes[i as usize].tokens[j as usize] = Token::Symbol(symbol);
|
||||||
|
}
|
||||||
|
|
||||||
|
Ok(nodes)
|
||||||
|
}
|
||||||
|
|
||||||
|
pub fn create_sections(nodes: &mut Vec<Node>) -> Result<(), AssembleError> {
|
||||||
|
let mut res = Vec::<Node>::with_capacity(nodes.len());
|
||||||
|
|
||||||
|
res.push(node!(None, Opcode::Segment, Token::Immediate(0)));
|
||||||
|
|
||||||
|
for n in nodes.iter() {
|
||||||
|
if n.opcode() == Opcode::Data {
|
||||||
|
res.push(n.clone());
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
let start = res.len() + 1;
|
||||||
|
res.insert(
|
||||||
|
0,
|
||||||
|
node!(
|
||||||
|
None,
|
||||||
|
Opcode::Jmp,
|
||||||
|
Token::Immediate(start as u32 * 4),
|
||||||
|
Token::Register(Register::Zero)
|
||||||
|
),
|
||||||
|
);
|
||||||
|
for n in nodes.iter() {
|
||||||
|
if !matches!(n.opcode(), Opcode::Data | Opcode::Include) {
|
||||||
|
res.push(n.clone());
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
*nodes = res;
|
||||||
|
|
||||||
|
Ok(())
|
||||||
|
}
|
||||||
@@ -1,374 +0,0 @@
|
|||||||
//! Simple compiler engine that orchestrates the entire compilation process.
|
|
||||||
|
|
||||||
use std::collections::{HashMap, HashSet};
|
|
||||||
use std::fmt;
|
|
||||||
use std::path::Path;
|
|
||||||
use std::sync::mpsc;
|
|
||||||
use std::thread;
|
|
||||||
|
|
||||||
use crate::error::{AssembleErrorKind, IoErrorKind};
|
|
||||||
use crate::{
|
|
||||||
context::AssemblerContext,
|
|
||||||
error::AssembleError,
|
|
||||||
model::module::ModuleId,
|
|
||||||
source::{token::Token, tokeniser::Tokeniser},
|
|
||||||
};
|
|
||||||
|
|
||||||
use common::instructions::Instruction;
|
|
||||||
|
|
||||||
/// Error type for the `CompilerEngine`
|
|
||||||
#[derive(Debug)]
|
|
||||||
pub enum EngineError {
|
|
||||||
/// Assembly error during compilation
|
|
||||||
Assembly(AssembleError),
|
|
||||||
/// Channel communication error
|
|
||||||
Channel(String),
|
|
||||||
/// Other generic error
|
|
||||||
Other(String),
|
|
||||||
}
|
|
||||||
|
|
||||||
impl fmt::Display for EngineError {
|
|
||||||
fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
|
|
||||||
match self {
|
|
||||||
Self::Assembly(e) => write!(f, "Assembly error: {e}"),
|
|
||||||
Self::Channel(msg) => write!(f, "Channel error: {msg}"),
|
|
||||||
Self::Other(msg) => write!(f, "Engine error: {msg}"),
|
|
||||||
}
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
impl std::error::Error for EngineError {
|
|
||||||
fn source(&self) -> Option<&(dyn std::error::Error + 'static)> {
|
|
||||||
match self {
|
|
||||||
Self::Assembly(e) => Some(e),
|
|
||||||
Self::Channel(_) | Self::Other(_) => None,
|
|
||||||
}
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
// Convert from AssembleError
|
|
||||||
impl From<AssembleError> for EngineError {
|
|
||||||
fn from(error: AssembleError) -> Self {
|
|
||||||
Self::Assembly(error)
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
// Convert from mpsc::SendError
|
|
||||||
impl<T> From<mpsc::SendError<T>> for EngineError {
|
|
||||||
fn from(error: mpsc::SendError<T>) -> Self {
|
|
||||||
Self::Channel(format!("Send error: {error}"))
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
// Convert from mpsc::RecvError
|
|
||||||
impl From<mpsc::RecvError> for EngineError {
|
|
||||||
fn from(error: mpsc::RecvError) -> Self {
|
|
||||||
Self::Channel(format!("Receive error: {error}"))
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
// Convert from mpsc::TryRecvError
|
|
||||||
impl From<mpsc::TryRecvError> for EngineError {
|
|
||||||
fn from(error: mpsc::TryRecvError) -> Self {
|
|
||||||
Self::Channel(format!("Try receive error: {error}"))
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
// Convert from String for generic errors
|
|
||||||
impl From<String> for EngineError {
|
|
||||||
fn from(error: String) -> Self {
|
|
||||||
Self::Other(error)
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
// Convert from &str for convenience
|
|
||||||
impl From<&str> for EngineError {
|
|
||||||
fn from(error: &str) -> Self {
|
|
||||||
Self::Other(error.to_string())
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
/// Simple compiler engine that orchestrates the entire compilation process.
|
|
||||||
pub struct CompilerEngine {
|
|
||||||
result_tx: mpsc::Sender<Result<Vec<Instruction>, EngineError>>,
|
|
||||||
result_rx: Option<mpsc::Receiver<Result<Vec<Instruction>, EngineError>>>,
|
|
||||||
is_running: bool,
|
|
||||||
}
|
|
||||||
|
|
||||||
impl CompilerEngine {
|
|
||||||
/// Create a new compiler engine
|
|
||||||
#[must_use]
|
|
||||||
pub fn new() -> Self {
|
|
||||||
let (tx, rx) = mpsc::channel();
|
|
||||||
Self {
|
|
||||||
result_tx: tx,
|
|
||||||
result_rx: Some(rx),
|
|
||||||
is_running: false,
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
/// Start the compilation process in a separate thread
|
|
||||||
pub fn start_compilation<P: AsRef<Path>>(&mut self, src: P) {
|
|
||||||
if self.is_running {
|
|
||||||
return;
|
|
||||||
}
|
|
||||||
|
|
||||||
let src = src.as_ref().to_path_buf();
|
|
||||||
let tx = self.result_tx.clone();
|
|
||||||
|
|
||||||
thread::spawn(move || {
|
|
||||||
let result = assemble(&src).map_err(EngineError::from);
|
|
||||||
let _ = tx.send(result); // Ignore send errors if receiver is dropped
|
|
||||||
});
|
|
||||||
|
|
||||||
self.is_running = true;
|
|
||||||
}
|
|
||||||
|
|
||||||
/// Check if compilation is complete and get the result
|
|
||||||
pub fn try_get_result(&mut self) -> Option<Result<Vec<Instruction>, EngineError>> {
|
|
||||||
if !self.is_running {
|
|
||||||
return None;
|
|
||||||
}
|
|
||||||
|
|
||||||
match self
|
|
||||||
.result_rx
|
|
||||||
.as_ref()
|
|
||||||
.expect("result_rx should be Some while compilation is running")
|
|
||||||
.try_recv()
|
|
||||||
{
|
|
||||||
Ok(result) => {
|
|
||||||
self.is_running = false;
|
|
||||||
Some(result)
|
|
||||||
}
|
|
||||||
Err(mpsc::TryRecvError::Empty) => None,
|
|
||||||
Err(mpsc::TryRecvError::Disconnected) => {
|
|
||||||
self.is_running = false;
|
|
||||||
Some(Err(EngineError::Channel(
|
|
||||||
"Compilation thread disconnected".to_string(),
|
|
||||||
)))
|
|
||||||
}
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
/// Block until compilation is complete and return the result
|
|
||||||
pub fn wait_for_result(&mut self) -> Result<Vec<Instruction>, EngineError> {
|
|
||||||
if !self.is_running {
|
|
||||||
return Err(EngineError::Other("No compilation in progress".to_string()));
|
|
||||||
}
|
|
||||||
|
|
||||||
let result = self
|
|
||||||
.result_rx
|
|
||||||
.take()
|
|
||||||
.expect("result_rx should be Some while waiting for compilation result")
|
|
||||||
.recv()
|
|
||||||
.map_err(EngineError::from)?;
|
|
||||||
|
|
||||||
self.is_running = false;
|
|
||||||
result
|
|
||||||
}
|
|
||||||
|
|
||||||
/// Add a source file to be compiled (for compatibility with old interface)
|
|
||||||
pub fn add_source_file<P: AsRef<Path>>(
|
|
||||||
&mut self,
|
|
||||||
path: P,
|
|
||||||
) -> Result<(), EngineError> {
|
|
||||||
let path = path.as_ref().to_path_buf();
|
|
||||||
|
|
||||||
// Verify file exists
|
|
||||||
if !path.exists() {
|
|
||||||
return Err(EngineError::Assembly(AssembleError::new_other_error(
|
|
||||||
AssembleErrorKind::Io(crate::error::IoError::new(
|
|
||||||
IoErrorKind::NotFound,
|
|
||||||
Some(format!("Source file not found: {}", path.display())),
|
|
||||||
)),
|
|
||||||
)));
|
|
||||||
}
|
|
||||||
|
|
||||||
// For now, just validate the file exists
|
|
||||||
// TODO: Could store multiple files for batch compilation
|
|
||||||
Ok(())
|
|
||||||
}
|
|
||||||
|
|
||||||
/// Compile all added source files (synchronous version)
|
|
||||||
pub fn compile(&mut self) -> Result<CompileResult, EngineError> {
|
|
||||||
// This is a placeholder that matches the old interface
|
|
||||||
// For now, return empty result since we don't have a specific file to compile
|
|
||||||
Ok(CompileResult {
|
|
||||||
modules: Vec::new(),
|
|
||||||
tokens: HashMap::new(),
|
|
||||||
})
|
|
||||||
}
|
|
||||||
|
|
||||||
/// Get access to the assembler context (placeholder)
|
|
||||||
pub fn context(&self) -> Result<&AssemblerContext, EngineError> {
|
|
||||||
// For now, return an error since we're using the threaded approach
|
|
||||||
// TODO: Integrate context properly when we have more compilation phases
|
|
||||||
Err(EngineError::Other(
|
|
||||||
"Context not available in threaded mode".to_string(),
|
|
||||||
))
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
impl Default for CompilerEngine {
|
|
||||||
fn default() -> Self {
|
|
||||||
Self::new()
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
/// Main assembly function that orchestrates the compilation process
|
|
||||||
fn assemble(src: &Path) -> Result<Vec<Instruction>, AssembleError> {
|
|
||||||
// Verify the file exists
|
|
||||||
if !src.exists() {
|
|
||||||
return Err(AssembleError::new_other_error(AssembleErrorKind::Io(
|
|
||||||
crate::error::IoError::new(
|
|
||||||
IoErrorKind::NotFound,
|
|
||||||
Some(format!("Source file not found: {}", src.display())),
|
|
||||||
),
|
|
||||||
)));
|
|
||||||
}
|
|
||||||
|
|
||||||
let mut modules = HashSet::new();
|
|
||||||
let mut all_tokens = HashMap::new();
|
|
||||||
let mut module_ids = Vec::new();
|
|
||||||
|
|
||||||
// Create a new assembler context for this compilation
|
|
||||||
let context = AssemblerContext::new();
|
|
||||||
|
|
||||||
// Process the main file and its dependencies
|
|
||||||
prepare_dependency(
|
|
||||||
src,
|
|
||||||
&mut modules,
|
|
||||||
&mut all_tokens,
|
|
||||||
&mut module_ids,
|
|
||||||
&context,
|
|
||||||
)?;
|
|
||||||
|
|
||||||
// Phase 2: Parse tokens into AST (placeholder for now)
|
|
||||||
// TODO: Add parser here when implemented
|
|
||||||
println!("Phase 2: Parsing {} modules...", module_ids.len());
|
|
||||||
|
|
||||||
// Phase 3: Symbol resolution (placeholder for now)
|
|
||||||
// TODO: Add symbol resolution here when implemented
|
|
||||||
println!("Phase 3: Resolving symbols...");
|
|
||||||
|
|
||||||
// Phase 4: Code generation (placeholder for now)
|
|
||||||
// TODO: Add code generation here when implemented
|
|
||||||
println!("Phase 4: Generating code...");
|
|
||||||
|
|
||||||
// For now, return empty instructions since we don't have the full pipeline yet
|
|
||||||
Ok(Vec::new())
|
|
||||||
}
|
|
||||||
|
|
||||||
/// Prepare a dependency (file) for compilation
|
|
||||||
fn prepare_dependency(
|
|
||||||
path: &Path,
|
|
||||||
modules: &mut HashSet<u64>,
|
|
||||||
all_tokens: &mut HashMap<ModuleId, Vec<Token>>,
|
|
||||||
module_ids: &mut Vec<ModuleId>,
|
|
||||||
context: &AssemblerContext,
|
|
||||||
) -> Result<(), AssembleError> {
|
|
||||||
let filename = path.file_name().and_then(|n| n.to_str()).ok_or_else(|| {
|
|
||||||
AssembleError::new_other_error(AssembleErrorKind::Io(crate::error::IoError::new(
|
|
||||||
IoErrorKind::InvalidData,
|
|
||||||
Some("Failed to get file name from path".to_string()),
|
|
||||||
)))
|
|
||||||
})?;
|
|
||||||
|
|
||||||
// Calculate a simple hash for the file (similar to quick_hash)
|
|
||||||
let file_hash = calculate_file_hash(path);
|
|
||||||
|
|
||||||
// Skip if we've already processed this module
|
|
||||||
if modules.contains(&file_hash) {
|
|
||||||
return Ok(());
|
|
||||||
}
|
|
||||||
modules.insert(file_hash);
|
|
||||||
|
|
||||||
if let Ok(canonical_path) = path.canonicalize() {
|
|
||||||
println!("Building {} [{}]", filename, canonical_path.display());
|
|
||||||
}
|
|
||||||
|
|
||||||
// Phase 1: Tokenize the file
|
|
||||||
println!("Tokenising {filename}");
|
|
||||||
let tokeniser = Tokeniser::new(path, context)?;
|
|
||||||
let tokens = tokeniser.tokenise()?;
|
|
||||||
|
|
||||||
// Get the module ID that was registered during tokenization
|
|
||||||
let module_id = get_module_id_for_file(path, context)?;
|
|
||||||
|
|
||||||
all_tokens.insert(module_id, tokens);
|
|
||||||
module_ids.push(module_id);
|
|
||||||
|
|
||||||
// TODO: Parse tokens to find dependencies (.include directives, etc.)
|
|
||||||
// For now, we'll just process the single file
|
|
||||||
println!("Resolving dependencies for {filename}");
|
|
||||||
|
|
||||||
Ok(())
|
|
||||||
}
|
|
||||||
|
|
||||||
/// Calculate a simple hash for a file path (similar to the old `quick_hash`)
|
|
||||||
fn calculate_file_hash(path: &Path) -> u64 {
|
|
||||||
use std::collections::hash_map::DefaultHasher;
|
|
||||||
use std::hash::{Hash, Hasher};
|
|
||||||
|
|
||||||
let mut hasher = DefaultHasher::new();
|
|
||||||
if let Ok(canonical) = path.canonicalize() {
|
|
||||||
canonical.hash(&mut hasher);
|
|
||||||
} else {
|
|
||||||
path.hash(&mut hasher);
|
|
||||||
}
|
|
||||||
hasher.finish()
|
|
||||||
}
|
|
||||||
|
|
||||||
/// Get the module ID for a given source file
|
|
||||||
fn get_module_id_for_file(
|
|
||||||
file_path: &Path,
|
|
||||||
context: &AssemblerContext,
|
|
||||||
) -> Result<ModuleId, AssembleError> {
|
|
||||||
{
|
|
||||||
let registry = context.module_registry.read()?;
|
|
||||||
|
|
||||||
// Find module by path.
|
|
||||||
for module in registry.modules() {
|
|
||||||
if module.path == file_path {
|
|
||||||
return Ok(module.id);
|
|
||||||
}
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
Err(AssembleError::new_other_error(AssembleErrorKind::Io(
|
|
||||||
crate::error::IoError::new(
|
|
||||||
IoErrorKind::NotFound,
|
|
||||||
Some(format!(
|
|
||||||
"Module not found for file: {}",
|
|
||||||
file_path.display()
|
|
||||||
)),
|
|
||||||
),
|
|
||||||
)))
|
|
||||||
}
|
|
||||||
|
|
||||||
/// Result of compilation. This is useless at present but compiles.
|
|
||||||
#[derive(Debug)]
|
|
||||||
pub struct CompileResult {
|
|
||||||
pub modules: Vec<ModuleId>,
|
|
||||||
pub tokens: HashMap<ModuleId, Vec<Token>>,
|
|
||||||
}
|
|
||||||
|
|
||||||
impl CompileResult {
|
|
||||||
/// Get tokens for a specific module
|
|
||||||
#[must_use]
|
|
||||||
pub fn get_tokens(&self, module_id: &ModuleId) -> Option<&Vec<Token>> {
|
|
||||||
self.tokens.get(module_id)
|
|
||||||
}
|
|
||||||
|
|
||||||
/// Get all module IDs
|
|
||||||
#[must_use]
|
|
||||||
pub fn module_ids(&self) -> &[ModuleId] {
|
|
||||||
&self.modules
|
|
||||||
}
|
|
||||||
|
|
||||||
/// Get total number of tokens across all modules
|
|
||||||
#[must_use]
|
|
||||||
pub fn total_tokens(&self) -> usize {
|
|
||||||
self.tokens.values().map(std::vec::Vec::len).sum()
|
|
||||||
}
|
|
||||||
}
|
|
||||||
@@ -1,28 +0,0 @@
|
|||||||
//! This module contains the global asembler context to be passed to functions that need
|
|
||||||
//! it.
|
|
||||||
|
|
||||||
use std::sync::RwLock;
|
|
||||||
|
|
||||||
use crate::{model::module_registry::ModuleRegistry, symtab::SymbolTable};
|
|
||||||
|
|
||||||
/// Global state to be passed around.
|
|
||||||
pub struct AssemblerContext {
|
|
||||||
pub symbol_table: RwLock<SymbolTable>,
|
|
||||||
pub module_registry: RwLock<ModuleRegistry>,
|
|
||||||
}
|
|
||||||
|
|
||||||
impl Default for AssemblerContext {
|
|
||||||
fn default() -> Self {
|
|
||||||
Self::new()
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
impl AssemblerContext {
|
|
||||||
#[must_use]
|
|
||||||
pub fn new() -> Self {
|
|
||||||
Self {
|
|
||||||
symbol_table: RwLock::new(SymbolTable::new()),
|
|
||||||
module_registry: RwLock::new(ModuleRegistry::new()),
|
|
||||||
}
|
|
||||||
}
|
|
||||||
}
|
|
||||||
@@ -1,275 +0,0 @@
|
|||||||
//! This module contains code for various types of errors that may occur when assembling a
|
|
||||||
//! set of source DSA files.
|
|
||||||
|
|
||||||
use std::fmt::{Debug, Display};
|
|
||||||
|
|
||||||
use crate::source::{source_info::SourceInfo, tokeniser::error::TokeniserError};
|
|
||||||
|
|
||||||
/// An error that may occur during the assembly of a set of source files.
|
|
||||||
#[derive(Debug)]
|
|
||||||
pub struct AssembleError {
|
|
||||||
/// Display implementation can handle when the source code information is shown or
|
|
||||||
/// not.
|
|
||||||
source_info: Option<SourceInfo>,
|
|
||||||
/// The type of assembly error that occurred.
|
|
||||||
kind: AssembleErrorKind,
|
|
||||||
/// Whether context should be added to errors being printed. This might get changed
|
|
||||||
/// to Verbosity in the future.
|
|
||||||
display_quietly: bool,
|
|
||||||
}
|
|
||||||
|
|
||||||
impl AssembleError {
|
|
||||||
#[must_use]
|
|
||||||
pub const fn new_source_error(
|
|
||||||
source_info: SourceInfo,
|
|
||||||
kind: AssembleErrorKind,
|
|
||||||
) -> Self {
|
|
||||||
Self {
|
|
||||||
source_info: Some(source_info),
|
|
||||||
kind,
|
|
||||||
display_quietly: false,
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
#[must_use]
|
|
||||||
pub const fn new_other_error(kind: AssembleErrorKind) -> Self {
|
|
||||||
Self {
|
|
||||||
source_info: None,
|
|
||||||
kind,
|
|
||||||
display_quietly: true,
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
/// Prints a parser error to the screen.
|
|
||||||
fn print_parser_error(
|
|
||||||
&self,
|
|
||||||
f: &mut std::fmt::Formatter<'_>,
|
|
||||||
parse_error: &ParserError,
|
|
||||||
) -> std::fmt::Result {
|
|
||||||
let Some(source_info) = &self.source_info else {
|
|
||||||
write!(
|
|
||||||
f,
|
|
||||||
"parser error thrown with no source information. Error: {parse_error}"
|
|
||||||
)?;
|
|
||||||
|
|
||||||
return Ok(());
|
|
||||||
};
|
|
||||||
|
|
||||||
writeln!(f, "parser error of type `{parse_error}`.\n")?;
|
|
||||||
|
|
||||||
// Prints out the context for our error.
|
|
||||||
if !self.display_quietly {
|
|
||||||
source_info.print_context_with_underline().map_err(|e| {
|
|
||||||
_ = writeln!(f, "print context error: {e}");
|
|
||||||
|
|
||||||
std::fmt::Error {}
|
|
||||||
})?;
|
|
||||||
}
|
|
||||||
|
|
||||||
Ok(())
|
|
||||||
}
|
|
||||||
|
|
||||||
/// Prints a tokeniser error to the screen.
|
|
||||||
fn print_tokeniser_error(
|
|
||||||
&self,
|
|
||||||
f: &mut std::fmt::Formatter<'_>,
|
|
||||||
err: &TokeniserError,
|
|
||||||
) -> std::fmt::Result {
|
|
||||||
let Some(source_info) = &self.source_info else {
|
|
||||||
write!(
|
|
||||||
f,
|
|
||||||
"Tokeniser error thrown with no source information. Error: {err}"
|
|
||||||
)?;
|
|
||||||
|
|
||||||
return Ok(());
|
|
||||||
};
|
|
||||||
|
|
||||||
writeln!(f, "tokeniser error of type `{err}`.\n")?;
|
|
||||||
|
|
||||||
// Prints out the context for our error.
|
|
||||||
source_info.print_context_with_underline().map_err(|e| {
|
|
||||||
_ = writeln!(f, "Print context error: {e}");
|
|
||||||
|
|
||||||
std::fmt::Error {}
|
|
||||||
})?;
|
|
||||||
|
|
||||||
Ok(())
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
impl Display for AssembleError {
|
|
||||||
fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
|
|
||||||
if let Some(info) = &self.source_info {
|
|
||||||
write!(f, "At {info}, got ")?;
|
|
||||||
|
|
||||||
match &self.kind {
|
|
||||||
AssembleErrorKind::Parser(err) => self.print_parser_error(f, err)?,
|
|
||||||
AssembleErrorKind::Tokeniser(err) => {
|
|
||||||
self.print_tokeniser_error(f, err)?;
|
|
||||||
}
|
|
||||||
_ => write!(f, "{}", self.kind)?,
|
|
||||||
}
|
|
||||||
|
|
||||||
writeln!(f)?;
|
|
||||||
|
|
||||||
return Ok(());
|
|
||||||
}
|
|
||||||
|
|
||||||
// Handle errors without SourceInfo.
|
|
||||||
write!(f, "{}", self.kind)?;
|
|
||||||
|
|
||||||
Ok(())
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
/// Marker trait.
|
|
||||||
impl std::error::Error for AssembleError {}
|
|
||||||
|
|
||||||
#[derive(Debug, Clone)]
|
|
||||||
#[non_exhaustive]
|
|
||||||
pub enum AssembleErrorKind {
|
|
||||||
/// Usually unexpected I/O errors. Not normally recoverable.
|
|
||||||
Io(IoError),
|
|
||||||
/// Errors emitted from the [`Tokeniser`].
|
|
||||||
Tokeniser(TokeniserError),
|
|
||||||
Parser(ParserError),
|
|
||||||
Symbol(SymbolError),
|
|
||||||
Codegen(CodegenError),
|
|
||||||
Threading(ThreadingError),
|
|
||||||
/// Returned for code where the functionality has not yet been implemented but we
|
|
||||||
/// don't want the program to panic.
|
|
||||||
Unimplemented(&'static str),
|
|
||||||
}
|
|
||||||
|
|
||||||
#[derive(Debug, Clone)]
|
|
||||||
pub enum ParserError {
|
|
||||||
UnexpectedToken,
|
|
||||||
MissingOperand,
|
|
||||||
InvalidInstruction,
|
|
||||||
MissingLabel,
|
|
||||||
DuplicateLabel,
|
|
||||||
}
|
|
||||||
|
|
||||||
impl Display for ParserError {
|
|
||||||
fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
|
|
||||||
match self {
|
|
||||||
Self::UnexpectedToken => write!(f, "unexpected token"),
|
|
||||||
Self::MissingOperand => write!(f, "missing operand"),
|
|
||||||
Self::InvalidInstruction => write!(f, "invalid instruction"),
|
|
||||||
Self::MissingLabel => write!(f, "missing label"),
|
|
||||||
Self::DuplicateLabel => write!(f, "duplicate label"),
|
|
||||||
}
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
#[derive(Debug, Clone)]
|
|
||||||
pub enum SymbolError {
|
|
||||||
Undefined,
|
|
||||||
Duplicate,
|
|
||||||
CircularDependency,
|
|
||||||
InvalidReference,
|
|
||||||
}
|
|
||||||
|
|
||||||
impl Display for SymbolError {
|
|
||||||
fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
|
|
||||||
match self {
|
|
||||||
Self::Undefined => write!(f, "undefined symbol"),
|
|
||||||
Self::Duplicate => write!(f, "duplicate symbol"),
|
|
||||||
Self::CircularDependency => write!(f, "circular dependency"),
|
|
||||||
Self::InvalidReference => write!(f, "invalid reference"),
|
|
||||||
}
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
#[derive(Debug, Clone)]
|
|
||||||
pub enum CodegenError {
|
|
||||||
InvalidOperand,
|
|
||||||
OutOfRange,
|
|
||||||
UnsupportedInstruction,
|
|
||||||
}
|
|
||||||
|
|
||||||
impl Display for CodegenError {
|
|
||||||
fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
|
|
||||||
match self {
|
|
||||||
Self::InvalidOperand => write!(f, "invalid operand"),
|
|
||||||
Self::OutOfRange => write!(f, "out of range"),
|
|
||||||
Self::UnsupportedInstruction => write!(f, "unsupported instruction"),
|
|
||||||
}
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
#[derive(Debug, Clone)]
|
|
||||||
pub enum ThreadingError {
|
|
||||||
LockFailed,
|
|
||||||
ThreadPanic,
|
|
||||||
}
|
|
||||||
|
|
||||||
impl Display for ThreadingError {
|
|
||||||
fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
|
|
||||||
match self {
|
|
||||||
Self::LockFailed => write!(f, "lock failed"),
|
|
||||||
Self::ThreadPanic => write!(f, "thread panic"),
|
|
||||||
}
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
#[derive(Debug, Clone)]
|
|
||||||
pub struct IoError {
|
|
||||||
msg: Option<String>,
|
|
||||||
kind: IoErrorKind,
|
|
||||||
}
|
|
||||||
|
|
||||||
impl IoError {
|
|
||||||
#[must_use]
|
|
||||||
pub const fn new(kind: IoErrorKind, msg: Option<String>) -> Self {
|
|
||||||
Self { msg, kind }
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
#[derive(Debug, Clone)]
|
|
||||||
pub enum IoErrorKind {
|
|
||||||
NotFound,
|
|
||||||
PermissionDenied,
|
|
||||||
InvalidData,
|
|
||||||
Other,
|
|
||||||
}
|
|
||||||
|
|
||||||
impl std::fmt::Display for IoErrorKind {
|
|
||||||
fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
|
|
||||||
match self {
|
|
||||||
Self::NotFound => write!(f, "file not found"),
|
|
||||||
Self::PermissionDenied => write!(f, "permission denied"),
|
|
||||||
Self::InvalidData => write!(f, "invalid data"),
|
|
||||||
Self::Other => write!(f, "other I/O error"),
|
|
||||||
}
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
impl std::fmt::Display for IoError {
|
|
||||||
fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
|
|
||||||
write!(f, "{}", self.kind)?;
|
|
||||||
|
|
||||||
if let Some(msg) = &self.msg {
|
|
||||||
write!(f, ", \"{msg}\"")?;
|
|
||||||
}
|
|
||||||
|
|
||||||
Ok(())
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
impl Display for AssembleErrorKind {
|
|
||||||
fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
|
|
||||||
match self {
|
|
||||||
Self::Tokeniser(why) => write!(f, "tokeniser error: {why}"),
|
|
||||||
Self::Unimplemented(why) => write!(f, "used unimplemented feature: {why}"),
|
|
||||||
Self::Io(why) => write!(f, "problem occurred with I/O: {why}"),
|
|
||||||
#[allow(unreachable_patterns)]
|
|
||||||
_ => write!(
|
|
||||||
f,
|
|
||||||
"unhandled error type in Display implementation! See error.rs!"
|
|
||||||
),
|
|
||||||
}
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
pub mod conversions;
|
|
||||||
@@ -1,67 +0,0 @@
|
|||||||
use std::{
|
|
||||||
io::ErrorKind,
|
|
||||||
sync::{PoisonError, RwLockReadGuard, RwLockWriteGuard},
|
|
||||||
};
|
|
||||||
|
|
||||||
use crate::error::{AssembleError, IoError, IoErrorKind};
|
|
||||||
|
|
||||||
use super::{AssembleErrorKind, ThreadingError};
|
|
||||||
|
|
||||||
impl From<std::io::Error> for IoError {
|
|
||||||
fn from(err: std::io::Error) -> Self {
|
|
||||||
let kind = match err.kind() {
|
|
||||||
ErrorKind::NotFound => IoErrorKind::NotFound,
|
|
||||||
ErrorKind::PermissionDenied => IoErrorKind::PermissionDenied,
|
|
||||||
ErrorKind::InvalidData => IoErrorKind::InvalidData,
|
|
||||||
_ => IoErrorKind::Other,
|
|
||||||
};
|
|
||||||
|
|
||||||
let msg = err.to_string();
|
|
||||||
|
|
||||||
Self::new(kind, Some(msg))
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
impl From<std::io::Error> for AssembleError {
|
|
||||||
fn from(err: std::io::Error) -> Self {
|
|
||||||
Self::new_other_error(AssembleErrorKind::Io(err.into()))
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
// TODO: Maybe attempt recovery? To be honest we don't want any threads to panic at all,
|
|
||||||
// or we want them all to panic spectacularly.
|
|
||||||
impl<T> From<PoisonError<RwLockReadGuard<'_, T>>> for AssembleError {
|
|
||||||
fn from(err: PoisonError<RwLockReadGuard<'_, T>>) -> Self {
|
|
||||||
Self::new_other_error(AssembleErrorKind::Threading(err.into()))
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
impl<T> From<PoisonError<RwLockReadGuard<'_, T>>> for ThreadingError {
|
|
||||||
fn from(_err: PoisonError<RwLockReadGuard<'_, T>>) -> Self {
|
|
||||||
Self::LockFailed
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
impl<T> From<PoisonError<RwLockWriteGuard<'_, T>>> for AssembleError {
|
|
||||||
fn from(err: PoisonError<RwLockWriteGuard<'_, T>>) -> Self {
|
|
||||||
Self::new_other_error(AssembleErrorKind::Threading(err.into()))
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
impl<T> From<PoisonError<RwLockWriteGuard<'_, T>>> for ThreadingError {
|
|
||||||
fn from(_err: PoisonError<RwLockWriteGuard<'_, T>>) -> Self {
|
|
||||||
Self::LockFailed
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
impl From<std::fmt::Error> for AssembleError {
|
|
||||||
fn from(err: std::fmt::Error) -> Self {
|
|
||||||
IoError::new(IoErrorKind::Other, Some(err.to_string())).into()
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
impl From<IoError> for AssembleError {
|
|
||||||
fn from(err: IoError) -> Self {
|
|
||||||
Self::new_other_error(AssembleErrorKind::Io(err))
|
|
||||||
}
|
|
||||||
}
|
|
||||||
+9
-10
@@ -12,18 +12,17 @@
|
|||||||
clippy::match_wildcard_for_single_variants
|
clippy::match_wildcard_for_single_variants
|
||||||
)]
|
)]
|
||||||
|
|
||||||
pub mod args;
|
pub mod assembler;
|
||||||
// pub mod tooling;
|
pub mod image_builder;
|
||||||
pub mod compiler_engine;
|
pub mod tooling;
|
||||||
pub mod context;
|
|
||||||
pub mod error;
|
|
||||||
pub mod model;
|
|
||||||
pub mod source;
|
|
||||||
pub mod symtab;
|
|
||||||
|
|
||||||
mod util;
|
mod util;
|
||||||
|
|
||||||
// pub mod prelude {}
|
pub mod prelude {
|
||||||
|
pub use crate::assembler::CompilerEngine;
|
||||||
|
pub use crate::image_builder;
|
||||||
|
pub use crate::tooling::brainf;
|
||||||
|
pub use crate::tooling::project;
|
||||||
|
}
|
||||||
|
|
||||||
use num_cpus as _;
|
use num_cpus as _;
|
||||||
use threadpool as _;
|
use threadpool as _;
|
||||||
|
|||||||
+47
-75
@@ -1,92 +1,64 @@
|
|||||||
use std::sync::Arc;
|
|
||||||
|
|
||||||
use assembler::{
|
|
||||||
error::{AssembleError, AssembleErrorKind, ParserError},
|
|
||||||
model::module::Module,
|
|
||||||
source::{source_info::SourceInfo, token::TokenType, tokeniser::Tokeniser},
|
|
||||||
};
|
|
||||||
use common as _;
|
use common as _;
|
||||||
use num_cpus as _;
|
use num_cpus as _;
|
||||||
use threadpool as _;
|
use threadpool as _;
|
||||||
|
|
||||||
// use clap::Parser;
|
use assembler::{
|
||||||
// use std::{fs, io::Write, path::PathBuf};
|
prelude::*,
|
||||||
|
tooling::{brainf, project},
|
||||||
|
};
|
||||||
|
use std::{fs, io::Write, path::PathBuf};
|
||||||
|
|
||||||
fn main() -> Result<(), AssembleError> {
|
fn main() {
|
||||||
// // Parse command line arguments
|
// Parse command line arguments
|
||||||
// let args: Vec<String> = std::env::args().collect();
|
let args: Vec<String> = std::env::args().collect();
|
||||||
let contents = include_bytes!("../../resources/dsa/bf.dsa").to_vec();
|
|
||||||
|
|
||||||
let module = Arc::new(Module::new("resources/dsa/bf.dsa")?);
|
if args.len() == 2 && args[1] == "init" {
|
||||||
let tok = Tokeniser::from_data(contents, module.clone());
|
project::tool_libcreate();
|
||||||
|
std::process::exit(0);
|
||||||
let ts = tok
|
|
||||||
.tokenise()?
|
|
||||||
.into_iter()
|
|
||||||
.filter(|t| !matches!(t.token_type, TokenType::Eof | TokenType::Newline));
|
|
||||||
|
|
||||||
for t in ts {
|
|
||||||
t.source_info.print_context_with_underline()?;
|
|
||||||
}
|
}
|
||||||
|
|
||||||
let test_error: AssembleError = AssembleError::new_source_error(
|
if args.len() == 2 && args[1] == "brainf" {
|
||||||
SourceInfo::new(45, module.clone(), 4..7),
|
let src = PathBuf::from("brainf.bf");
|
||||||
AssembleErrorKind::Parser(ParserError::InvalidInstruction),
|
let result = brainf::build(&src);
|
||||||
);
|
|
||||||
|
|
||||||
eprintln!("\n\n{test_error}");
|
let mut file = match fs::File::create("brainf.dsb") {
|
||||||
|
Err(e) => {
|
||||||
|
eprintln!("Failed to create output file: {e}");
|
||||||
|
std::process::exit(1);
|
||||||
|
}
|
||||||
|
Ok(file) => file,
|
||||||
|
};
|
||||||
|
|
||||||
Ok(())
|
for instruction in result {
|
||||||
|
if let Err(e) = file.write(&instruction.encode().to_be_bytes()) {
|
||||||
|
eprintln!("Failed to write to output file: {e}");
|
||||||
|
std::process::exit(1);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
// let _clap_args = assembler::args::Args::parse();
|
std::process::exit(0);
|
||||||
|
}
|
||||||
|
|
||||||
// if args.len() == 2 && args[1] == "init" {
|
if args.len() != 5 || args[1] != "-i" || args[3] != "-o" {
|
||||||
// // project::tool_libcreate();
|
eprintln!("Usage: {} -i input_path -o output_path", args[0]);
|
||||||
// std::process::exit(0);
|
std::process::exit(1);
|
||||||
// }
|
}
|
||||||
|
|
||||||
// if args.len() == 2 && args[1] == "brainf" {
|
let input_path = &args[2];
|
||||||
// let src = PathBuf::from("brainf.bf");
|
let output_path = &args[4];
|
||||||
// // let result = brainf::build(&src);
|
let src = PathBuf::from(input_path);
|
||||||
|
|
||||||
// let mut file = match fs::File::create("brainf.dsb") {
|
// Initialize the compiler engine
|
||||||
// Err(e) => {
|
let mut compiler = CompilerEngine::new();
|
||||||
// eprintln!("Failed to create output file: {e}");
|
compiler.start_compilation(&src);
|
||||||
// std::process::exit(1);
|
|
||||||
// }
|
|
||||||
// Ok(file) => file,
|
|
||||||
// };
|
|
||||||
|
|
||||||
// // for instruction in result {
|
// Or block until done
|
||||||
// // if let Err(e) = file.write(&instruction.encode().to_be_bytes()) {
|
let result = compiler.wait_for_result().unwrap();
|
||||||
// // eprintln!("Failed to write to output file: {e}");
|
|
||||||
// // std::process::exit(1);
|
|
||||||
// // }
|
|
||||||
// // }
|
|
||||||
|
|
||||||
// std::process::exit(0);
|
for instruction in result {
|
||||||
// }
|
if let Err(e) = fs::write(output_path, instruction.encode().to_be_bytes()) {
|
||||||
|
eprintln!("Failed to write to output file: {e}");
|
||||||
// if args.len() != 5 || args[1] != "-i" || args[3] != "-o" {
|
std::process::exit(1);
|
||||||
// eprintln!("Usage: {} -i input_path -o output_path", args[0]);
|
}
|
||||||
// std::process::exit(1);
|
}
|
||||||
// }
|
|
||||||
|
|
||||||
// let input_path = &args[2];
|
|
||||||
// let output_path = &args[4];
|
|
||||||
// let src = PathBuf::from(input_path);
|
|
||||||
|
|
||||||
// // Initialize the compiler engine
|
|
||||||
// let mut compiler = CompilerEngine::new();
|
|
||||||
// compiler.start_compilation(&src);
|
|
||||||
|
|
||||||
// // Or block until done
|
|
||||||
// let result = compiler.wait_for_result().unwrap();
|
|
||||||
|
|
||||||
// for instruction in result {
|
|
||||||
// if let Err(e) = fs::write(output_path, instruction.encode().to_be_bytes()) {
|
|
||||||
// eprintln!("Failed to write to output file: {e}");
|
|
||||||
// std::process::exit(1);
|
|
||||||
// }
|
|
||||||
// }
|
|
||||||
}
|
}
|
||||||
|
|||||||
@@ -1,5 +0,0 @@
|
|||||||
//! This module contains the underlying data models and enums used by the Assembler.
|
|
||||||
|
|
||||||
pub mod module;
|
|
||||||
pub mod module_registry;
|
|
||||||
pub mod symbol;
|
|
||||||
@@ -1,110 +0,0 @@
|
|||||||
//! This module contains the [`Module`] type and associated types. Each compilation unit
|
|
||||||
//! (file) is represented by a module which is used to namespace "function" calls and
|
|
||||||
//! accesses to global variables.
|
|
||||||
//!
|
|
||||||
//! They have unique identifiers in the form of UUIDs.
|
|
||||||
|
|
||||||
use std::{
|
|
||||||
path::{Path, PathBuf},
|
|
||||||
sync::Arc,
|
|
||||||
};
|
|
||||||
|
|
||||||
use regex::Regex;
|
|
||||||
use uuid::Uuid;
|
|
||||||
|
|
||||||
use crate::{
|
|
||||||
error::{AssembleError, AssembleErrorKind, IoError, IoErrorKind},
|
|
||||||
model::module_registry::ModuleRegistry,
|
|
||||||
};
|
|
||||||
|
|
||||||
/// The ID for a module. A tuple struct for type safety.
|
|
||||||
#[derive(Debug, Hash, PartialEq, Eq, Clone, Copy)]
|
|
||||||
pub struct ModuleId(Uuid);
|
|
||||||
|
|
||||||
impl ModuleId {
|
|
||||||
#[must_use]
|
|
||||||
pub fn new() -> Self {
|
|
||||||
Self(Uuid::new_v4())
|
|
||||||
}
|
|
||||||
|
|
||||||
#[must_use]
|
|
||||||
pub const fn from_module(module: &Module) -> Self {
|
|
||||||
module.id
|
|
||||||
}
|
|
||||||
|
|
||||||
/// Convenience method to get the [`Module`] from a [`ModuleId`].
|
|
||||||
#[must_use]
|
|
||||||
pub fn to_module<'m>(&self, registry: &'m ModuleRegistry) -> Option<&'m Arc<Module>> {
|
|
||||||
registry.get(self)
|
|
||||||
}
|
|
||||||
|
|
||||||
/// Convenience method to get the [`Module`] name from a [`ModuleId`].
|
|
||||||
#[must_use]
|
|
||||||
pub fn to_module_name(self, registry: &ModuleRegistry) -> Option<&str> {
|
|
||||||
self.to_module(registry).map(|module| module.name.as_str())
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
impl Default for ModuleId {
|
|
||||||
fn default() -> Self {
|
|
||||||
Self::new()
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
impl std::fmt::Display for ModuleId {
|
|
||||||
fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
|
|
||||||
write!(f, "{}", self.0)
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
/// A single source file or compilation unit. Stores its own symbol table.
|
|
||||||
#[derive(Debug, Clone)]
|
|
||||||
pub struct Module {
|
|
||||||
/// The name of the module. This is typically the name of the file, less the `.dsa`
|
|
||||||
/// extension.
|
|
||||||
pub name: String,
|
|
||||||
/// The file path to the module. This is an absolute path.
|
|
||||||
pub path: PathBuf,
|
|
||||||
/// A unique ID for this module.
|
|
||||||
pub id: ModuleId,
|
|
||||||
}
|
|
||||||
|
|
||||||
impl std::hash::Hash for Module {
|
|
||||||
fn hash<H: std::hash::Hasher>(&self, state: &mut H) {
|
|
||||||
self.id.0.hash(state);
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
impl Module {
|
|
||||||
pub fn new<P: AsRef<Path>>(p: P) -> Result<Self, AssembleError> {
|
|
||||||
let path = p.as_ref().to_path_buf();
|
|
||||||
let name = Self::extract_module_name(&path)?;
|
|
||||||
let id = ModuleId::new();
|
|
||||||
|
|
||||||
Ok(Self { name, path, id })
|
|
||||||
}
|
|
||||||
|
|
||||||
/// Gets the name for a module from the path.
|
|
||||||
fn extract_module_name<P: AsRef<Path>>(path: P) -> Result<String, AssembleError> {
|
|
||||||
let extensions_regex = Regex::new(".(dsa|S|asm)$")
|
|
||||||
.expect("For some reason the regular expression failed to compile!");
|
|
||||||
let module_name = path
|
|
||||||
.as_ref()
|
|
||||||
.file_name()
|
|
||||||
.map(|f| f.to_string_lossy())
|
|
||||||
.ok_or_else(|| {
|
|
||||||
AssembleError::new_other_error(AssembleErrorKind::Io(IoError::new(
|
|
||||||
IoErrorKind::InvalidData,
|
|
||||||
Some(
|
|
||||||
"the filename couldn't be extracted, is it valid UTF-8?"
|
|
||||||
.to_string(),
|
|
||||||
),
|
|
||||||
)))
|
|
||||||
})?;
|
|
||||||
|
|
||||||
// Strip any file extensions given. We don't care for now.
|
|
||||||
let out = extensions_regex.replace(&module_name, "");
|
|
||||||
|
|
||||||
Ok(out.to_string())
|
|
||||||
}
|
|
||||||
}
|
|
||||||
@@ -1,44 +0,0 @@
|
|||||||
//! This module contains the code for the module registry. This is a singleton storing all
|
|
||||||
//! the modules being assembled.
|
|
||||||
|
|
||||||
use std::{collections::HashMap, sync::Arc};
|
|
||||||
|
|
||||||
use super::module::{Module, ModuleId};
|
|
||||||
|
|
||||||
/// Stores all the [`Module`]'s to be assembled.
|
|
||||||
pub struct ModuleRegistry {
|
|
||||||
modules: HashMap<ModuleId, Arc<Module>>,
|
|
||||||
}
|
|
||||||
|
|
||||||
impl Default for ModuleRegistry {
|
|
||||||
fn default() -> Self {
|
|
||||||
Self::new()
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
impl ModuleRegistry {
|
|
||||||
#[must_use]
|
|
||||||
pub fn new() -> Self {
|
|
||||||
Self {
|
|
||||||
modules: HashMap::new(),
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
/// Gets a [`Module`] by ID.
|
|
||||||
#[must_use]
|
|
||||||
pub fn get(&self, module_id: &ModuleId) -> Option<&Arc<Module>> {
|
|
||||||
self.modules.get(module_id)
|
|
||||||
}
|
|
||||||
|
|
||||||
/// Adds a [`Module`] and returns its [`ModuleId`].
|
|
||||||
pub fn add(&mut self, module: Arc<Module>) -> ModuleId {
|
|
||||||
let id = module.id;
|
|
||||||
self.modules.insert(id, module);
|
|
||||||
id
|
|
||||||
}
|
|
||||||
|
|
||||||
/// Returns an iterator of modules.
|
|
||||||
pub fn modules(&self) -> impl Iterator<Item = &Arc<Module>> {
|
|
||||||
self.modules.values()
|
|
||||||
}
|
|
||||||
}
|
|
||||||
@@ -1,165 +0,0 @@
|
|||||||
//! This module contains the definitions for a Symbol.
|
|
||||||
|
|
||||||
use std::collections::HashSet;
|
|
||||||
|
|
||||||
use uuid::Uuid;
|
|
||||||
|
|
||||||
use crate::{model::module::ModuleId, symtab::SymbolTable};
|
|
||||||
|
|
||||||
/// Tuple struct for type safety. Has methods for fetching symbols by ID.
|
|
||||||
#[derive(Debug, PartialEq, Eq, Hash, Copy, Clone)]
|
|
||||||
pub struct SymbolId(Uuid);
|
|
||||||
|
|
||||||
impl From<Symbol> for SymbolId {
|
|
||||||
fn from(sym: Symbol) -> Self {
|
|
||||||
sym.id
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
impl Default for SymbolId {
|
|
||||||
fn default() -> Self {
|
|
||||||
Self::new()
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
impl SymbolId {
|
|
||||||
#[must_use]
|
|
||||||
pub fn new() -> Self {
|
|
||||||
Self(Uuid::new_v4())
|
|
||||||
}
|
|
||||||
|
|
||||||
/// Convenience method to get the [`Module`] from a [`ModuleId`].
|
|
||||||
#[must_use]
|
|
||||||
pub fn to_module<'s>(&self, registry: &'s SymbolTable) -> Option<&'s Symbol> {
|
|
||||||
registry.get(self)
|
|
||||||
}
|
|
||||||
|
|
||||||
/// Convenience method to get the [`Module`] name from a [`ModuleId`].
|
|
||||||
#[must_use]
|
|
||||||
pub fn to_module_name(self, registry: &SymbolTable) -> Option<&str> {
|
|
||||||
self.to_module(registry).map(|module| module.name.as_str())
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
/// A symbol is a named reference that may be resolved later to an address by a linker.
|
|
||||||
#[derive(Debug)]
|
|
||||||
pub struct Symbol {
|
|
||||||
/// Stored cheaply instead of the name. Shall be stored in the symbol table under
|
|
||||||
/// this key.
|
|
||||||
pub id: SymbolId,
|
|
||||||
|
|
||||||
/// The human-readable name for the symbol.
|
|
||||||
pub name: String,
|
|
||||||
|
|
||||||
pub visibility: Visibility,
|
|
||||||
|
|
||||||
pub symbol_type: SymbolType,
|
|
||||||
|
|
||||||
/// The id of the module the symbol is defined in. This will be different for symbols
|
|
||||||
/// in different objects.
|
|
||||||
pub module_id: ModuleId,
|
|
||||||
|
|
||||||
/// Whether or not the symbol requires relocating.
|
|
||||||
pub needs_relocation: bool,
|
|
||||||
|
|
||||||
/// A list of the symbol's dependencies.
|
|
||||||
///
|
|
||||||
/// e.g.
|
|
||||||
///
|
|
||||||
/// ```dsa
|
|
||||||
/// main:
|
|
||||||
/// call another_func
|
|
||||||
///
|
|
||||||
/// another_func:
|
|
||||||
/// // Code goes here
|
|
||||||
/// ret
|
|
||||||
/// ```
|
|
||||||
///
|
|
||||||
/// Where `main` depends on `another_func`.
|
|
||||||
pub dependencies: HashSet<SymbolId>,
|
|
||||||
|
|
||||||
/// The address of the symbol.
|
|
||||||
pub address: Option<u32>,
|
|
||||||
/// The section the symbol is in.
|
|
||||||
/// TODO: Perhaps make this a proper type?
|
|
||||||
pub section: Option<String>,
|
|
||||||
pub size: Option<u32>,
|
|
||||||
}
|
|
||||||
|
|
||||||
impl Symbol {
|
|
||||||
#[must_use]
|
|
||||||
pub fn new(
|
|
||||||
name: String,
|
|
||||||
module_id: ModuleId,
|
|
||||||
visibility: Visibility,
|
|
||||||
symbol_type: SymbolType,
|
|
||||||
) -> Self {
|
|
||||||
Self {
|
|
||||||
id: SymbolId::new(),
|
|
||||||
name,
|
|
||||||
module_id,
|
|
||||||
address: None,
|
|
||||||
section: None,
|
|
||||||
size: None,
|
|
||||||
visibility,
|
|
||||||
symbol_type,
|
|
||||||
needs_relocation: false,
|
|
||||||
dependencies: HashSet::new(),
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
/// Adds a dependency on another [`Symbol`].
|
|
||||||
pub fn add_dependency(&mut self, dep: SymbolId) {
|
|
||||||
if self.id == dep {
|
|
||||||
return;
|
|
||||||
}
|
|
||||||
|
|
||||||
// We can resolve a lot of addresses at assembly time, but not really foreign
|
|
||||||
// ones, since we aren't certain of their position.
|
|
||||||
//
|
|
||||||
/* TODO: Handle this for flat binary case i.e. no linker required. This may be
|
|
||||||
* done using a similar method to before, such as just concatenating all
|
|
||||||
* of the files together and handling jumps and halts.
|
|
||||||
*
|
|
||||||
* > Ask Harry or read the initial code.
|
|
||||||
*/
|
|
||||||
if self.dependencies.insert(dep) {
|
|
||||||
self.needs_relocation = true;
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
/// Returns whether a [`Symbol`] depends on `symbol_id`.
|
|
||||||
#[must_use]
|
|
||||||
pub fn depends_on(&self, symbol_id: &SymbolId) -> bool {
|
|
||||||
self.dependencies.contains(symbol_id)
|
|
||||||
}
|
|
||||||
|
|
||||||
/// Removes a [`Symbol`] from the dependency set.
|
|
||||||
pub fn remove_dependency(&mut self, symbol_id: &SymbolId) {
|
|
||||||
self.dependencies.remove(symbol_id);
|
|
||||||
|
|
||||||
if self.dependencies.is_empty() {
|
|
||||||
self.needs_relocation = false;
|
|
||||||
}
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
#[derive(Debug, Copy, Clone)]
|
|
||||||
/// The visibility of the symbol in different object files.
|
|
||||||
pub enum Visibility {
|
|
||||||
/// `STB_PUBLIC` under the ELF spec. Visible in all other object files. Shall be used
|
|
||||||
/// for labels. Remember labels are namespaced in different files so they won't clash
|
|
||||||
/// with one another.
|
|
||||||
Public,
|
|
||||||
/// Only visible within this object file. `STB_LOCAL` under ELF spec. Shall be used
|
|
||||||
/// for data definitions unless they are marked public.
|
|
||||||
Local,
|
|
||||||
/// `STB_WEAK` under the ELF spec. Potentially unused.
|
|
||||||
Weak,
|
|
||||||
}
|
|
||||||
|
|
||||||
#[derive(Debug)]
|
|
||||||
pub enum SymbolType {
|
|
||||||
LabelOrFunction,
|
|
||||||
Variable,
|
|
||||||
}
|
|
||||||
@@ -1,29 +0,0 @@
|
|||||||
//! This module contains anything within the first stage of assembly, i.e. the
|
|
||||||
//! tokenisation stage, or utility functions for reading input files.
|
|
||||||
|
|
||||||
use std::{
|
|
||||||
io::{BufRead, Lines},
|
|
||||||
path::Path,
|
|
||||||
};
|
|
||||||
|
|
||||||
use crate::error::AssembleError;
|
|
||||||
|
|
||||||
pub mod lines;
|
|
||||||
pub mod opcode;
|
|
||||||
pub mod source_info;
|
|
||||||
pub mod token;
|
|
||||||
pub mod token_info;
|
|
||||||
pub mod tokeniser;
|
|
||||||
|
|
||||||
/// Attempts to load and open a source file, returning a [`Vec<u8>`] or an
|
|
||||||
/// [`AssembleError`].
|
|
||||||
pub fn load_source_bytes<P: AsRef<Path>>(p: P) -> Result<Vec<u8>, AssembleError> {
|
|
||||||
let path = p.as_ref();
|
|
||||||
|
|
||||||
Ok(std::fs::read(path)?)
|
|
||||||
}
|
|
||||||
|
|
||||||
/// Get the lines from a [`BufReader`].
|
|
||||||
pub fn reader_lines<R: BufRead>(rdr: R) -> Lines<R> {
|
|
||||||
rdr.lines()
|
|
||||||
}
|
|
||||||
@@ -1,76 +0,0 @@
|
|||||||
//! Enhanced lines iterator that tracks line numbers and character positions.
|
|
||||||
|
|
||||||
use std::io::{BufRead, BufReader, Cursor};
|
|
||||||
|
|
||||||
use crate::error::AssembleError;
|
|
||||||
|
|
||||||
/// Iterator that yields lines with their line numbers and character spans.
|
|
||||||
pub struct LinesWithSpans<R: BufRead> {
|
|
||||||
reader: R,
|
|
||||||
line_number: usize,
|
|
||||||
total_chars: usize,
|
|
||||||
buffer: String,
|
|
||||||
}
|
|
||||||
|
|
||||||
#[derive(Debug, Clone)]
|
|
||||||
pub struct LineSpan {
|
|
||||||
/// The line number.
|
|
||||||
pub line_number: usize,
|
|
||||||
/// The contents of the line.
|
|
||||||
pub content: String,
|
|
||||||
/// Character offset from start of file.
|
|
||||||
pub start_char: usize,
|
|
||||||
/// End character offset (exclusive).
|
|
||||||
pub end_char: usize,
|
|
||||||
}
|
|
||||||
|
|
||||||
impl<R: BufRead> LinesWithSpans<R> {
|
|
||||||
pub const fn new(reader: R) -> Self {
|
|
||||||
Self {
|
|
||||||
reader,
|
|
||||||
line_number: 0,
|
|
||||||
total_chars: 0,
|
|
||||||
buffer: String::new(),
|
|
||||||
}
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
impl<R: BufRead> Iterator for LinesWithSpans<R> {
|
|
||||||
type Item = Result<LineSpan, AssembleError>;
|
|
||||||
|
|
||||||
fn next(&mut self) -> Option<Self::Item> {
|
|
||||||
self.buffer.clear();
|
|
||||||
|
|
||||||
match self.reader.read_line(&mut self.buffer) {
|
|
||||||
Ok(0) => None, // EOF
|
|
||||||
Ok(bytes_read) => {
|
|
||||||
self.line_number += 1;
|
|
||||||
let start_char = self.total_chars;
|
|
||||||
self.total_chars += bytes_read;
|
|
||||||
|
|
||||||
// Remove trailing newline for cleaner processing
|
|
||||||
let content = if self.buffer.ends_with('\n') {
|
|
||||||
self.buffer[..self.buffer.len() - 1].to_string()
|
|
||||||
} else {
|
|
||||||
self.buffer.clone()
|
|
||||||
};
|
|
||||||
|
|
||||||
Some(Ok(LineSpan {
|
|
||||||
line_number: self.line_number,
|
|
||||||
content,
|
|
||||||
start_char,
|
|
||||||
end_char: self.total_chars,
|
|
||||||
}))
|
|
||||||
}
|
|
||||||
Err(e) => Some(Err(e.into())),
|
|
||||||
}
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
/// Helper function to create lines iterator from data.
|
|
||||||
#[must_use]
|
|
||||||
pub fn lines_with_spans(data: &[u8]) -> LinesWithSpans<BufReader<Cursor<&[u8]>>> {
|
|
||||||
let cursor = Cursor::new(data);
|
|
||||||
let reader = BufReader::new(cursor);
|
|
||||||
LinesWithSpans::new(reader)
|
|
||||||
}
|
|
||||||
@@ -1,4 +0,0 @@
|
|||||||
//! This module contains code for handling pseudo opcodes.
|
|
||||||
|
|
||||||
/// Pseudo instructions that cannot simply be lowered to ISA instructions.
|
|
||||||
pub enum PseudoOpcode {}
|
|
||||||
@@ -1,104 +0,0 @@
|
|||||||
//! This file contains information on where a [`Token`] or [`Node`] is within the source
|
|
||||||
//! code for more informative errors.
|
|
||||||
//!
|
|
||||||
//! This will likely be attached to a [`Token`] which will in turn be attached to an AST
|
|
||||||
//! [`Node`].
|
|
||||||
|
|
||||||
use std::{
|
|
||||||
fmt::{Display, Write},
|
|
||||||
fs::File,
|
|
||||||
io::BufReader,
|
|
||||||
sync::Arc,
|
|
||||||
};
|
|
||||||
|
|
||||||
use crate::{
|
|
||||||
error::{AssembleError, AssembleErrorKind, IoError, IoErrorKind},
|
|
||||||
model::module::Module,
|
|
||||||
source::lines::LinesWithSpans,
|
|
||||||
};
|
|
||||||
|
|
||||||
/// Information on where the token is within the source.
|
|
||||||
#[derive(Debug, Clone)]
|
|
||||||
pub struct SourceInfo {
|
|
||||||
/// The line number within the source file underpinned by `module_id`.
|
|
||||||
pub line_number: usize,
|
|
||||||
/// The [`Module`] the source code is associated with.
|
|
||||||
pub module: Arc<Module>,
|
|
||||||
/// The indexes where this token may be found (line-local).
|
|
||||||
pub span: std::ops::Range<usize>,
|
|
||||||
}
|
|
||||||
|
|
||||||
impl Display for SourceInfo {
|
|
||||||
fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
|
|
||||||
write!(
|
|
||||||
f,
|
|
||||||
"{}:{}:{}",
|
|
||||||
self.module.path.display(),
|
|
||||||
self.line_number,
|
|
||||||
self.span.start + 1
|
|
||||||
)
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
impl SourceInfo {
|
|
||||||
#[must_use]
|
|
||||||
pub const fn new(
|
|
||||||
line_no: usize,
|
|
||||||
module: Arc<Module>,
|
|
||||||
span: std::ops::Range<usize>,
|
|
||||||
) -> Self {
|
|
||||||
Self {
|
|
||||||
line_number: line_no,
|
|
||||||
module,
|
|
||||||
span,
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
/// Prints out where in the source code the error originated with an underline similar
|
|
||||||
/// to what rustc does.
|
|
||||||
pub fn print_context_with_underline(&self) -> Result<(), AssembleError> {
|
|
||||||
let f = File::open(&self.module.path)?;
|
|
||||||
let rdr = BufReader::new(f);
|
|
||||||
|
|
||||||
let mut lines = LinesWithSpans::new(rdr);
|
|
||||||
|
|
||||||
let Some(line_result) = lines.nth(self.line_number - 1) else {
|
|
||||||
// Handle a line not existing.
|
|
||||||
return Err(AssembleError::new_source_error(
|
|
||||||
self.clone(),
|
|
||||||
AssembleErrorKind::Io(IoError::new(
|
|
||||||
IoErrorKind::Other,
|
|
||||||
Some(format!(
|
|
||||||
"the line {} does not exist in input file `{}` but source info suggested otherwise!.",
|
|
||||||
self.line_number,
|
|
||||||
self.module.path.display()
|
|
||||||
)),
|
|
||||||
)),
|
|
||||||
));
|
|
||||||
};
|
|
||||||
|
|
||||||
let line_span = line_result?;
|
|
||||||
|
|
||||||
// Print the line number and line content.
|
|
||||||
println!("{:>4} | {}", self.line_number, line_span.content);
|
|
||||||
|
|
||||||
let mut pad_left = String::new();
|
|
||||||
write!(pad_left, "{:>4} ", "")?;
|
|
||||||
|
|
||||||
let mut underline = String::new();
|
|
||||||
|
|
||||||
for _ in 0..self.span.start {
|
|
||||||
pad_left.push(' ');
|
|
||||||
}
|
|
||||||
|
|
||||||
for _ in self.span.start..self.span.end.min(line_span.content.len()) {
|
|
||||||
underline.push('^');
|
|
||||||
}
|
|
||||||
|
|
||||||
// Print the underline in red and bold.
|
|
||||||
// TODO: Use a crate to make this extra portable.
|
|
||||||
println!("{pad_left}\x1b[1;31m{underline}\x1b[0m");
|
|
||||||
|
|
||||||
Ok(())
|
|
||||||
}
|
|
||||||
}
|
|
||||||
@@ -1,91 +0,0 @@
|
|||||||
//! Contains [`TokenType`] and [`Token`]'s. Adapted from Harry's old lexer since it was
|
|
||||||
//! easier to build from scratch and edit his code than it would be to try and wrangle it
|
|
||||||
//! into shape.
|
|
||||||
|
|
||||||
use common::prelude::*;
|
|
||||||
|
|
||||||
use crate::source::{
|
|
||||||
opcode::Opcode,
|
|
||||||
source_info::SourceInfo,
|
|
||||||
token_info::{DirectiveToken, LabelToken, RegisterToken, SymbolToken},
|
|
||||||
};
|
|
||||||
|
|
||||||
/// Represents the different types of tokens that can be produced by the tokeniser.
|
|
||||||
#[derive(Debug, Clone, PartialEq, Eq, Hash)]
|
|
||||||
pub enum TokenType {
|
|
||||||
/// Symbol reference (e.g., `loop_start`, `my_data`).
|
|
||||||
Symbol(SymbolToken),
|
|
||||||
/// CPU register (e.g., `r1`, `r2`, `sp`).
|
|
||||||
Register(RegisterToken),
|
|
||||||
/// Immediate value (e.g., `42`, `0xFF`).
|
|
||||||
Immediate(u32),
|
|
||||||
/// String literal (e.g., `"hello world"`).
|
|
||||||
String(String),
|
|
||||||
/// Intermediate token for multiline strings (filtered out in final output)
|
|
||||||
StringContinuation,
|
|
||||||
/// Assembly instruction (e.g., `add`, `jmp`, `nop`).
|
|
||||||
Instruction(Opcode),
|
|
||||||
/// Label definition (e.g., `loop_start:`).
|
|
||||||
Label(LabelToken),
|
|
||||||
/// Assembler directive (e.g., `.global`, `.section`, `.dw`).
|
|
||||||
Directive(DirectiveToken),
|
|
||||||
/// Comment (e.g., `// this is a comment`).
|
|
||||||
Comment,
|
|
||||||
/// Comma separator.
|
|
||||||
Comma,
|
|
||||||
/// End of line.
|
|
||||||
Newline,
|
|
||||||
/// End of file.
|
|
||||||
Eof,
|
|
||||||
}
|
|
||||||
|
|
||||||
#[derive(Debug)]
|
|
||||||
pub struct Token {
|
|
||||||
/// The type of the token.
|
|
||||||
pub token_type: TokenType,
|
|
||||||
/// Where in the source code is this [`Token`]?
|
|
||||||
pub source_info: SourceInfo,
|
|
||||||
}
|
|
||||||
|
|
||||||
impl Token {
|
|
||||||
#[must_use]
|
|
||||||
pub const fn new(token_type: TokenType, source_info: SourceInfo) -> Self {
|
|
||||||
Self {
|
|
||||||
token_type,
|
|
||||||
source_info,
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
#[must_use]
|
|
||||||
pub const fn symbol(name: String, source_info: SourceInfo) -> Self {
|
|
||||||
Self::new(TokenType::Symbol(SymbolToken { name }), source_info)
|
|
||||||
}
|
|
||||||
|
|
||||||
#[must_use]
|
|
||||||
pub const fn label(name: String, source_info: SourceInfo) -> Self {
|
|
||||||
Self::new(TokenType::Label(LabelToken { name }), source_info)
|
|
||||||
}
|
|
||||||
|
|
||||||
#[must_use]
|
|
||||||
pub const fn instruction(op: Opcode, source_info: SourceInfo) -> Self {
|
|
||||||
Self::new(TokenType::Instruction(op), source_info)
|
|
||||||
}
|
|
||||||
|
|
||||||
#[must_use]
|
|
||||||
pub const fn register(reg: Register, source_info: SourceInfo) -> Self {
|
|
||||||
Self::new(TokenType::Register(RegisterToken { reg }), source_info)
|
|
||||||
}
|
|
||||||
|
|
||||||
#[must_use]
|
|
||||||
pub const fn immediate(value: u32, source_info: SourceInfo) -> Self {
|
|
||||||
Self::new(TokenType::Immediate(value), source_info)
|
|
||||||
}
|
|
||||||
|
|
||||||
#[must_use]
|
|
||||||
pub const fn directive(directive: String, source_info: SourceInfo) -> Self {
|
|
||||||
Self::new(
|
|
||||||
TokenType::Directive(DirectiveToken { directive }),
|
|
||||||
source_info,
|
|
||||||
)
|
|
||||||
}
|
|
||||||
}
|
|
||||||
@@ -1,34 +0,0 @@
|
|||||||
use common::prelude::Register;
|
|
||||||
|
|
||||||
#[derive(Debug, Clone, PartialEq, Eq, Hash)]
|
|
||||||
pub struct SymbolToken {
|
|
||||||
pub name: String,
|
|
||||||
}
|
|
||||||
|
|
||||||
#[derive(Debug, Clone, PartialEq, Eq, Hash)]
|
|
||||||
pub struct LabelToken {
|
|
||||||
pub name: String,
|
|
||||||
}
|
|
||||||
|
|
||||||
#[derive(Debug, Clone, PartialEq, Eq, Hash)]
|
|
||||||
pub struct DirectiveToken {
|
|
||||||
pub directive: String,
|
|
||||||
}
|
|
||||||
|
|
||||||
#[derive(Debug, Clone, PartialEq, Eq, Hash)]
|
|
||||||
pub struct RegisterToken {
|
|
||||||
pub reg: Register,
|
|
||||||
}
|
|
||||||
|
|
||||||
impl RegisterToken {
|
|
||||||
#[must_use]
|
|
||||||
pub const fn new(reg: Register) -> Self {
|
|
||||||
Self { reg }
|
|
||||||
}
|
|
||||||
|
|
||||||
/// Returns the name of a valid [`Register`]
|
|
||||||
#[must_use]
|
|
||||||
pub fn name(&self) -> String {
|
|
||||||
self.reg.to_string()
|
|
||||||
}
|
|
||||||
}
|
|
||||||
@@ -1,421 +0,0 @@
|
|||||||
//! This file contains the [`Tokeniser`], which consumes a [`Vec`] of input bytes and
|
|
||||||
//! outputs a [`Vec<Token>`].
|
|
||||||
|
|
||||||
use std::{path::Path, str::FromStr, sync::Arc};
|
|
||||||
|
|
||||||
use regex::Regex;
|
|
||||||
|
|
||||||
use common::prelude::*;
|
|
||||||
|
|
||||||
use crate::{
|
|
||||||
context::AssemblerContext,
|
|
||||||
error::{AssembleError, AssembleErrorKind},
|
|
||||||
model::module::Module,
|
|
||||||
source::{
|
|
||||||
lines::{LineSpan, lines_with_spans},
|
|
||||||
load_source_bytes,
|
|
||||||
opcode::Opcode,
|
|
||||||
source_info::SourceInfo,
|
|
||||||
token::{Token, TokenType},
|
|
||||||
token_info::{DirectiveToken, LabelToken, RegisterToken, SymbolToken},
|
|
||||||
tokeniser::error::TokeniserError,
|
|
||||||
},
|
|
||||||
};
|
|
||||||
|
|
||||||
pub mod error;
|
|
||||||
#[cfg(test)]
|
|
||||||
mod tests;
|
|
||||||
|
|
||||||
/// Consumes a [`Vec<u8>`] and outputs a [`Vec`] of [Token]'s.
|
|
||||||
pub struct Tokeniser {
|
|
||||||
/// The data in the file.
|
|
||||||
pub data: Vec<u8>,
|
|
||||||
/// A copy of the Module in which the file is situated.
|
|
||||||
pub module: Arc<Module>,
|
|
||||||
|
|
||||||
// Pre-compiled regex patterns
|
|
||||||
label_regex: Regex,
|
|
||||||
register_regex: Regex,
|
|
||||||
immediate_regex: Regex,
|
|
||||||
directive_regex: Regex,
|
|
||||||
instruction_regex: Regex,
|
|
||||||
symbol_regex: Regex,
|
|
||||||
comment_regex: Regex,
|
|
||||||
|
|
||||||
// String parsing state
|
|
||||||
in_string: bool,
|
|
||||||
string_buffer: String,
|
|
||||||
string_start_line: usize,
|
|
||||||
string_start_column: usize,
|
|
||||||
}
|
|
||||||
|
|
||||||
impl Tokeniser {
|
|
||||||
#[must_use]
|
|
||||||
pub fn from_data(data: Vec<u8>, module: Arc<Module>) -> Self {
|
|
||||||
Self {
|
|
||||||
data,
|
|
||||||
module,
|
|
||||||
label_regex: Regex::new(r"^([a-zA-Z_][a-zA-Z0-9_]*):")
|
|
||||||
.expect("Failed to compile label regex pattern"),
|
|
||||||
register_regex: Regex::new(
|
|
||||||
r"^(rg[0-9a-f]+|acc|spr|bpr|ret|idr|mmr|zero|noreg|pcx)\b",
|
|
||||||
)
|
|
||||||
.expect("Failed to compile register regex pattern"),
|
|
||||||
immediate_regex: Regex::new(
|
|
||||||
r"^(0x[0-9a-fA-F_]+|0b[0-1_]+|0o[0-7_]+|[0-9_]+)",
|
|
||||||
)
|
|
||||||
.expect("Failed to compile immediate regex pattern"),
|
|
||||||
directive_regex: Regex::new(r"^(res[bwh]|d[bwh]|include|section|global|local)\b")
|
|
||||||
.expect("Failed to compile directive regex pattern"),
|
|
||||||
instruction_regex: Regex::new(
|
|
||||||
r"^(nop|movs?|ld[bhw]s?|st[bhw]|l[lu]i|j(mp|[egl][qte])|cmp|[id]nc|sh[lr]|add[i]?|sub[i]?|x?n?or|and|not|i[rd]t|hlt|lhwmm|lidt|push[a]?|pop[a]?|lwi|return|call)\b",
|
|
||||||
)
|
|
||||||
.expect("Failed to compile instruction regex pattern"),
|
|
||||||
symbol_regex: Regex::new(r"^([a-zA-Z_][a-zA-Z0-9_]*)::{2}([a-zA-Z0-9_]*)|([a-zA-Z_][a-zA-Z0-9_]*)")
|
|
||||||
.expect("Failed to compile symbol regex pattern"),
|
|
||||||
comment_regex: Regex::new("^//.*")
|
|
||||||
.expect("Failed to compile comment regex pattern"),
|
|
||||||
|
|
||||||
// Initialize string parsing state
|
|
||||||
in_string: false,
|
|
||||||
string_buffer: String::new(),
|
|
||||||
string_start_line: 0,
|
|
||||||
string_start_column: 0,
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
/// Creates a [`Tokeniser`] from a file path. Also creates the underlying [`Module`]
|
|
||||||
/// for you.
|
|
||||||
pub fn new<P: AsRef<Path>>(
|
|
||||||
path: P,
|
|
||||||
ctx: &AssemblerContext,
|
|
||||||
) -> Result<Self, AssembleError> {
|
|
||||||
let path = path.as_ref().to_path_buf();
|
|
||||||
let data = load_source_bytes(&path)?;
|
|
||||||
let module = Arc::new(Module::new(path)?);
|
|
||||||
|
|
||||||
{
|
|
||||||
let mut module_registry = ctx.module_registry.write()?;
|
|
||||||
module_registry.add(module.clone());
|
|
||||||
}
|
|
||||||
|
|
||||||
Ok(Self::from_data(data, module))
|
|
||||||
}
|
|
||||||
|
|
||||||
// Note that modules are tokenised in their own threads, possibly in parallel.
|
|
||||||
pub fn tokenise(mut self) -> Result<Vec<Token>, AssembleError> {
|
|
||||||
let mut token_stream = Vec::new();
|
|
||||||
let data = self.data.clone();
|
|
||||||
let lines = lines_with_spans(&data);
|
|
||||||
|
|
||||||
// Process each line
|
|
||||||
for line_result in lines {
|
|
||||||
let line_span = line_result?;
|
|
||||||
let trimmed = line_span.content.trim();
|
|
||||||
|
|
||||||
// Skip empty lines and add newline tokens
|
|
||||||
if trimmed.is_empty() {
|
|
||||||
token_stream.push(Token::new(
|
|
||||||
TokenType::Newline,
|
|
||||||
SourceInfo::new(line_span.line_number, self.module.clone(), 0..1),
|
|
||||||
));
|
|
||||||
continue;
|
|
||||||
}
|
|
||||||
|
|
||||||
// Actually tokenise the line content
|
|
||||||
let line_tokens = self.tokenise_line(&line_span)?;
|
|
||||||
token_stream.extend(line_tokens);
|
|
||||||
|
|
||||||
// Add newline token at end of line
|
|
||||||
token_stream.push(Token::new(
|
|
||||||
TokenType::Newline,
|
|
||||||
SourceInfo::new(
|
|
||||||
line_span.line_number,
|
|
||||||
self.module.clone(),
|
|
||||||
line_span.content.len()..line_span.content.len(),
|
|
||||||
),
|
|
||||||
));
|
|
||||||
}
|
|
||||||
|
|
||||||
// Add EOF token
|
|
||||||
token_stream.push(Token::new(
|
|
||||||
TokenType::Eof,
|
|
||||||
SourceInfo::new(0, self.module.clone(), 0..0),
|
|
||||||
));
|
|
||||||
|
|
||||||
Ok(token_stream)
|
|
||||||
}
|
|
||||||
|
|
||||||
fn tokenise_line(
|
|
||||||
&mut self,
|
|
||||||
line_span: &LineSpan,
|
|
||||||
) -> Result<Vec<Token>, AssembleError> {
|
|
||||||
let mut tokens = Vec::new();
|
|
||||||
let mut remaining = line_span.content.as_str();
|
|
||||||
let mut column = 0;
|
|
||||||
|
|
||||||
// Skip leading whitespace
|
|
||||||
let trimmed_start = remaining.trim_start();
|
|
||||||
column += remaining.len() - trimmed_start.len();
|
|
||||||
remaining = trimmed_start;
|
|
||||||
|
|
||||||
while !remaining.is_empty() {
|
|
||||||
let start_column = column;
|
|
||||||
|
|
||||||
// Try to match a token.
|
|
||||||
let (token_type, consumed) =
|
|
||||||
self.match_token(remaining, line_span.line_number, column)?;
|
|
||||||
|
|
||||||
// Filter out string continuation tokens and comments.
|
|
||||||
match token_type {
|
|
||||||
TokenType::StringContinuation => {
|
|
||||||
// Don't add to token stream, just consume input
|
|
||||||
}
|
|
||||||
TokenType::Comment => {
|
|
||||||
// Don't add to token stream, consume rest of line
|
|
||||||
break;
|
|
||||||
}
|
|
||||||
_ => {
|
|
||||||
tokens.push(Token::new(
|
|
||||||
token_type,
|
|
||||||
SourceInfo::new(
|
|
||||||
line_span.line_number,
|
|
||||||
self.module.clone(),
|
|
||||||
start_column..start_column + consumed,
|
|
||||||
),
|
|
||||||
));
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
// Advance position.
|
|
||||||
remaining = &remaining[consumed..];
|
|
||||||
column += consumed;
|
|
||||||
|
|
||||||
// Skip whitespace.
|
|
||||||
let before_trim = remaining.len();
|
|
||||||
remaining = remaining.trim_start();
|
|
||||||
column += before_trim - remaining.len();
|
|
||||||
}
|
|
||||||
|
|
||||||
Ok(tokens)
|
|
||||||
}
|
|
||||||
|
|
||||||
fn try_match_comment(&self, input: &str) -> Option<(TokenType, usize)> {
|
|
||||||
let caps = self.comment_regex.captures(input)?;
|
|
||||||
let len = caps.get(0)?.len();
|
|
||||||
|
|
||||||
Some((TokenType::Comment, len))
|
|
||||||
}
|
|
||||||
|
|
||||||
fn try_match_label(&self, input: &str) -> Option<(TokenType, usize)> {
|
|
||||||
let caps = self.label_regex.captures(input)?;
|
|
||||||
let name = caps.get(1)?.as_str().to_string();
|
|
||||||
let len = caps.get(0)?.len();
|
|
||||||
|
|
||||||
Some((TokenType::Label(LabelToken { name }), len))
|
|
||||||
}
|
|
||||||
|
|
||||||
fn try_match_register(&self, input: &str) -> Option<(TokenType, usize)> {
|
|
||||||
let caps = self.register_regex.captures(input)?;
|
|
||||||
|
|
||||||
let captured_group = caps.get(1)?.as_str();
|
|
||||||
let len = caps.get(0)?.len();
|
|
||||||
|
|
||||||
let reg = Register::try_from(captured_group).ok()?;
|
|
||||||
|
|
||||||
Some((TokenType::Register(RegisterToken { reg }), len))
|
|
||||||
}
|
|
||||||
|
|
||||||
fn try_match_immediate(&self, input: &str) -> Option<(TokenType, usize)> {
|
|
||||||
let caps = self.immediate_regex.captures(input)?;
|
|
||||||
let value_str = caps.get(1)?.as_str();
|
|
||||||
let len = caps.get(0)?.len();
|
|
||||||
|
|
||||||
// Remove any underscores that were inserted for readability.
|
|
||||||
let value_str = value_str.replace('_', "");
|
|
||||||
|
|
||||||
let value = if let Some(hex_part) = value_str.strip_prefix("0x") {
|
|
||||||
u32::from_str_radix(hex_part, 16).ok()?
|
|
||||||
} else if let Some(bin_part) = value_str.strip_prefix("0b") {
|
|
||||||
u32::from_str_radix(bin_part, 2).ok()?
|
|
||||||
} else if let Some(oct_part) = value_str.strip_prefix("0o") {
|
|
||||||
u32::from_str_radix(oct_part, 8).ok()?
|
|
||||||
} else {
|
|
||||||
value_str.parse::<u32>().ok()?
|
|
||||||
};
|
|
||||||
|
|
||||||
Some((TokenType::Immediate(value), len))
|
|
||||||
}
|
|
||||||
|
|
||||||
fn try_match_directive(&self, input: &str) -> Option<(TokenType, usize)> {
|
|
||||||
let caps = self.directive_regex.captures(input)?;
|
|
||||||
let directive = caps.get(1)?.as_str().to_string();
|
|
||||||
let len = caps.get(0)?.len();
|
|
||||||
|
|
||||||
Some((TokenType::Directive(DirectiveToken { directive }), len))
|
|
||||||
}
|
|
||||||
|
|
||||||
fn try_match_instruction(&self, input: &str) -> Option<(TokenType, usize)> {
|
|
||||||
let caps = self.instruction_regex.captures(input)?;
|
|
||||||
let mnemonic = caps.get(1)?.as_str().to_string();
|
|
||||||
let len = caps.get(0)?.len();
|
|
||||||
|
|
||||||
let op = Opcode::from_str(&mnemonic).ok()?;
|
|
||||||
|
|
||||||
Some((TokenType::Instruction(op), len))
|
|
||||||
}
|
|
||||||
|
|
||||||
fn try_match_symbol(&self, input: &str) -> Option<(TokenType, usize)> {
|
|
||||||
let caps = self.symbol_regex.captures(input)?;
|
|
||||||
let len = caps.get(0)?.len();
|
|
||||||
|
|
||||||
// Check which capture group matched.
|
|
||||||
let name = if let Some(scoped_name) = caps.get(1) {
|
|
||||||
// Matched the scoped symbol pattern (name::scope).
|
|
||||||
format!("{}::{}", scoped_name.as_str(), caps.get(2)?.as_str())
|
|
||||||
} else if let Some(simple_name) = caps.get(3) {
|
|
||||||
simple_name.as_str().to_string()
|
|
||||||
} else {
|
|
||||||
return None;
|
|
||||||
};
|
|
||||||
|
|
||||||
Some((TokenType::Symbol(SymbolToken { name }), len))
|
|
||||||
}
|
|
||||||
|
|
||||||
fn try_match_string(
|
|
||||||
&mut self,
|
|
||||||
input: &str,
|
|
||||||
line_number: usize,
|
|
||||||
column: usize,
|
|
||||||
) -> Option<(TokenType, usize)> {
|
|
||||||
if self.in_string {
|
|
||||||
// We're continuing a multiline string
|
|
||||||
Some(self.handle_string_continuation(input, line_number, column))
|
|
||||||
} else {
|
|
||||||
// Look for the start of a new string
|
|
||||||
self.handle_string_start(input, line_number, column)
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
fn handle_string_start(
|
|
||||||
&mut self,
|
|
||||||
input: &str,
|
|
||||||
line_number: usize,
|
|
||||||
column: usize,
|
|
||||||
) -> Option<(TokenType, usize)> {
|
|
||||||
if !input.starts_with('"') {
|
|
||||||
return None;
|
|
||||||
}
|
|
||||||
|
|
||||||
// Find the closing quote on the same line
|
|
||||||
if let Some(end_pos) = input[1..].find('"') {
|
|
||||||
// Complete string on one line
|
|
||||||
let content = input[1..=end_pos].to_string();
|
|
||||||
let len = end_pos + 2; // +2 for both quotes
|
|
||||||
Some((TokenType::String(content), len))
|
|
||||||
} else {
|
|
||||||
// Start of multiline string
|
|
||||||
self.in_string = true;
|
|
||||||
self.string_start_line = line_number;
|
|
||||||
self.string_start_column = column;
|
|
||||||
self.string_buffer = input[1..].to_string(); // Everything after opening quote
|
|
||||||
self.string_buffer.push('\n'); // Add newline for multiline
|
|
||||||
|
|
||||||
// Consume the entire rest of the line
|
|
||||||
Some((TokenType::StringContinuation, input.len()))
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
fn handle_string_continuation(
|
|
||||||
&mut self,
|
|
||||||
input: &str,
|
|
||||||
_line_number: usize,
|
|
||||||
_column: usize,
|
|
||||||
) -> (TokenType, usize) {
|
|
||||||
// Look for closing quote
|
|
||||||
if let Some(end_pos) = input.find('"') {
|
|
||||||
// End of multiline string found
|
|
||||||
self.string_buffer.push_str(&input[..end_pos]);
|
|
||||||
self.in_string = false;
|
|
||||||
|
|
||||||
let content = std::mem::take(&mut self.string_buffer);
|
|
||||||
let len = end_pos + 1; // +1 for the closing quote
|
|
||||||
|
|
||||||
(TokenType::String(content), len)
|
|
||||||
} else {
|
|
||||||
// Continue multiline string
|
|
||||||
self.string_buffer.push_str(input);
|
|
||||||
self.string_buffer.push('\n'); // Add newline
|
|
||||||
|
|
||||||
// Consume the entire line
|
|
||||||
(TokenType::StringContinuation, input.len())
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
#[expect(clippy::range_plus_one, reason = "RangeInclusive is a different type!")]
|
|
||||||
fn match_token(
|
|
||||||
&mut self,
|
|
||||||
input: &str,
|
|
||||||
line_number: usize,
|
|
||||||
column: usize,
|
|
||||||
) -> Result<(TokenType, usize), AssembleError> {
|
|
||||||
if input.starts_with(',') {
|
|
||||||
return Ok((TokenType::Comma, 1));
|
|
||||||
}
|
|
||||||
|
|
||||||
// Check for string first (including multiline continuations).
|
|
||||||
if let Some(m) = self.try_match_string(input, line_number, column) {
|
|
||||||
return Ok(m);
|
|
||||||
}
|
|
||||||
|
|
||||||
if let Some(m) = self.try_match_directive(input) {
|
|
||||||
return Ok(m);
|
|
||||||
}
|
|
||||||
|
|
||||||
if let Some(m) = self.try_match_instruction(input) {
|
|
||||||
return Ok(m);
|
|
||||||
}
|
|
||||||
|
|
||||||
if let Some(m) = self.try_match_comment(input) {
|
|
||||||
return Ok(m);
|
|
||||||
}
|
|
||||||
|
|
||||||
if let Some(m) = self.try_match_label(input) {
|
|
||||||
return Ok(m);
|
|
||||||
}
|
|
||||||
|
|
||||||
if let Some(m) = self.try_match_register(input) {
|
|
||||||
return Ok(m);
|
|
||||||
}
|
|
||||||
|
|
||||||
if let Some(m) = self.try_match_immediate(input) {
|
|
||||||
return Ok(m);
|
|
||||||
}
|
|
||||||
|
|
||||||
if let Some(m) = self.try_match_symbol(input) {
|
|
||||||
return Ok(m);
|
|
||||||
}
|
|
||||||
|
|
||||||
let mut idx_iter = (column + 1)..;
|
|
||||||
let Some(idx) = idx_iter.next() else {
|
|
||||||
unreachable!()
|
|
||||||
};
|
|
||||||
|
|
||||||
let source = SourceInfo::new(line_number, self.module.clone(), idx..idx + 1);
|
|
||||||
|
|
||||||
// Handle miscellaneous characters.
|
|
||||||
if let Some(c) = input.chars().next() {
|
|
||||||
Err(AssembleError::new_source_error(
|
|
||||||
source,
|
|
||||||
AssembleErrorKind::Tokeniser(TokeniserError::UnexpectedChar(c)),
|
|
||||||
))
|
|
||||||
} else {
|
|
||||||
Err(AssembleError::new_source_error(
|
|
||||||
source,
|
|
||||||
AssembleErrorKind::Tokeniser(TokeniserError::UnexpectedEndOfInput(
|
|
||||||
input.len(),
|
|
||||||
)),
|
|
||||||
))
|
|
||||||
}
|
|
||||||
}
|
|
||||||
}
|
|
||||||
@@ -1,41 +0,0 @@
|
|||||||
//! This module contains the error types for the tokeniser.
|
|
||||||
|
|
||||||
#[derive(Debug, Clone, Copy)]
|
|
||||||
/// Types of errors that may be returned during tokenisation.
|
|
||||||
pub enum TokeniserError {
|
|
||||||
/// An unexpected character was found in the source code.
|
|
||||||
UnexpectedChar(char),
|
|
||||||
/// An unterminated string literal was found. [`SourceInfo`] will be attached if this
|
|
||||||
/// was returned.
|
|
||||||
UnterminatedString,
|
|
||||||
/// An invalid number format was encountered when parsing a literal value
|
|
||||||
/// ([`TokenType::Immediate`]).
|
|
||||||
InvalidNumber(&'static str),
|
|
||||||
/// An unrecognized token was encountered.
|
|
||||||
UnrecognisedToken,
|
|
||||||
/// Returned if the consumed count was lower than the length of the input file.
|
|
||||||
/// This is a sign you will need to debug some [`Tokeniser`] code to ensure that
|
|
||||||
/// [`Tokeniser::match_token`] is working as intended.
|
|
||||||
///
|
|
||||||
/// First field is length of the line.
|
|
||||||
UnexpectedEndOfInput(usize),
|
|
||||||
}
|
|
||||||
|
|
||||||
impl TokeniserError {}
|
|
||||||
|
|
||||||
impl std::fmt::Display for TokeniserError {
|
|
||||||
#[rustfmt::skip]
|
|
||||||
fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
|
|
||||||
match self {
|
|
||||||
Self::UnexpectedChar(c) => write!(f, "unexpected char '{c}' found in input")?,
|
|
||||||
Self::InvalidNumber(lit) => write!(f, "invalid integer literal \"{lit}\" found in input")?,
|
|
||||||
Self::UnrecognisedToken => write!(f, "unrecognised token found in input")?,
|
|
||||||
Self::UnterminatedString => write!(f, "unterminated string literal")?,
|
|
||||||
Self::UnexpectedEndOfInput(line_length) => write!(
|
|
||||||
f, "unexpected end of input, input length: {line_length}"
|
|
||||||
)?,
|
|
||||||
}
|
|
||||||
|
|
||||||
Ok(())
|
|
||||||
}
|
|
||||||
}
|
|
||||||
@@ -1,418 +0,0 @@
|
|||||||
//! Unit tests for the tokenizer
|
|
||||||
|
|
||||||
use common::prelude::Register;
|
|
||||||
|
|
||||||
use crate::{
|
|
||||||
model::module::Module,
|
|
||||||
source::{
|
|
||||||
opcode::Opcode,
|
|
||||||
token::{Token, TokenType},
|
|
||||||
token_info::RegisterToken,
|
|
||||||
tokeniser::Tokeniser,
|
|
||||||
},
|
|
||||||
};
|
|
||||||
use std::{path::PathBuf, sync::Arc};
|
|
||||||
|
|
||||||
/// Helper function to create a tokenizer from source text
|
|
||||||
fn create_tokenizer_from_source(source: &str) -> Tokeniser {
|
|
||||||
let path = PathBuf::from("test.dsa");
|
|
||||||
let module = Module::new(path).expect("Cannot create module!");
|
|
||||||
|
|
||||||
Tokeniser::from_data(source.as_bytes().to_vec(), Arc::new(module))
|
|
||||||
}
|
|
||||||
|
|
||||||
/// Helper function to tokenize source and return tokens
|
|
||||||
fn tokenize_source(source: &str) -> Result<Vec<Token>, crate::error::AssembleError> {
|
|
||||||
let tokenizer = create_tokenizer_from_source(source);
|
|
||||||
|
|
||||||
tokenizer.tokenise()
|
|
||||||
}
|
|
||||||
|
|
||||||
/// Helper function to extract token types from a token vector
|
|
||||||
fn extract_token_types(tokens: &[Token]) -> Vec<&TokenType> {
|
|
||||||
tokens.iter().map(|t| &t.token_type).collect()
|
|
||||||
}
|
|
||||||
|
|
||||||
#[test]
|
|
||||||
fn test_empty_source() {
|
|
||||||
let tokens = tokenize_source("").expect("Failed to tokenize empty source");
|
|
||||||
|
|
||||||
// Should have at least EOF token
|
|
||||||
assert!(!tokens.is_empty());
|
|
||||||
assert!(matches!(
|
|
||||||
tokens
|
|
||||||
.last()
|
|
||||||
.expect("Expected at least one token")
|
|
||||||
.token_type,
|
|
||||||
TokenType::Eof
|
|
||||||
));
|
|
||||||
}
|
|
||||||
|
|
||||||
#[test]
|
|
||||||
fn test_whitespace_only() {
|
|
||||||
let tokens = tokenize_source(" \n \n ").expect("Failed to tokenize whitespace");
|
|
||||||
|
|
||||||
// Should have newlines and EOF
|
|
||||||
let token_types = extract_token_types(&tokens);
|
|
||||||
assert!(token_types.iter().any(|t| matches!(t, TokenType::Newline)));
|
|
||||||
assert!(token_types.iter().any(|t| matches!(t, TokenType::Eof)));
|
|
||||||
}
|
|
||||||
|
|
||||||
#[test]
|
|
||||||
fn test_single_instruction() {
|
|
||||||
let tokens = tokenize_source("add").expect("Failed to tokenize instruction");
|
|
||||||
let token_types = extract_token_types(&tokens);
|
|
||||||
|
|
||||||
// Should have instruction, newline, and EOF
|
|
||||||
assert!(
|
|
||||||
token_types
|
|
||||||
.iter()
|
|
||||||
.any(|t| matches!(t, TokenType::Instruction(_)))
|
|
||||||
);
|
|
||||||
if let TokenType::Instruction(instr) = &tokens[0].token_type {
|
|
||||||
assert_eq!(instr.to_string(), "add");
|
|
||||||
} else {
|
|
||||||
panic!("Expected instruction token");
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
#[test]
|
|
||||||
fn test_all_instructions() {
|
|
||||||
let instructions = ["add", "sub", "jmp", "call", "return", "lli", "nop", "hlt"];
|
|
||||||
|
|
||||||
for instr in &instructions {
|
|
||||||
let tokens = tokenize_source(instr).expect("Failed to tokenize instruction");
|
|
||||||
|
|
||||||
if let TokenType::Instruction(parsed_instr) = &tokens[0].token_type {
|
|
||||||
assert_eq!(parsed_instr.to_string(), *instr);
|
|
||||||
} else {
|
|
||||||
panic!("Expected instruction token for {instr}");
|
|
||||||
}
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
#[test]
|
|
||||||
fn test_registers() {
|
|
||||||
let test_cases = [("rg0", "rg0"), ("rgf", "rgf"), ("pcx", "pcx")];
|
|
||||||
|
|
||||||
for (input, expected) in &test_cases {
|
|
||||||
let tokens = tokenize_source(input).expect("Failed to tokenize register");
|
|
||||||
|
|
||||||
if let TokenType::Register(reg) = &tokens[0].token_type {
|
|
||||||
assert_eq!(reg.reg.to_string(), *expected);
|
|
||||||
} else {
|
|
||||||
panic!("Expected register token for {input}");
|
|
||||||
}
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
#[test]
|
|
||||||
fn test_immediates() {
|
|
||||||
let test_cases = [
|
|
||||||
("42", 42),
|
|
||||||
("0", 0),
|
|
||||||
("0xFF", 255),
|
|
||||||
("0x1234", 0x1234),
|
|
||||||
("0xDEADBEEF", 0xDEAD_BEEF),
|
|
||||||
("0o12", 0o12),
|
|
||||||
("0b101", 0b101),
|
|
||||||
];
|
|
||||||
|
|
||||||
for (input, expected) in &test_cases {
|
|
||||||
let tokens = tokenize_source(input).expect("Failed to tokenize immediate");
|
|
||||||
|
|
||||||
if let TokenType::Immediate(value) = &tokens[0].token_type {
|
|
||||||
assert_eq!(*value, *expected);
|
|
||||||
} else {
|
|
||||||
panic!("Expected immediate token for {input}");
|
|
||||||
}
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
#[test]
|
|
||||||
fn test_labels() {
|
|
||||||
let test_cases = [
|
|
||||||
("loop_start:", "loop_start"),
|
|
||||||
("main:", "main"),
|
|
||||||
("_private_label:", "_private_label"),
|
|
||||||
("Label123:", "Label123"),
|
|
||||||
];
|
|
||||||
|
|
||||||
for (input, expected) in &test_cases {
|
|
||||||
let tokens = tokenize_source(input).expect("Failed to tokenize label");
|
|
||||||
|
|
||||||
if let TokenType::Label(label) = &tokens[0].token_type {
|
|
||||||
assert_eq!(label.name, *expected);
|
|
||||||
} else {
|
|
||||||
panic!("Expected label token for {input}");
|
|
||||||
}
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
#[test]
|
|
||||||
fn test_directives() {
|
|
||||||
let test_cases = [
|
|
||||||
("global", "global"),
|
|
||||||
("section", "section"),
|
|
||||||
("local", "local"),
|
|
||||||
];
|
|
||||||
|
|
||||||
for (input, expected) in &test_cases {
|
|
||||||
let tokens = tokenize_source(input).expect("Failed to tokenize directive");
|
|
||||||
|
|
||||||
if let TokenType::Directive(directive) = &tokens[0].token_type {
|
|
||||||
assert_eq!(directive.directive, *expected);
|
|
||||||
} else {
|
|
||||||
panic!("Expected directive token for {input}");
|
|
||||||
}
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
#[test]
|
|
||||||
fn test_symbols() {
|
|
||||||
let test_cases = [
|
|
||||||
("my_symbol", "my_symbol"),
|
|
||||||
("_private", "_private"),
|
|
||||||
("Symbol123", "Symbol123"),
|
|
||||||
("camelCase", "camelCase"),
|
|
||||||
];
|
|
||||||
|
|
||||||
for (input, expected) in &test_cases {
|
|
||||||
let tokens = tokenize_source(input).expect("Failed to tokenize symbol");
|
|
||||||
|
|
||||||
if let TokenType::Symbol(symbol) = &tokens[0].token_type {
|
|
||||||
assert_eq!(symbol.name, *expected);
|
|
||||||
} else {
|
|
||||||
panic!("Expected symbol token for {input}");
|
|
||||||
}
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
#[test]
|
|
||||||
fn test_complex_instruction_line() {
|
|
||||||
let source = "addi rg1, rg2, 0xFF";
|
|
||||||
let tokens = tokenize_source(source).expect("Failed to tokenise complex instruction");
|
|
||||||
|
|
||||||
// Should have: instruction, register, comma, register, comma, immediate, newline, EOF
|
|
||||||
assert!(tokens.len() >= 6);
|
|
||||||
assert!(matches!(tokens[0].token_type, TokenType::Instruction(_)));
|
|
||||||
assert!(matches!(tokens[1].token_type, TokenType::Register(_)));
|
|
||||||
assert!(matches!(tokens[2].token_type, TokenType::Comma));
|
|
||||||
assert!(matches!(tokens[3].token_type, TokenType::Register(_)));
|
|
||||||
assert!(matches!(tokens[4].token_type, TokenType::Comma));
|
|
||||||
assert!(matches!(tokens[5].token_type, TokenType::Immediate(_)));
|
|
||||||
}
|
|
||||||
|
|
||||||
#[test]
|
|
||||||
fn test_multiline_with_comments() {
|
|
||||||
const EXPECTED_TOKEN_TYPES: [TokenType; 11] = [
|
|
||||||
TokenType::Instruction(Opcode::Add),
|
|
||||||
TokenType::Register(RegisterToken::new(Register::Rg0)),
|
|
||||||
TokenType::Comma,
|
|
||||||
TokenType::Register(RegisterToken::new(Register::Rg1)),
|
|
||||||
TokenType::Newline,
|
|
||||||
TokenType::Instruction(Opcode::SubI),
|
|
||||||
TokenType::Register(RegisterToken::new(Register::Rg2)),
|
|
||||||
TokenType::Comma,
|
|
||||||
TokenType::Immediate(10),
|
|
||||||
TokenType::Newline,
|
|
||||||
TokenType::Eof,
|
|
||||||
];
|
|
||||||
|
|
||||||
const SOURCE: &str = r"add rg0, rg1 // Another comment
|
|
||||||
subi rg2, 10";
|
|
||||||
|
|
||||||
let tokens =
|
|
||||||
tokenize_source(SOURCE).expect("Failed to tokenise source with comments");
|
|
||||||
let token_types = extract_token_types(&tokens);
|
|
||||||
|
|
||||||
assert_eq!(
|
|
||||||
token_types.len(),
|
|
||||||
EXPECTED_TOKEN_TYPES.len(),
|
|
||||||
"{token_types:#?}"
|
|
||||||
);
|
|
||||||
|
|
||||||
for (expected, got) in EXPECTED_TOKEN_TYPES.iter().zip(token_types.iter()) {
|
|
||||||
assert!(!(expected != *got), "Expected {expected:?}, got {got:?}");
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
#[test]
|
|
||||||
fn test_tokenise_brainf_interpreter() {
|
|
||||||
const SOURCE: &str = include_str!("../../../../resources/dsa/bf.dsa");
|
|
||||||
|
|
||||||
let tokens =
|
|
||||||
tokenize_source(SOURCE).expect("Failed to tokenise the brainfuck compiler!");
|
|
||||||
|
|
||||||
dbg!(tokens);
|
|
||||||
}
|
|
||||||
|
|
||||||
#[test]
|
|
||||||
fn test_string_literals() {
|
|
||||||
let test_cases = [
|
|
||||||
(r#""hello world""#, "hello world"),
|
|
||||||
(
|
|
||||||
r#""++++++++++++++++++++++++++++++++++++++++++++""#,
|
|
||||||
"++++++++++++++++++++++++++++++++++++++++++++",
|
|
||||||
),
|
|
||||||
(r#""Invalid Instruction!""#, "Invalid Instruction!"),
|
|
||||||
(r#""""#, ""),
|
|
||||||
];
|
|
||||||
|
|
||||||
for (input, expected) in &test_cases {
|
|
||||||
let tokens = tokenize_source(input).expect("Failed to tokenize string literal");
|
|
||||||
|
|
||||||
if let TokenType::String(value) = &tokens[0].token_type {
|
|
||||||
assert_eq!(value, expected);
|
|
||||||
} else {
|
|
||||||
panic!("Expected string token for {input}");
|
|
||||||
}
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
#[test]
|
|
||||||
fn test_data_directives() {
|
|
||||||
let test_cases = [("db", "db"), ("dw", "dw"), ("resb", "resb")];
|
|
||||||
|
|
||||||
for (input, expected) in &test_cases {
|
|
||||||
let tokens = tokenize_source(input).expect("Failed to tokenize data declaration");
|
|
||||||
|
|
||||||
if let TokenType::Directive(decl) = &tokens[0].token_type {
|
|
||||||
assert_eq!(decl.directive, *expected);
|
|
||||||
} else {
|
|
||||||
panic!("Expected data declaration token for {input}");
|
|
||||||
}
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
#[test]
|
|
||||||
fn test_include_directive() {
|
|
||||||
let source = r#"include print "./lib/print.dsa""#;
|
|
||||||
let tokens = tokenize_source(source).expect("Failed to tokenize include directive");
|
|
||||||
|
|
||||||
assert!(tokens.len() >= 3);
|
|
||||||
assert!(matches!(tokens[0].token_type, TokenType::Directive(_)));
|
|
||||||
assert!(matches!(tokens[1].token_type, TokenType::Symbol(_)));
|
|
||||||
assert!(matches!(tokens[2].token_type, TokenType::String(_)));
|
|
||||||
}
|
|
||||||
|
|
||||||
#[test]
|
|
||||||
fn test_hex_addresses() {
|
|
||||||
let test_cases = [("0x10000", 0x10000), ("0x30000", 0x30000)];
|
|
||||||
|
|
||||||
for (input, expected) in &test_cases {
|
|
||||||
let tokens = tokenize_source(input).expect("Failed to tokenize hex address");
|
|
||||||
|
|
||||||
if let TokenType::Immediate(value) = &tokens[0].token_type {
|
|
||||||
assert_eq!(*value, *expected);
|
|
||||||
} else {
|
|
||||||
panic!("Expected immediate token for {input}");
|
|
||||||
}
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
#[test]
|
|
||||||
fn test_memory_operations() {
|
|
||||||
let source = "ldw rg1, rg2";
|
|
||||||
let tokens = tokenize_source(source).expect("Failed to tokenize memory operation");
|
|
||||||
|
|
||||||
assert!(tokens.len() >= 4);
|
|
||||||
assert!(matches!(tokens[0].token_type, TokenType::Instruction(_)));
|
|
||||||
assert!(matches!(tokens[1].token_type, TokenType::Register(_)));
|
|
||||||
assert!(matches!(tokens[2].token_type, TokenType::Comma));
|
|
||||||
assert!(matches!(tokens[3].token_type, TokenType::Register(_)));
|
|
||||||
}
|
|
||||||
|
|
||||||
#[test]
|
|
||||||
fn test_function_calls() {
|
|
||||||
let source = "call print::print";
|
|
||||||
let tokens = tokenize_source(source).expect("Failed to tokenize function call");
|
|
||||||
|
|
||||||
assert!(tokens.len() >= 2);
|
|
||||||
assert!(matches!(tokens[0].token_type, TokenType::Instruction(_)));
|
|
||||||
// The symbol might be parsed differently depending on how :: is handled
|
|
||||||
// This test checks basic structure
|
|
||||||
assert!(
|
|
||||||
tokens
|
|
||||||
.iter()
|
|
||||||
.any(|t| matches!(t.token_type, TokenType::Symbol(_)))
|
|
||||||
);
|
|
||||||
}
|
|
||||||
|
|
||||||
#[test]
|
|
||||||
fn test_comments_are_ignored() {
|
|
||||||
let source = "add rg0, rg1 // this is a comment\nsub rg2, rg3";
|
|
||||||
let tokens = tokenize_source(source).expect("Failed to tokenize with comments");
|
|
||||||
|
|
||||||
// Comments should be stripped, so we should only have instruction tokens
|
|
||||||
let instruction_count = tokens
|
|
||||||
.iter()
|
|
||||||
.filter(|t| matches!(t.token_type, TokenType::Instruction(_)))
|
|
||||||
.count();
|
|
||||||
|
|
||||||
assert_eq!(instruction_count, 2);
|
|
||||||
}
|
|
||||||
|
|
||||||
#[test]
|
|
||||||
fn test_newline_always_present() {
|
|
||||||
// Test that even without explicit newline at end, one is added
|
|
||||||
let source = "add rg0, rg1"; // No newline at end
|
|
||||||
let tokens = tokenize_source(source).expect("Failed to tokenize without newline");
|
|
||||||
|
|
||||||
// Should have newline before EOF
|
|
||||||
let has_newline = tokens
|
|
||||||
.iter()
|
|
||||||
.any(|t| matches!(t.token_type, TokenType::Newline));
|
|
||||||
|
|
||||||
assert!(
|
|
||||||
has_newline,
|
|
||||||
"Expected newline to be added even when missing from input"
|
|
||||||
);
|
|
||||||
|
|
||||||
// EOF should be last.
|
|
||||||
assert!(matches!(
|
|
||||||
tokens
|
|
||||||
.last()
|
|
||||||
.expect("Expected at least one token")
|
|
||||||
.token_type,
|
|
||||||
TokenType::Eof
|
|
||||||
));
|
|
||||||
}
|
|
||||||
|
|
||||||
#[test]
|
|
||||||
fn test_complex_branching_code() {
|
|
||||||
let source = r"
|
|
||||||
cmp rg3, rg8
|
|
||||||
jeq increment
|
|
||||||
cmp rg3, rg9
|
|
||||||
jeq decrement";
|
|
||||||
|
|
||||||
let tokens = tokenize_source(source).expect("Failed to tokenize branching code");
|
|
||||||
|
|
||||||
let instruction_count = tokens
|
|
||||||
.iter()
|
|
||||||
.filter(|t| matches!(t.token_type, TokenType::Instruction(_)))
|
|
||||||
.count();
|
|
||||||
|
|
||||||
assert_eq!(instruction_count, 4);
|
|
||||||
|
|
||||||
let symbol_count = tokens
|
|
||||||
.iter()
|
|
||||||
.filter(|t| matches!(t.token_type, TokenType::Symbol(_)))
|
|
||||||
.count();
|
|
||||||
|
|
||||||
assert_eq!(symbol_count, 2); // increment and decrement labels
|
|
||||||
}
|
|
||||||
|
|
||||||
#[test]
|
|
||||||
fn test_stack_operations() {
|
|
||||||
let source = "push rg2\npop zero\npusha 2\npopa 2";
|
|
||||||
let tokens = tokenize_source(source).expect("Failed to tokenize stack operations");
|
|
||||||
|
|
||||||
let instruction_count = tokens
|
|
||||||
.iter()
|
|
||||||
.filter(|t| matches!(t.token_type, TokenType::Instruction(_)))
|
|
||||||
.count();
|
|
||||||
|
|
||||||
assert_eq!(instruction_count, 4);
|
|
||||||
}
|
|
||||||
@@ -1,122 +0,0 @@
|
|||||||
//! This module contains the code for the Symbol Table, which can be written into object
|
|
||||||
//! files to support deferred relocations when using ELF files.
|
|
||||||
//!
|
|
||||||
//! It is also required for detection of duplicate symbols, and resolution in the flat
|
|
||||||
//! binary output type.
|
|
||||||
|
|
||||||
use crate::{
|
|
||||||
error::AssembleError,
|
|
||||||
model::{
|
|
||||||
module::ModuleId,
|
|
||||||
symbol::{Symbol, SymbolId, Visibility},
|
|
||||||
},
|
|
||||||
};
|
|
||||||
use std::collections::HashMap;
|
|
||||||
|
|
||||||
/// Global symbol table - single source of truth for all symbols.
|
|
||||||
/// Much simpler than per-module tables.
|
|
||||||
#[derive(Debug)]
|
|
||||||
pub struct SymbolTable {
|
|
||||||
/// All symbols by their ID - O(1) lookup
|
|
||||||
symbols: HashMap<SymbolId, Symbol>,
|
|
||||||
/// Name to ID mapping for human-readable lookups - O(1) lookup
|
|
||||||
name_to_id: HashMap<String, SymbolId>,
|
|
||||||
/// Module to symbols mapping for module-specific queries
|
|
||||||
module_symbols: HashMap<ModuleId, Vec<SymbolId>>,
|
|
||||||
}
|
|
||||||
|
|
||||||
impl SymbolTable {
|
|
||||||
#[must_use]
|
|
||||||
pub fn new() -> Self {
|
|
||||||
Self {
|
|
||||||
symbols: HashMap::new(),
|
|
||||||
name_to_id: HashMap::new(),
|
|
||||||
module_symbols: HashMap::new(),
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
/// Adds a symbol to the global table
|
|
||||||
pub fn add_symbol(&mut self, symbol: Symbol) -> Result<SymbolId, AssembleError> {
|
|
||||||
let id = symbol.id;
|
|
||||||
let module_id = symbol.module_id;
|
|
||||||
let name = symbol.name.clone();
|
|
||||||
|
|
||||||
// Check for duplicate names in the same module
|
|
||||||
if let Some(&existing_id) = self.name_to_id.get(&name)
|
|
||||||
&& let Some(existing) = self.symbols.get(&existing_id)
|
|
||||||
&& existing.module_id == module_id
|
|
||||||
{
|
|
||||||
return Err(std::io::Error::new(
|
|
||||||
std::io::ErrorKind::AlreadyExists,
|
|
||||||
format!("Symbol '{name}' already defined in module"),
|
|
||||||
)
|
|
||||||
.into());
|
|
||||||
}
|
|
||||||
|
|
||||||
// Add to all mappings
|
|
||||||
self.name_to_id.insert(name, id);
|
|
||||||
self.symbols.insert(id, symbol);
|
|
||||||
self.module_symbols.entry(module_id).or_default().push(id);
|
|
||||||
|
|
||||||
Ok(id)
|
|
||||||
}
|
|
||||||
|
|
||||||
/// Gets the [`Symbol`] by its [`SymbolId`].
|
|
||||||
#[must_use]
|
|
||||||
pub fn get(&self, id: &SymbolId) -> Option<&Symbol> {
|
|
||||||
self.symbols.get(id)
|
|
||||||
}
|
|
||||||
|
|
||||||
/// Gets the [`Symbol`] by its name.
|
|
||||||
#[must_use]
|
|
||||||
pub fn get_by_name(&self, name: &str) -> Option<&Symbol> {
|
|
||||||
self.name_to_id
|
|
||||||
.get(name)
|
|
||||||
.and_then(|id| self.symbols.get(id))
|
|
||||||
}
|
|
||||||
|
|
||||||
/// Gets all [`Symbol`]s in a module.
|
|
||||||
#[must_use]
|
|
||||||
pub fn get_module_symbols(&self, module_id: &ModuleId) -> Vec<&Symbol> {
|
|
||||||
self.module_symbols
|
|
||||||
.get(module_id)
|
|
||||||
.map(|ids| ids.iter().filter_map(|id| self.symbols.get(id)).collect())
|
|
||||||
.unwrap_or_default()
|
|
||||||
}
|
|
||||||
|
|
||||||
/// Gets all the public symbols.
|
|
||||||
#[must_use]
|
|
||||||
pub fn get_public_symbols(&self) -> Vec<&Symbol> {
|
|
||||||
self.symbols
|
|
||||||
.values()
|
|
||||||
.filter(|sym| matches!(sym.visibility, Visibility::Public))
|
|
||||||
.collect()
|
|
||||||
}
|
|
||||||
|
|
||||||
/// Updates symbol address (during resolution). Used for flat binaries or symbols with
|
|
||||||
/// no relocations.
|
|
||||||
pub fn update_symbol_address(
|
|
||||||
&mut self,
|
|
||||||
id: &SymbolId,
|
|
||||||
address: u32,
|
|
||||||
) -> Result<(), AssembleError> {
|
|
||||||
if let Some(symbol) = self.symbols.get_mut(id) {
|
|
||||||
symbol.address = Some(address);
|
|
||||||
if symbol.dependencies.is_empty() {
|
|
||||||
symbol.needs_relocation = false;
|
|
||||||
}
|
|
||||||
Ok(())
|
|
||||||
} else {
|
|
||||||
Err(
|
|
||||||
std::io::Error::new(std::io::ErrorKind::NotFound, "Symbol not found")
|
|
||||||
.into(),
|
|
||||||
)
|
|
||||||
}
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
impl Default for SymbolTable {
|
|
||||||
fn default() -> Self {
|
|
||||||
Self::new()
|
|
||||||
}
|
|
||||||
}
|
|
||||||
@@ -2,7 +2,6 @@
|
|||||||
#![allow(unused)]
|
#![allow(unused)]
|
||||||
use std::{fmt, sync::mpsc::Sender};
|
use std::{fmt, sync::mpsc::Sender};
|
||||||
|
|
||||||
#[derive(Debug, PartialEq, Eq)]
|
|
||||||
pub struct Logger {}
|
pub struct Logger {}
|
||||||
|
|
||||||
impl Logger {
|
impl Logger {
|
||||||
|
|||||||
@@ -2,7 +2,7 @@ pub mod logging;
|
|||||||
|
|
||||||
use std::io::Write;
|
use std::io::Write;
|
||||||
|
|
||||||
pub fn _input(prompt: &str) -> String {
|
pub fn input(prompt: &str) -> String {
|
||||||
print!("{prompt}\n > ");
|
print!("{prompt}\n > ");
|
||||||
std::io::stdout().flush().expect("Failed to flush stdout");
|
std::io::stdout().flush().expect("Failed to flush stdout");
|
||||||
let mut input = String::new();
|
let mut input = String::new();
|
||||||
|
|||||||
@@ -0,0 +1 @@
|
|||||||
|
disallowed-types = ["std::collections::HashMap", "std::collections::HashSet"]
|
||||||
@@ -5,4 +5,3 @@ edition.workspace = true
|
|||||||
authors.workspace = true
|
authors.workspace = true
|
||||||
|
|
||||||
[dependencies]
|
[dependencies]
|
||||||
object = { version = "0.37.1", default-features = false, features = ["elf", "std", "read", "read_core", "write_std", "write", "alloc", "build"] }
|
|
||||||
|
|||||||
@@ -1,3 +0,0 @@
|
|||||||
# Common types and methods for the DSA
|
|
||||||
|
|
||||||
This library contains the instruction set, encoding and decoding routines, and ELF encoding and loading routines (WIP).
|
|
||||||
@@ -1,8 +0,0 @@
|
|||||||
//! ELF file creation and parsing routines.
|
|
||||||
|
|
||||||
use object::{Endianness, build::elf::Builder};
|
|
||||||
|
|
||||||
#[allow(clippy::missing_const_for_fn)]
|
|
||||||
pub fn write() {
|
|
||||||
let _builder = Builder::new(Endianness::Little, false);
|
|
||||||
}
|
|
||||||
@@ -1,17 +1,18 @@
|
|||||||
use crate::{instructions::encode::Encode, prelude::*};
|
use crate::{instructions::encode::Encode, prelude::*};
|
||||||
|
|
||||||
#[derive(Copy, Clone, Debug, PartialEq, Eq, Default)]
|
#[derive(Copy, Clone, Debug, PartialEq, Eq)]
|
||||||
pub enum Interrupt {
|
pub enum Interrupt {
|
||||||
Software(u8),
|
Software(u8),
|
||||||
Breakpoint,
|
Breakpoint,
|
||||||
#[default]
|
|
||||||
HardFault,
|
HardFault,
|
||||||
}
|
}
|
||||||
|
|
||||||
pub type Address = u32;
|
pub type Address = u32;
|
||||||
|
|
||||||
impl Interrupt {
|
impl Interrupt {
|
||||||
const fn as_u8(self) -> u8 {
|
// someone tell clippy to stfu.
|
||||||
|
#[allow(clippy::must_use_candidate)]
|
||||||
|
pub const fn as_u8(self) -> u8 {
|
||||||
match self {
|
match self {
|
||||||
Self::Breakpoint => 0,
|
Self::Breakpoint => 0,
|
||||||
Self::HardFault => 1,
|
Self::HardFault => 1,
|
||||||
@@ -39,7 +40,7 @@ pub enum InstructionType {
|
|||||||
Immediate,
|
Immediate,
|
||||||
}
|
}
|
||||||
|
|
||||||
#[derive(Copy, Clone, Debug, PartialEq, Eq, Hash)]
|
#[derive(Copy, Clone, Debug, PartialEq, Eq)]
|
||||||
#[non_exhaustive]
|
#[non_exhaustive]
|
||||||
pub enum Register {
|
pub enum Register {
|
||||||
// general purpose registers
|
// general purpose registers
|
||||||
|
|||||||
@@ -1,5 +1,4 @@
|
|||||||
//! Various types of arguments that instructions can take, alongside encoding and decoding
|
//! Various types of arguments that instructions can take, alongside encoding and decoding logic.
|
||||||
//! logic.
|
|
||||||
|
|
||||||
use crate::{
|
use crate::{
|
||||||
instructions::{RegisterParseError, encode::Encode},
|
instructions::{RegisterParseError, encode::Encode},
|
||||||
@@ -36,20 +35,18 @@ impl std::fmt::Display for ArgsDecodeError {
|
|||||||
|
|
||||||
impl std::error::Error for ArgsDecodeError {}
|
impl std::error::Error for ArgsDecodeError {}
|
||||||
|
|
||||||
#[derive(Debug, Clone, Copy, PartialEq, Eq, Default)]
|
#[derive(Debug, Clone, Copy, PartialEq, Eq)]
|
||||||
/// Used by instructions with 2 registers and an immediate argument.
|
/// Used by instructions with 2 registers and an immediate argument.
|
||||||
pub struct ITypeArgs {
|
pub struct ITypeArgs {
|
||||||
pub immediate: u16,
|
pub immediate: u16,
|
||||||
pub r1: Register,
|
pub r1: Register,
|
||||||
/// May not actually be used by some instructions taking an immediate e.g. LUI. This
|
/// May not actually be used by some instructions taking an immediate e.g. LUI. This is solved by making the constructor take Options.
|
||||||
/// is solved by making the constructor take Options.
|
|
||||||
pub r2: Register,
|
pub r2: Register,
|
||||||
}
|
}
|
||||||
|
|
||||||
impl ITypeArgs {
|
impl ITypeArgs {
|
||||||
#[must_use]
|
#[must_use]
|
||||||
/// Creates a new [`ITypeArgs`]. If r1 or r2 is unset, they will be replaced with
|
/// Creates a new [`ITypeArgs`]. If r1 or r2 is unset, they will be replaced with [`Register::NoReg`].
|
||||||
/// [`Register::NoReg`].
|
|
||||||
pub fn new(immediate: u16, r1: Option<Register>, r2: Option<Register>) -> Self {
|
pub fn new(immediate: u16, r1: Option<Register>, r2: Option<Register>) -> Self {
|
||||||
let r1 = r1.unwrap_or_default();
|
let r1 = r1.unwrap_or_default();
|
||||||
let r2 = r2.unwrap_or_default();
|
let r2 = r2.unwrap_or_default();
|
||||||
@@ -59,8 +56,8 @@ impl ITypeArgs {
|
|||||||
}
|
}
|
||||||
|
|
||||||
impl Encode for ITypeArgs {
|
impl Encode for ITypeArgs {
|
||||||
/// Encodes an I-type instruction from its fields. These must have some unused
|
/// Encodes an I-type instruction from its fields. These must have some unused high-order
|
||||||
/// high-order bits set to 0 else the bit shifting logic gets fucked.
|
/// bits set to 0 else the bit shifting logic gets fucked.
|
||||||
fn encode(self, opcode: u8) -> u32 {
|
fn encode(self, opcode: u8) -> u32 {
|
||||||
let opcode = u32::from(opcode);
|
let opcode = u32::from(opcode);
|
||||||
let r1 = self.r1 as u32;
|
let r1 = self.r1 as u32;
|
||||||
@@ -87,7 +84,7 @@ impl TryFrom<u32> for ITypeArgs {
|
|||||||
}
|
}
|
||||||
|
|
||||||
/// Used by instructions not using immediates (besides 5 bit shift values).
|
/// Used by instructions not using immediates (besides 5 bit shift values).
|
||||||
#[derive(Debug, Clone, Copy, PartialEq, Eq, Default)]
|
#[derive(Debug, Clone, Copy, PartialEq, Eq)]
|
||||||
pub struct RTypeArgs {
|
pub struct RTypeArgs {
|
||||||
pub sr1: Register,
|
pub sr1: Register,
|
||||||
pub sr2: Register,
|
pub sr2: Register,
|
||||||
@@ -98,8 +95,7 @@ pub struct RTypeArgs {
|
|||||||
|
|
||||||
impl RTypeArgs {
|
impl RTypeArgs {
|
||||||
#[must_use]
|
#[must_use]
|
||||||
/// Creates a new [`RTypeArgs`]. If any registers are unset, they will be replaced
|
/// Creates a new [`RTypeArgs`]. If any registers are unset, they will be replaced with [`Register::NoReg`]. If `shamt` is unset, it will be set to 0.
|
||||||
/// with [`Register::NoReg`]. If `shamt` is unset, it will be set to 0.
|
|
||||||
pub fn new(
|
pub fn new(
|
||||||
sr1: Option<Register>,
|
sr1: Option<Register>,
|
||||||
sr2: Option<Register>,
|
sr2: Option<Register>,
|
||||||
@@ -126,8 +122,7 @@ impl Encode for RTypeArgs {
|
|||||||
///
|
///
|
||||||
/// # Arguments
|
/// # Arguments
|
||||||
///
|
///
|
||||||
/// - `shamt`: The amount to shift value (used only in shift instructions, otherwise
|
/// - `shamt`: The amount to shift value (used only in shift instructions, otherwise 0).
|
||||||
/// 0).
|
|
||||||
fn encode(self, opcode: u8) -> u32 {
|
fn encode(self, opcode: u8) -> u32 {
|
||||||
let opcode = u32::from(opcode);
|
let opcode = u32::from(opcode);
|
||||||
let sr1 = self.sr1 as u32;
|
let sr1 = self.sr1 as u32;
|
||||||
|
|||||||
@@ -54,12 +54,14 @@ impl Encode for Instruction {
|
|||||||
],
|
],
|
||||||
no_args: [Nop, IntReturn, Halt],
|
no_args: [Nop, IntReturn, Halt],
|
||||||
special: [
|
special: [
|
||||||
Self::Interrupt(_) => todo!(),
|
|
||||||
Self::Data(data) => data,
|
Self::Data(data) => data,
|
||||||
|
Self::Interrupt(interrupt) => {
|
||||||
|
let opcode = u32::from(self.opcode());
|
||||||
|
(opcode << 26) | u32::from(interrupt.as_u8())
|
||||||
|
},
|
||||||
Self::Segment(segment) => {
|
Self::Segment(segment) => {
|
||||||
let opcode = u32::from(self.opcode());
|
let opcode = u32::from(self.opcode());
|
||||||
let segment = segment as u8;
|
(opcode << 26) | u32::from(segment as u8)
|
||||||
(opcode << 26) | u32::from(segment)
|
|
||||||
}
|
}
|
||||||
]
|
]
|
||||||
)
|
)
|
||||||
|
|||||||
@@ -39,9 +39,7 @@ impl std::fmt::Display for InstructionDecodeError {
|
|||||||
fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
|
fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
|
||||||
match self {
|
match self {
|
||||||
Self::InvalidOpcode(code) => write!(f, "invalid opcode, got {code:x}")?,
|
Self::InvalidOpcode(code) => write!(f, "invalid opcode, got {code:x}")?,
|
||||||
Self::InvalidArgument(err) => {
|
Self::InvalidArgument(err) => write!(f, "invalid arguments, got an error {err}")?,
|
||||||
write!(f, "invalid arguments, got an error {err}")?;
|
|
||||||
}
|
|
||||||
}
|
}
|
||||||
|
|
||||||
Ok(())
|
Ok(())
|
||||||
|
|||||||
@@ -12,7 +12,6 @@
|
|||||||
clippy::match_wildcard_for_single_variants
|
clippy::match_wildcard_for_single_variants
|
||||||
)]
|
)]
|
||||||
|
|
||||||
pub mod elf;
|
|
||||||
pub mod instructions;
|
pub mod instructions;
|
||||||
|
|
||||||
pub mod prelude {
|
pub mod prelude {
|
||||||
|
|||||||
@@ -160,12 +160,11 @@ impl CodeEditor {
|
|||||||
|
|
||||||
/// Stick to bottom
|
/// Stick to bottom
|
||||||
/// The scroll handle will stick to the bottom position even while the content size
|
/// The scroll handle will stick to the bottom position even while the content size
|
||||||
/// changes dynamically. This can be useful to simulate terminal UIs or log/info
|
/// changes dynamically. This can be useful to simulate terminal UIs or log/info scrollers.
|
||||||
/// scrollers. The scroll handle remains stuck until user manually changes
|
/// The scroll handle remains stuck until user manually changes position. Once "unstuck"
|
||||||
/// position. Once "unstuck" it will remain focused on whatever content viewport
|
/// it will remain focused on whatever content viewport the user left it on. If the scroll
|
||||||
/// the user left it on. If the scroll handle is dragged to the bottom it will
|
/// handle is dragged to the bottom it will again become stuck and remain there until manually
|
||||||
/// again become stuck and remain there until manually pulled from the end
|
/// pulled from the end position.
|
||||||
/// position.
|
|
||||||
///
|
///
|
||||||
/// **Default: false**
|
/// **Default: false**
|
||||||
pub fn stick_to_bottom(self, stick_to_bottom: bool) -> Self {
|
pub fn stick_to_bottom(self, stick_to_bottom: bool) -> Self {
|
||||||
|
|||||||
+2
-1
@@ -19,10 +19,11 @@ assembler = { path = "../assembler" }
|
|||||||
dsa_editor = { path = "../dsa_editor" }
|
dsa_editor = { path = "../dsa_editor" }
|
||||||
egui = "0.31.1"
|
egui = "0.31.1"
|
||||||
dirs = "6.0.0"
|
dirs = "6.0.0"
|
||||||
discord-presence = { version = "1.6.0", optional = true }
|
discord-presence = { version = "2.0.0", optional = true }
|
||||||
toml = { version = "0.8.23", optional = true }
|
toml = { version = "0.8.23", optional = true }
|
||||||
serde = { version = "1.0.219", features = ["derive"], optional = true }
|
serde = { version = "1.0.219", features = ["derive"], optional = true }
|
||||||
egui_file = "0.22.1"
|
egui_file = "0.22.1"
|
||||||
|
rustc-hash = "2.1.1"
|
||||||
|
|
||||||
[features]
|
[features]
|
||||||
default = ["config"]
|
default = ["config"]
|
||||||
|
|||||||
@@ -180,10 +180,10 @@ impl Drop for RpcClient {
|
|||||||
fn drop(&mut self) {
|
fn drop(&mut self) {
|
||||||
self.stop();
|
self.stop();
|
||||||
|
|
||||||
if let Some(handle) = self.thread_handle.take()
|
if let Some(handle) = self.thread_handle.take() {
|
||||||
&& let Some(handle) = Arc::into_inner(handle)
|
if let Some(handle) = Arc::into_inner(handle) {
|
||||||
{
|
let _ = handle.join();
|
||||||
let _ = handle.join();
|
}
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|||||||
@@ -25,7 +25,7 @@ pub fn run_emulator(
|
|||||||
let mut running = Running::Paused;
|
let mut running = Running::Paused;
|
||||||
let mut step = 0;
|
let mut step = 0;
|
||||||
let mut addr;
|
let mut addr;
|
||||||
let mut history = Vec::<(u32, Instruction)>::new();
|
let mut history = Vec::<(u32, Instruction)>::with_capacity(32768);
|
||||||
let size = 256;
|
let size = 256;
|
||||||
|
|
||||||
state_tx
|
state_tx
|
||||||
@@ -36,7 +36,9 @@ pub fn run_emulator(
|
|||||||
let mut update = false;
|
let mut update = false;
|
||||||
|
|
||||||
loop {
|
loop {
|
||||||
let cmd = if running == Running::Running || step > 0 {
|
let cmd = if step > 0 {
|
||||||
|
None
|
||||||
|
} else if running == Running::Running && step == 0 {
|
||||||
match cmd_rx.try_recv() {
|
match cmd_rx.try_recv() {
|
||||||
Ok(cmd) => Some(cmd),
|
Ok(cmd) => Some(cmd),
|
||||||
Err(mpsc::TryRecvError::Empty) => {
|
Err(mpsc::TryRecvError::Empty) => {
|
||||||
@@ -52,10 +54,15 @@ pub fn run_emulator(
|
|||||||
}
|
}
|
||||||
};
|
};
|
||||||
|
|
||||||
|
if running == Running::Running && step == 0 {
|
||||||
|
step = 32768;
|
||||||
|
}
|
||||||
|
|
||||||
if let Some(cmd) = cmd {
|
if let Some(cmd) = cmd {
|
||||||
match cmd {
|
match cmd {
|
||||||
Command::Start => {
|
Command::Start => {
|
||||||
running = Running::Running;
|
running = Running::Running;
|
||||||
|
step = 32768;
|
||||||
|
|
||||||
// Update RPC with current state. TODO: Make this only occur on state
|
// Update RPC with current state. TODO: Make this only occur on state
|
||||||
// changes.
|
// changes.
|
||||||
@@ -71,9 +78,11 @@ pub fn run_emulator(
|
|||||||
}
|
}
|
||||||
Command::Stop => {
|
Command::Stop => {
|
||||||
running = Running::Paused;
|
running = Running::Paused;
|
||||||
|
step = 0;
|
||||||
}
|
}
|
||||||
Command::Reset(x) => {
|
Command::Reset(x) => {
|
||||||
running = Running::Paused;
|
running = Running::Paused;
|
||||||
|
step = 0;
|
||||||
|
|
||||||
match x {
|
match x {
|
||||||
0 => {
|
0 => {
|
||||||
@@ -95,22 +104,13 @@ pub fn run_emulator(
|
|||||||
}
|
}
|
||||||
Command::Step(x) => {
|
Command::Step(x) => {
|
||||||
step = x;
|
step = x;
|
||||||
|
running = Running::Paused;
|
||||||
}
|
}
|
||||||
Command::Write(offset, data) => {
|
Command::Write(offset, data) => {
|
||||||
update = true;
|
update = true;
|
||||||
|
|
||||||
processor
|
processor.memory.write_range(offset, data);
|
||||||
.memory
|
|
||||||
.write_range(offset, data)
|
|
||||||
.unwrap_or_else(|_| {
|
|
||||||
report_err(
|
|
||||||
state_tx,
|
|
||||||
"Failed to write memory range!",
|
|
||||||
&mut processor,
|
|
||||||
);
|
|
||||||
});
|
|
||||||
}
|
}
|
||||||
#[expect(unused_assignments)]
|
|
||||||
Command::Interrupt(_interrupt) => {
|
Command::Interrupt(_interrupt) => {
|
||||||
update = true;
|
update = true;
|
||||||
|
|
||||||
@@ -119,14 +119,7 @@ pub fn run_emulator(
|
|||||||
Command::MemRequest(new, size) if update => {
|
Command::MemRequest(new, size) if update => {
|
||||||
addr = new;
|
addr = new;
|
||||||
let _ = state_tx.send(StateUpdate::MemoryView(
|
let _ = state_tx.send(StateUpdate::MemoryView(
|
||||||
processor.memory.read_range(addr, size).unwrap_or_else(|_| {
|
processor.memory.read_range(addr, size),
|
||||||
report_err(
|
|
||||||
state_tx,
|
|
||||||
"Failed to read memory range!",
|
|
||||||
&mut processor,
|
|
||||||
);
|
|
||||||
Vec::new()
|
|
||||||
}),
|
|
||||||
));
|
));
|
||||||
}
|
}
|
||||||
Command::DisplayRequest if update => {
|
Command::DisplayRequest if update => {
|
||||||
@@ -164,26 +157,16 @@ pub fn run_emulator(
|
|||||||
let _ = state_tx.send(StateUpdate::Instructions(instruction_count));
|
let _ = state_tx.send(StateUpdate::Instructions(instruction_count));
|
||||||
}
|
}
|
||||||
Command::WriteBlock(addr, block) => {
|
Command::WriteBlock(addr, block) => {
|
||||||
processor
|
processor.memory.write_range(addr, block.to_vec());
|
||||||
.memory
|
|
||||||
.write_range(addr, block.to_vec())
|
|
||||||
.unwrap_or_else(|_| {
|
|
||||||
report_err(
|
|
||||||
state_tx,
|
|
||||||
"Failed to write memory block!",
|
|
||||||
&mut processor,
|
|
||||||
);
|
|
||||||
});
|
|
||||||
}
|
}
|
||||||
|
|
||||||
_ => {}
|
_ => {}
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
if step > 0 {
|
if running == Running::Paused && step > 0 {
|
||||||
step -= 1;
|
step -= 1;
|
||||||
update = true;
|
update = true;
|
||||||
running = Running::Paused;
|
|
||||||
|
|
||||||
// Execute one cycle.
|
// Execute one cycle.
|
||||||
match processor.cycle() {
|
match processor.cycle() {
|
||||||
@@ -191,7 +174,9 @@ pub fn run_emulator(
|
|||||||
history.push((addr, instruction));
|
history.push((addr, instruction));
|
||||||
}
|
}
|
||||||
Err(why) => {
|
Err(why) => {
|
||||||
let pcx = processor.get(Register::Pcx);
|
let pcx = processor
|
||||||
|
.get(Register::Pcx)
|
||||||
|
.expect("SPR should never be invalid");
|
||||||
report_err(
|
report_err(
|
||||||
state_tx,
|
state_tx,
|
||||||
&format!(
|
&format!(
|
||||||
@@ -206,21 +191,31 @@ pub fn run_emulator(
|
|||||||
}
|
}
|
||||||
|
|
||||||
if running == Running::Running {
|
if running == Running::Running {
|
||||||
|
step -= 1;
|
||||||
update = true;
|
update = true;
|
||||||
|
|
||||||
// Execute one cycle.
|
// Execute one cycle.
|
||||||
let instruction = match processor.cycle() {
|
let instruction = match processor.cycle() {
|
||||||
Ok(instruction) => instruction,
|
Ok(instruction) => instruction,
|
||||||
Err(why) => {
|
Err(why) => {
|
||||||
let pcx = processor.get(Register::Pcx);
|
let pcx = processor
|
||||||
eprintln!("Could not decode instruction at {pcx:x}. Reason: {why}");
|
.get(Register::Pcx)
|
||||||
continue;
|
.expect("PCX should never be invalid");
|
||||||
|
report_err(
|
||||||
|
state_tx,
|
||||||
|
&format!(
|
||||||
|
"Could not decode instruction at {pcx:x}. Reason: {why}"
|
||||||
|
),
|
||||||
|
&mut processor,
|
||||||
|
);
|
||||||
|
(pcx, Instruction::Nop)
|
||||||
}
|
}
|
||||||
};
|
};
|
||||||
|
|
||||||
history.push(instruction);
|
history.push(instruction);
|
||||||
if matches!(instruction.1, Instruction::Halt) {
|
if matches!(instruction.1, Instruction::Halt) {
|
||||||
running = Running::Halted;
|
running = Running::Halted;
|
||||||
|
step = 0;
|
||||||
}
|
}
|
||||||
|
|
||||||
instruction_count += 1;
|
instruction_count += 1;
|
||||||
@@ -229,6 +224,8 @@ pub fn run_emulator(
|
|||||||
}
|
}
|
||||||
|
|
||||||
fn report_err(state_tx: &Sender<StateUpdate>, why: &str, processor: &mut Processor) {
|
fn report_err(state_tx: &Sender<StateUpdate>, why: &str, processor: &mut Processor) {
|
||||||
processor.begin_interrupt(Interrupt::HardFault);
|
processor
|
||||||
|
.begin_interrupt(Interrupt::HardFault)
|
||||||
|
.expect("What kind of goofy ahh shenanigans did you do with your fault handler? At this point, the emulator can just crash. this is on you.");
|
||||||
let _ = state_tx.send(StateUpdate::Error(why.to_string()));
|
let _ = state_tx.send(StateUpdate::Error(why.to_string()));
|
||||||
}
|
}
|
||||||
|
|||||||
@@ -1,53 +1,51 @@
|
|||||||
use std::collections::HashMap;
|
use rustc_hash::FxHashMap;
|
||||||
|
|
||||||
use crate::emulator::system::model::ProcessorError;
|
use crate::emulator::system::model::ProcessorError;
|
||||||
|
|
||||||
pub trait MemoryUnit: Send + Sync {
|
pub trait MemoryUnit: Send + Sync {
|
||||||
fn reset(&mut self);
|
fn reset(&mut self);
|
||||||
fn read_byte(&mut self, addr: u32) -> Result<u8, ProcessorError>;
|
fn read_byte(&mut self, addr: u32) -> u8;
|
||||||
fn write_byte(&mut self, addr: u32, value: u8) -> Result<(), ProcessorError>;
|
fn write_byte(&mut self, addr: u32, value: u8);
|
||||||
fn read_word(&mut self, addr: u32) -> Result<u32, ProcessorError>;
|
fn read_word(&mut self, addr: u32) -> Result<u32, ProcessorError>;
|
||||||
fn write_word(&mut self, addr: u32, value: u32) -> Result<(), ProcessorError>;
|
fn write_word(&mut self, addr: u32, value: u32) -> Result<(), ProcessorError>;
|
||||||
|
|
||||||
fn read_range(&mut self, addr: u32, size: u32) -> Result<Vec<u8>, ProcessorError> {
|
fn read_range(&mut self, addr: u32, size: u32) -> Vec<u8> {
|
||||||
let mut data = Vec::with_capacity(size as usize);
|
let mut data = Vec::with_capacity(size as usize);
|
||||||
for i in 0..size {
|
for i in 0..size {
|
||||||
data.push(self.read_byte(addr + i)?);
|
data.push(self.read_byte(addr + i));
|
||||||
}
|
}
|
||||||
Ok(data)
|
data
|
||||||
}
|
}
|
||||||
|
|
||||||
fn write_range(&mut self, addr: u32, value: Vec<u8>) -> Result<(), ProcessorError> {
|
fn write_range(&mut self, addr: u32, value: Vec<u8>) {
|
||||||
for (i, byte) in value.into_iter().enumerate() {
|
for (i, byte) in value.into_iter().enumerate() {
|
||||||
self.write_byte(addr + i as u32, byte)?;
|
self.write_byte(addr + i as u32, byte);
|
||||||
}
|
}
|
||||||
Ok(())
|
|
||||||
}
|
}
|
||||||
|
|
||||||
fn read_block(&mut self, addr: u32) -> Result<[u8; 256], ProcessorError> {
|
fn read_block(&mut self, addr: u32) -> &[u8; 256];
|
||||||
let mut data = [0; 256];
|
|
||||||
for (i, byte) in data.iter_mut().enumerate() {
|
|
||||||
*byte = self.read_byte(addr + i as u32)?;
|
|
||||||
}
|
|
||||||
Ok(data)
|
|
||||||
}
|
|
||||||
|
|
||||||
fn write_block(&mut self, addr: u32, data: [u8; 256]) -> Result<(), ProcessorError> {
|
fn write_block(&mut self, addr: u32, data: &[u8; 256]) {
|
||||||
for (i, byte) in data.iter().enumerate() {
|
for (i, byte) in data.iter().enumerate() {
|
||||||
self.write_byte(addr + i as u32, *byte)?;
|
self.write_byte(addr + i as u32, *byte);
|
||||||
}
|
}
|
||||||
Ok(())
|
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
pub struct MainStore {
|
pub struct MainStore {
|
||||||
pub data: HashMap<u32, Block>,
|
pub data: FxHashMap<u32, Block>,
|
||||||
}
|
}
|
||||||
|
|
||||||
pub struct Block {
|
pub struct Block {
|
||||||
data: [u8; 256],
|
data: [u8; 256],
|
||||||
}
|
}
|
||||||
|
|
||||||
|
impl Default for Block {
|
||||||
|
fn default() -> Self {
|
||||||
|
Self { data: [0; 256] }
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
impl Default for MainStore {
|
impl Default for MainStore {
|
||||||
fn default() -> Self {
|
fn default() -> Self {
|
||||||
Self::new()
|
Self::new()
|
||||||
@@ -58,79 +56,73 @@ impl MainStore {
|
|||||||
#[must_use]
|
#[must_use]
|
||||||
pub fn new() -> Self {
|
pub fn new() -> Self {
|
||||||
Self {
|
Self {
|
||||||
data: HashMap::new(),
|
data: FxHashMap::default(),
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
|
#[inline]
|
||||||
const fn segment_addr(addr: u32) -> (u32, u8) {
|
const fn segment_addr(addr: u32) -> (u32, u8) {
|
||||||
(addr / 256, (addr % 256) as u8)
|
(addr / 256, (addr % 256) as u8)
|
||||||
}
|
}
|
||||||
|
|
||||||
|
#[inline]
|
||||||
fn mut_block(&mut self, addr: u32) -> &mut Block {
|
fn mut_block(&mut self, addr: u32) -> &mut Block {
|
||||||
self.data
|
self.data.entry(addr).or_default()
|
||||||
.entry(addr)
|
|
||||||
.or_insert_with(|| Block { data: [0; 256] });
|
|
||||||
|
|
||||||
self.data.get_mut(&addr).map_or_else(
|
|
||||||
|| panic!("Could not fetch block with address {addr:x?}"),
|
|
||||||
|block| block,
|
|
||||||
)
|
|
||||||
}
|
}
|
||||||
|
|
||||||
|
#[inline]
|
||||||
fn block(&mut self, addr: u32) -> &Block {
|
fn block(&mut self, addr: u32) -> &Block {
|
||||||
self.data
|
self.data.entry(addr).or_default()
|
||||||
.entry(addr)
|
|
||||||
.or_insert_with(|| Block { data: [0; 256] });
|
|
||||||
|
|
||||||
self.data.get(&addr).map_or_else(
|
|
||||||
|| panic!("Could not fetch block with address {addr:x?}"),
|
|
||||||
|block| block,
|
|
||||||
)
|
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
impl MemoryUnit for MainStore {
|
impl MemoryUnit for MainStore {
|
||||||
|
#[inline]
|
||||||
fn reset(&mut self) {
|
fn reset(&mut self) {
|
||||||
self.data.clear();
|
self.data.clear();
|
||||||
}
|
}
|
||||||
|
|
||||||
fn read_byte(&mut self, addr: u32) -> Result<u8, ProcessorError> {
|
#[inline]
|
||||||
|
fn read_byte(&mut self, addr: u32) -> u8 {
|
||||||
let (block_addr, offset) = Self::segment_addr(addr);
|
let (block_addr, offset) = Self::segment_addr(addr);
|
||||||
let block = self.block(block_addr);
|
let block = self.block(block_addr);
|
||||||
Ok(block.data[offset as usize])
|
block.data[offset as usize]
|
||||||
}
|
}
|
||||||
|
|
||||||
|
#[inline]
|
||||||
fn read_word(&mut self, addr: u32) -> Result<u32, ProcessorError> {
|
fn read_word(&mut self, addr: u32) -> Result<u32, ProcessorError> {
|
||||||
if addr % 4 != 0 {
|
if addr % 4 != 0 {
|
||||||
return Err(ProcessorError::BadMemoryAccess(addr));
|
return Err(ProcessorError::BadMemoryAccess(addr));
|
||||||
}
|
}
|
||||||
|
|
||||||
let (block_addr, offset) = Self::segment_addr(addr);
|
let (block_addr, offset) = Self::segment_addr(addr);
|
||||||
let block = self.mut_block(block_addr);
|
let offset = offset as usize;
|
||||||
let mut bytes = [0; 4];
|
let block = self.block(block_addr);
|
||||||
bytes[0] = block.data[offset as usize];
|
Ok(u32::from_be_bytes(
|
||||||
bytes[1] = block.data[(offset + 1) as usize];
|
block.data[offset..=offset + 3]
|
||||||
bytes[2] = block.data[(offset + 2) as usize];
|
.try_into()
|
||||||
bytes[3] = block.data[(offset + 3) as usize];
|
.expect("Failed to read word!"),
|
||||||
Ok(u32::from_be_bytes(bytes))
|
))
|
||||||
}
|
}
|
||||||
|
|
||||||
fn read_range(&mut self, addr: u32, size: u32) -> Result<Vec<u8>, ProcessorError> {
|
#[inline]
|
||||||
|
fn read_range(&mut self, addr: u32, size: u32) -> Vec<u8> {
|
||||||
let mut data = Vec::with_capacity(size as usize);
|
let mut data = Vec::with_capacity(size as usize);
|
||||||
for i in 0..size {
|
for i in 0..size {
|
||||||
data.push(self.read_byte(addr + i)?);
|
data.push(self.read_byte(addr + i));
|
||||||
}
|
}
|
||||||
|
|
||||||
Ok(data)
|
data
|
||||||
}
|
}
|
||||||
|
|
||||||
fn write_byte(&mut self, addr: u32, value: u8) -> Result<(), ProcessorError> {
|
#[inline]
|
||||||
|
fn write_byte(&mut self, addr: u32, value: u8) {
|
||||||
let (block_addr, offset) = Self::segment_addr(addr);
|
let (block_addr, offset) = Self::segment_addr(addr);
|
||||||
let block = self.mut_block(block_addr);
|
let block = self.mut_block(block_addr);
|
||||||
block.data[offset as usize] = value;
|
block.data[offset as usize] = value;
|
||||||
Ok(())
|
|
||||||
}
|
}
|
||||||
|
|
||||||
|
#[inline]
|
||||||
fn write_word(&mut self, addr: u32, value: u32) -> Result<(), ProcessorError> {
|
fn write_word(&mut self, addr: u32, value: u32) -> Result<(), ProcessorError> {
|
||||||
if addr % 4 != 0 {
|
if addr % 4 != 0 {
|
||||||
return Err(ProcessorError::BadMemoryAccess(addr));
|
return Err(ProcessorError::BadMemoryAccess(addr));
|
||||||
@@ -138,33 +130,36 @@ impl MemoryUnit for MainStore {
|
|||||||
|
|
||||||
let (block_addr, offset) = Self::segment_addr(addr);
|
let (block_addr, offset) = Self::segment_addr(addr);
|
||||||
let block = self.mut_block(block_addr);
|
let block = self.mut_block(block_addr);
|
||||||
block.data[offset as usize] = (value >> 24) as u8;
|
block.data[offset as usize..=(offset + 3) as usize]
|
||||||
block.data[(offset + 1) as usize] = (value >> 16) as u8;
|
.copy_from_slice(&value.to_be_bytes());
|
||||||
block.data[(offset + 2) as usize] = (value >> 8) as u8;
|
|
||||||
block.data[(offset + 3) as usize] = value as u8;
|
|
||||||
Ok(())
|
Ok(())
|
||||||
}
|
}
|
||||||
|
|
||||||
fn write_range(&mut self, addr: u32, value: Vec<u8>) -> Result<(), ProcessorError> {
|
#[inline]
|
||||||
for (i, byte) in value.into_iter().enumerate() {
|
fn write_range(&mut self, addr: u32, value: Vec<u8>) {
|
||||||
let (block_addr, offset) = Self::segment_addr(addr + i as u32);
|
let mut current_block_addr = addr / 256;
|
||||||
let block = self.mut_block(block_addr);
|
let mut current_block = self.mut_block(current_block_addr);
|
||||||
block.data[offset as usize] = byte;
|
let mut offset = addr % 256;
|
||||||
|
for byte in value {
|
||||||
|
current_block.data[offset as usize] = byte;
|
||||||
|
offset += 1;
|
||||||
|
if offset >= 256 {
|
||||||
|
offset = 0;
|
||||||
|
current_block_addr += 1;
|
||||||
|
current_block = self.mut_block(current_block_addr);
|
||||||
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
Ok(())
|
|
||||||
}
|
}
|
||||||
|
|
||||||
fn read_block(&mut self, addr: u32) -> Result<[u8; 256], ProcessorError> {
|
#[inline]
|
||||||
|
fn read_block(&mut self, addr: u32) -> &[u8; 256] {
|
||||||
let (block_addr, _) = Self::segment_addr(addr);
|
let (block_addr, _) = Self::segment_addr(addr);
|
||||||
let block = self.block(block_addr);
|
&self.block(block_addr).data
|
||||||
Ok(block.data)
|
|
||||||
}
|
}
|
||||||
|
|
||||||
fn write_block(&mut self, addr: u32, data: [u8; 256]) -> Result<(), ProcessorError> {
|
#[inline]
|
||||||
|
fn write_block(&mut self, addr: u32, data: &[u8; 256]) {
|
||||||
let (block_addr, _) = Self::segment_addr(addr);
|
let (block_addr, _) = Self::segment_addr(addr);
|
||||||
let block = self.mut_block(block_addr);
|
let _ = self.data.insert(block_addr, Block { data: *data });
|
||||||
block.data = data;
|
|
||||||
Ok(())
|
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|||||||
@@ -257,8 +257,8 @@ impl RegFile {
|
|||||||
self.pcx = 0;
|
self.pcx = 0;
|
||||||
}
|
}
|
||||||
|
|
||||||
pub fn reg(&mut self, reg: Register) -> &mut u32 {
|
pub const fn reg(&mut self, reg: Register) -> Result<&mut u32, ProcessorError> {
|
||||||
match reg {
|
Ok(match reg {
|
||||||
Register::Rg0 => &mut self.rg0,
|
Register::Rg0 => &mut self.rg0,
|
||||||
Register::Rg1 => &mut self.rg1,
|
Register::Rg1 => &mut self.rg1,
|
||||||
Register::Rg2 => &mut self.rg2,
|
Register::Rg2 => &mut self.rg2,
|
||||||
@@ -286,13 +286,13 @@ impl RegFile {
|
|||||||
Register::Sts => &mut self.sts,
|
Register::Sts => &mut self.sts,
|
||||||
Register::Cir => &mut self.cir,
|
Register::Cir => &mut self.cir,
|
||||||
Register::Pcx => &mut self.pcx,
|
Register::Pcx => &mut self.pcx,
|
||||||
_ => panic!("Invalid register."),
|
_ => return Err(ProcessorError::InvalidRegister(Register::NoReg as u8)),
|
||||||
}
|
})
|
||||||
}
|
}
|
||||||
|
|
||||||
#[must_use]
|
#[must_use]
|
||||||
pub fn get(&self, reg: Register) -> u32 {
|
pub const fn get(&self, reg: Register) -> Result<u32, ProcessorError> {
|
||||||
match reg {
|
Ok(match reg {
|
||||||
Register::Rg0 => self.rg0,
|
Register::Rg0 => self.rg0,
|
||||||
Register::Rg1 => self.rg1,
|
Register::Rg1 => self.rg1,
|
||||||
Register::Rg2 => self.rg2,
|
Register::Rg2 => self.rg2,
|
||||||
@@ -321,7 +321,7 @@ impl RegFile {
|
|||||||
Register::Cir => self.cir,
|
Register::Cir => self.cir,
|
||||||
Register::Pcx => self.pcx,
|
Register::Pcx => self.pcx,
|
||||||
Register::Zero => 0,
|
Register::Zero => 0,
|
||||||
_ => panic!("Invalid register."),
|
_ => return Err(ProcessorError::InvalidRegister(Register::NoReg as u8)),
|
||||||
}
|
})
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|||||||
@@ -16,10 +16,9 @@ pub struct Processor {
|
|||||||
pub halted: bool,
|
pub halted: bool,
|
||||||
pub io_devices: Vec<Arc<dyn IODevice>>,
|
pub io_devices: Vec<Arc<dyn IODevice>>,
|
||||||
|
|
||||||
pub dustbin: u32,
|
pub void: u32,
|
||||||
}
|
}
|
||||||
|
|
||||||
#[expect(dead_code)]
|
|
||||||
fn log(message: &str) {
|
fn log(message: &str) {
|
||||||
println!("\x1b[32mINFO:\x1b[0m {message}");
|
println!("\x1b[32mINFO:\x1b[0m {message}");
|
||||||
}
|
}
|
||||||
@@ -32,7 +31,7 @@ impl Processor {
|
|||||||
registers: RegFile::default(),
|
registers: RegFile::default(),
|
||||||
halted: false,
|
halted: false,
|
||||||
io_devices,
|
io_devices,
|
||||||
dustbin: 0,
|
void: 0,
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
@@ -50,16 +49,16 @@ impl Processor {
|
|||||||
self.halted = false;
|
self.halted = false;
|
||||||
|
|
||||||
// Get value from PCX.
|
// Get value from PCX.
|
||||||
let addr = self.fetch();
|
let addr = self.fetch()?;
|
||||||
// Increment PCX.
|
// Increment PCX.
|
||||||
self.advance();
|
self.advance()?;
|
||||||
|
|
||||||
// Set MAR to the previous value of PCX.
|
// Set MAR to the previous value of PCX.
|
||||||
*self.reg(Register::Mar) = addr;
|
*self.reg(Register::Mar)? = addr;
|
||||||
let val = self.memory.read_word(addr)?;
|
let val = self.memory.read_word(addr)?;
|
||||||
|
|
||||||
// Set CIR to the value of RAM[MAR].
|
// Set CIR to the value of RAM[MAR].
|
||||||
*self.reg(Register::Mar) = val;
|
*self.reg(Register::Mar)? = val;
|
||||||
|
|
||||||
// Decode and execute the instruction.
|
// Decode and execute the instruction.
|
||||||
let instruction = Instruction::decode(val)
|
let instruction = Instruction::decode(val)
|
||||||
@@ -69,24 +68,23 @@ impl Processor {
|
|||||||
Ok((addr, instruction))
|
Ok((addr, instruction))
|
||||||
}
|
}
|
||||||
|
|
||||||
fn fetch(&self) -> u32 {
|
const fn fetch(&self) -> Result<u32, ProcessorError> {
|
||||||
self.get(Register::Pcx)
|
self.get(Register::Pcx)
|
||||||
}
|
}
|
||||||
|
|
||||||
#[must_use]
|
pub const fn get(&self, reg: Register) -> Result<u32, ProcessorError> {
|
||||||
pub fn get(&self, reg: Register) -> u32 {
|
|
||||||
self.registers.get(reg)
|
self.registers.get(reg)
|
||||||
}
|
}
|
||||||
|
|
||||||
pub fn reg(&mut self, reg: Register) -> &mut u32 {
|
pub const fn reg(&mut self, reg: Register) -> Result<&mut u32, ProcessorError> {
|
||||||
match reg {
|
match reg {
|
||||||
Register::Zero => &mut self.dustbin,
|
Register::Zero => Ok(&mut self.void),
|
||||||
_ => self.registers.reg(reg),
|
_ => self.registers.reg(reg),
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
pub fn display(&mut self) -> Result<Vec<u8>, ProcessorError> {
|
pub fn display(&mut self) -> Result<Vec<u8>, ProcessorError> {
|
||||||
self.memory.read_range(0x20000, 2000)
|
Ok(self.memory.read_range(0x20000, 2000))
|
||||||
}
|
}
|
||||||
|
|
||||||
pub fn cmp(&mut self, a: u32, b: u32) {
|
pub fn cmp(&mut self, a: u32, b: u32) {
|
||||||
@@ -98,44 +96,77 @@ impl Processor {
|
|||||||
// functions to set new state
|
// functions to set new state
|
||||||
fn set_flag(&mut self, flag: Flag, value: bool) {
|
fn set_flag(&mut self, flag: Flag, value: bool) {
|
||||||
if value {
|
if value {
|
||||||
*self.reg(Register::Sts) |= flag as u32;
|
*self
|
||||||
|
.reg(Register::Sts)
|
||||||
|
.expect("STS should never be invalid") |= flag as u32;
|
||||||
} else {
|
} else {
|
||||||
*self.reg(Register::Sts) &= !(flag as u32);
|
*self
|
||||||
|
.reg(Register::Sts)
|
||||||
|
.expect("STS should never be invalid") &= !(flag as u32);
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
fn get_flag(&self, flag: Flag) -> bool {
|
fn get_flag(&self, flag: Flag) -> Result<bool, ProcessorError> {
|
||||||
self.get(Register::Sts) & (flag as u32) != 0
|
Ok(self.get(Register::Sts)? & (flag as u32) != 0)
|
||||||
}
|
}
|
||||||
|
|
||||||
fn advance(&mut self) {
|
fn advance(&mut self) -> Result<(), ProcessorError> {
|
||||||
// increment PCX
|
// increment PCX
|
||||||
*self.reg(Register::Pcx) += 4;
|
*self.reg(Register::Pcx)? += 4;
|
||||||
|
Ok(())
|
||||||
}
|
}
|
||||||
|
|
||||||
fn jump(&mut self, reg: Register, offset: u16) {
|
fn jump(&mut self, reg: Register, offset: u16) -> Result<(), ProcessorError> {
|
||||||
*self.reg(Register::Pcx) = self.get(reg) + u32::from(offset);
|
*self.reg(Register::Pcx)? = self.get(reg)? + u32::from(offset);
|
||||||
|
Ok(())
|
||||||
}
|
}
|
||||||
|
|
||||||
pub fn begin_interrupt(&mut self, _int: Interrupt) {
|
pub fn begin_interrupt(
|
||||||
// first we get the address of the interrupt descriptor table.
|
&mut self,
|
||||||
todo!();
|
interrupt: Interrupt,
|
||||||
|
) -> Result<(), ProcessorError> {
|
||||||
|
let idt = self.get(Register::Idr)?;
|
||||||
|
|
||||||
|
let addr = self
|
||||||
|
.memory
|
||||||
|
.read_word(idt + u32::from(interrupt.as_u8()) * 4)?;
|
||||||
|
println!("INFO: Interrupt {interrupt:?} addr: {addr}");
|
||||||
|
|
||||||
|
self.push(self.get(Register::Pcx)?)?;
|
||||||
|
*self.reg(Register::Pcx)? = addr;
|
||||||
|
Ok(())
|
||||||
|
}
|
||||||
|
|
||||||
|
fn push(&mut self, val: u32) -> Result<(), ProcessorError> {
|
||||||
|
*self.reg(Register::Spr)? -= 4;
|
||||||
|
let reg = *self.reg(Register::Spr)?;
|
||||||
|
self.memory.write_word(reg, val)
|
||||||
|
}
|
||||||
|
|
||||||
|
fn pop(&mut self) -> Result<u32, ProcessorError> {
|
||||||
|
let reg = *self.reg(Register::Spr)?;
|
||||||
|
let val = self.memory.read_word(reg)?;
|
||||||
|
*self.reg(Register::Spr)? += 4;
|
||||||
|
Ok(val)
|
||||||
}
|
}
|
||||||
|
|
||||||
// TODO: remove this once implemented
|
// TODO: remove this once implemented
|
||||||
#[allow(clippy::needless_pass_by_ref_mut)]
|
#[allow(clippy::needless_pass_by_ref_mut)]
|
||||||
fn end_interrupt(&mut self) {
|
fn end_interrupt(&mut self) -> Result<(), ProcessorError> {
|
||||||
todo!();
|
let ret = self.pop()?;
|
||||||
|
*self.reg(Register::Ret)? = ret;
|
||||||
|
*self.reg(Register::Pcx)? = ret;
|
||||||
|
Ok(())
|
||||||
}
|
}
|
||||||
|
|
||||||
pub fn get_stack(&mut self, n: u32) -> Result<Vec<u8>, ProcessorError> {
|
pub fn get_stack(&mut self, n: u32) -> Result<Vec<u8>, ProcessorError> {
|
||||||
let addr = self.get(Register::Spr);
|
let addr = self.get(Register::Spr)?;
|
||||||
let size = n * 4;
|
let size = n * 4;
|
||||||
// returns the stack
|
// returns the stack
|
||||||
self.memory.read_range(
|
Ok(self.memory.read_range(
|
||||||
max(addr, 0), // ensures that we cannot read from a negative address
|
max(addr, 0), // ensures that we cannot read from a negative address
|
||||||
min(size, addr), // ensures we don't read above the top of the stack
|
min(size, addr), // ensures we don't read above the top of the stack
|
||||||
)
|
))
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
@@ -164,30 +195,30 @@ impl Executable for Instruction {
|
|||||||
// No operation - a blank line.
|
// No operation - a blank line.
|
||||||
// Copies from SrcReg to a.drReg.
|
// Copies from SrcReg to a.drReg.
|
||||||
Self::Mov(a) => {
|
Self::Mov(a) => {
|
||||||
*cpu.reg(a.dr) = cpu.get(a.sr1);
|
*cpu.reg(a.dr)? = cpu.get(a.sr1)?;
|
||||||
}
|
}
|
||||||
|
|
||||||
// Copies from SrcReg to a.drReg, sign extending the value to take up a full
|
// Copies from SrcReg to a.drReg, sign extending the value to take up a full
|
||||||
// word.
|
// word.
|
||||||
Self::MovSigned(a) => {
|
Self::MovSigned(a) => {
|
||||||
*cpu.reg(a.dr) = sign_extend(cpu.get(a.sr1));
|
*cpu.reg(a.dr)? = sign_extend(cpu.get(a.sr1)?);
|
||||||
}
|
}
|
||||||
|
|
||||||
// Loads a byte from memory address (base + offset) into a.drReg. The
|
// Loads a byte from memory address (base + offset) into a.drReg. The
|
||||||
// effective address must be byte-aligned.
|
// effective address must be byte-aligned.
|
||||||
Self::LoadByte(a) => {
|
Self::LoadByte(a) => {
|
||||||
*cpu.reg(a.r2) = u32::from(
|
*cpu.reg(a.r2)? = u32::from(
|
||||||
cpu.memory
|
cpu.memory
|
||||||
.read_byte(cpu.get(a.r1) + u32::from(a.immediate))?,
|
.read_byte(cpu.get(a.r1)? + u32::from(a.immediate)),
|
||||||
);
|
);
|
||||||
}
|
}
|
||||||
|
|
||||||
// Loads a sign-extended byte from memory address (base + offset) into
|
// Loads a sign-extended byte from memory address (base + offset) into
|
||||||
// a.drReg. The effective address must be byte-aligned.
|
// a.drReg. The effective address must be byte-aligned.
|
||||||
Self::LoadByteSigned(a) => {
|
Self::LoadByteSigned(a) => {
|
||||||
*cpu.reg(a.r2) = sign_extend(u32::from(
|
*cpu.reg(a.r2)? = sign_extend(u32::from(
|
||||||
cpu.memory
|
cpu.memory
|
||||||
.read_byte(cpu.get(a.r1) + u32::from(a.immediate))?,
|
.read_byte(cpu.get(a.r1)? + u32::from(a.immediate)),
|
||||||
));
|
));
|
||||||
}
|
}
|
||||||
|
|
||||||
@@ -196,18 +227,18 @@ impl Executable for Instruction {
|
|||||||
Self::LoadHalfword(a) => {
|
Self::LoadHalfword(a) => {
|
||||||
// we read an entire word, then right shift so we only get the first half
|
// we read an entire word, then right shift so we only get the first half
|
||||||
// of the word
|
// of the word
|
||||||
*cpu.reg(a.r2) = cpu
|
*cpu.reg(a.r2)? = cpu
|
||||||
.memory
|
.memory
|
||||||
.read_word(cpu.get(a.r1) + u32::from(a.immediate))?
|
.read_word(cpu.get(a.r1)? + u32::from(a.immediate))?
|
||||||
>> 16;
|
>> 16;
|
||||||
}
|
}
|
||||||
|
|
||||||
// Loads a sign-extended half-word from memory address (base + offset) into
|
// Loads a sign-extended half-word from memory address (base + offset) into
|
||||||
// a.drReg. The effective address must be 2-byte-aligned.
|
// a.drReg. The effective address must be 2-byte-aligned.
|
||||||
Self::LoadHalfwordSigned(a) => {
|
Self::LoadHalfwordSigned(a) => {
|
||||||
*cpu.reg(a.r2) = sign_extend(
|
*cpu.reg(a.r2)? = sign_extend(
|
||||||
cpu.memory
|
cpu.memory
|
||||||
.read_word(cpu.get(a.r1) + u32::from(a.immediate))?
|
.read_word(cpu.get(a.r1)? + u32::from(a.immediate))?
|
||||||
>> 16,
|
>> 16,
|
||||||
);
|
);
|
||||||
}
|
}
|
||||||
@@ -215,167 +246,165 @@ impl Executable for Instruction {
|
|||||||
// Loads a word from memory address (base + offset) into a.drReg. The
|
// Loads a word from memory address (base + offset) into a.drReg. The
|
||||||
// effective address must be 4-byte-aligned.
|
// effective address must be 4-byte-aligned.
|
||||||
Self::LoadWord(a) => {
|
Self::LoadWord(a) => {
|
||||||
*cpu.reg(a.r2) = cpu
|
*cpu.reg(a.r2)? = cpu
|
||||||
.memory
|
.memory
|
||||||
.read_word(cpu.get(a.r1) + u32::from(a.immediate))?;
|
.read_word(cpu.get(a.r1)? + u32::from(a.immediate))?;
|
||||||
}
|
}
|
||||||
|
|
||||||
// Stores a byte from SrcReg in memory address (base + offset) The effective
|
// Stores a byte from SrcReg in memory address (base + offset) The effective
|
||||||
// address must be byte-aligned.
|
// address must be byte-aligned.
|
||||||
Self::StoreByte(a) => {
|
Self::StoreByte(a) => {
|
||||||
cpu.memory.write_byte(
|
cpu.memory.write_byte(
|
||||||
cpu.get(a.r2) + u32::from(a.immediate),
|
cpu.get(a.r2)? + u32::from(a.immediate),
|
||||||
cpu.get(a.r1) as u8,
|
cpu.get(a.r1)? as u8,
|
||||||
)?;
|
);
|
||||||
}
|
}
|
||||||
|
|
||||||
// Stores a half-word from SrcReg in memory address (base + offset) The
|
// Stores a half-word from SrcReg in memory address (base + offset) The
|
||||||
// effective address must be 2-byte-aligned.
|
// effective address must be 2-byte-aligned.
|
||||||
Self::StoreHalfword(a) => {
|
Self::StoreHalfword(a) => {
|
||||||
// split the value into bytes and then write two bytes
|
// split the value into bytes and then write two bytes
|
||||||
let bytes = (cpu.get(a.r1) as u16).to_le_bytes();
|
let bytes = (cpu.get(a.r1)? as u16).to_le_bytes();
|
||||||
cpu.memory
|
cpu.memory
|
||||||
.write_byte(cpu.get(a.r2) + u32::from(a.immediate), bytes[0])?;
|
.write_byte(cpu.get(a.r2)? + u32::from(a.immediate), bytes[0]);
|
||||||
cpu.memory
|
cpu.memory
|
||||||
.write_byte(cpu.get(a.r2) + u32::from(a.immediate) + 1, bytes[1])?;
|
.write_byte(cpu.get(a.r2)? + u32::from(a.immediate) + 1, bytes[1]);
|
||||||
}
|
}
|
||||||
|
|
||||||
// Stores a word from SrcReg in memory address (base + offset) The effective
|
// Stores a word from SrcReg in memory address (base + offset) The effective
|
||||||
// address must be 4-byte-aligned.
|
// address must be 4-byte-aligned.
|
||||||
Self::StoreWord(a) => {
|
Self::StoreWord(a) => {
|
||||||
cpu.memory
|
cpu.memory.write_word(
|
||||||
.write_word(cpu.get(a.r2) + u32::from(a.immediate), cpu.get(a.r1))?;
|
cpu.get(a.r2)? + u32::from(a.immediate),
|
||||||
|
cpu.get(a.r1)?,
|
||||||
|
)?;
|
||||||
}
|
}
|
||||||
|
|
||||||
// Loads a 16-bit literal value into reg, setting the bottom 16 bits of the
|
// Loads a 16-bit literal value into reg, setting the bottom 16 bits of the
|
||||||
// word. To populate the upper 16 bits, see LUI.
|
// word. To populate the upper 16 bits, see LUI.
|
||||||
Self::LoadLowerImmediate(a) => {
|
Self::LoadLowerImmediate(a) => {
|
||||||
*cpu.reg(a.r1) = u32::from(a.immediate);
|
*cpu.reg(a.r1)? = u32::from(a.immediate);
|
||||||
}
|
}
|
||||||
|
|
||||||
// Loads a 16-bit literal value into reg, setting the top 16 bits of the word.
|
// Loads a 16-bit literal value into reg, setting the top 16 bits of the word.
|
||||||
// To populate the lower 16 bits, see LLI.
|
// To populate the lower 16 bits, see LLI.
|
||||||
Self::LoadUpperImmediate(a) => {
|
Self::LoadUpperImmediate(a) => {
|
||||||
*cpu.reg(a.r1) =
|
*cpu.reg(a.r1)? =
|
||||||
(cpu.get(a.r1) & 0x0000_FFFF) | (u32::from(a.immediate) << 16);
|
(cpu.get(a.r1)? & 0x0000_FFFF) | (u32::from(a.immediate) << 16);
|
||||||
}
|
}
|
||||||
|
|
||||||
// Unconditionally jumps to the calculated address or direct address
|
// Unconditionally jumps to the calculated address or direct address
|
||||||
Self::Jump(a) => cpu.jump(a.r1, a.immediate),
|
Self::Jump(a) => cpu.jump(a.r1, a.immediate)?,
|
||||||
|
|
||||||
// Jumps to the calculated address or direct address if equal flag set.
|
// Jumps to the calculated address or direct address if equal flag set.
|
||||||
Self::JumpEq(a) => {
|
Self::JumpEq(a) => {
|
||||||
if cpu.get_flag(Flag::Equal) {
|
if cpu.get_flag(Flag::Equal)? {
|
||||||
cpu.jump(a.r1, a.immediate);
|
cpu.jump(a.r1, a.immediate)?;
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
// Jumps to the calculated address or direct address if equal flag not set.
|
// Jumps to the calculated address or direct address if equal flag not set.
|
||||||
Self::JumpNeq(a) => {
|
Self::JumpNeq(a) => {
|
||||||
if !cpu.get_flag(Flag::Equal) {
|
if !cpu.get_flag(Flag::Equal)? {
|
||||||
cpu.jump(a.r1, a.immediate);
|
cpu.jump(a.r1, a.immediate)?;
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
// Jumps to the calculated address or direct address if greater than flag set.
|
// Jumps to the calculated address or direct address if greater than flag set.
|
||||||
Self::JumpGt(a) => {
|
Self::JumpGt(a) => {
|
||||||
if cpu.get_flag(Flag::GreaterThan) {
|
if cpu.get_flag(Flag::GreaterThan)? {
|
||||||
cpu.jump(a.r1, a.immediate);
|
cpu.jump(a.r1, a.immediate)?;
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
// Jumps to the calculated address or direct address if greater than flag or
|
// Jumps to the calculated address or direct address if greater than flag or
|
||||||
// equal flag set.
|
// equal flag set.
|
||||||
Self::JumpGe(a) => {
|
Self::JumpGe(a) => {
|
||||||
if cpu.get_flag(Flag::GreaterThan) || cpu.get_flag(Flag::Equal) {
|
if cpu.get_flag(Flag::GreaterThan)? || cpu.get_flag(Flag::Equal)? {
|
||||||
cpu.jump(a.r1, a.immediate);
|
cpu.jump(a.r1, a.immediate)?;
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
// Jumps to the calculated address or direct address if less than flag set.
|
// Jumps to the calculated address or direct address if less than flag set.
|
||||||
Self::JumpLt(a) => {
|
Self::JumpLt(a) => {
|
||||||
if cpu.get_flag(Flag::LessThan) {
|
if cpu.get_flag(Flag::LessThan)? {
|
||||||
cpu.jump(a.r1, a.immediate);
|
cpu.jump(a.r1, a.immediate)?;
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
// Jumps to the calculated address or direct address if less than flag or
|
// Jumps to the calculated address or direct address if less than flag or
|
||||||
// equal flag set.
|
// equal flag set.
|
||||||
Self::JumpLe(a) => {
|
Self::JumpLe(a) => {
|
||||||
if cpu.get_flag(Flag::LessThan) || cpu.get_flag(Flag::Equal) {
|
if cpu.get_flag(Flag::LessThan)? || cpu.get_flag(Flag::Equal)? {
|
||||||
cpu.jump(a.r1, a.immediate);
|
cpu.jump(a.r1, a.immediate)?;
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
// Increments the value in the given register
|
// Increments the value in the given register
|
||||||
Self::Increment(a) => *cpu.reg(a.sr1) = inc(cpu.get(a.sr1)),
|
Self::Increment(a) => *cpu.reg(a.sr1)? = inc(cpu.get(a.sr1)?),
|
||||||
|
|
||||||
// Decrements the value in the given register
|
// Decrements the value in the given register
|
||||||
Self::Decrement(a) => *cpu.reg(a.sr1) = dec(cpu.get(a.sr1)),
|
Self::Decrement(a) => *cpu.reg(a.sr1)? = dec(cpu.get(a.sr1)?),
|
||||||
|
|
||||||
// Left shifts the value in Reg by the given amount (either a register, or a
|
// Left shifts the value in Reg by the given amount (either a register, or a
|
||||||
// literal value)
|
// literal value)
|
||||||
Self::ShiftLeft(a) => {
|
Self::ShiftLeft(a) => {
|
||||||
let regval = cpu.get(a.sr2);
|
let reg = cpu.get(a.sr1)?;
|
||||||
let val = cpu.get(a.sr1);
|
let val = a.shamt;
|
||||||
|
*cpu.reg(a.sr1)? = shl(reg, val);
|
||||||
*cpu.reg(a.sr1) =
|
|
||||||
shl(val, if regval != 0 { regval as u8 } else { a.shamt });
|
|
||||||
}
|
}
|
||||||
|
|
||||||
// Right shifts the value in Reg by the given amount (either a register, or a
|
// Right shifts the value in Reg by the given amount (either a register, or a
|
||||||
// literal value).
|
// literal value).
|
||||||
Self::ShiftRight(a) => {
|
Self::ShiftRight(a) => {
|
||||||
let regval = cpu.get(a.sr2);
|
let regval = cpu.get(a.sr1)?;
|
||||||
let val = cpu.get(a.sr1);
|
let val = a.shamt;
|
||||||
|
*cpu.reg(a.sr1)? = shr(regval, val);
|
||||||
*cpu.reg(a.sr1) =
|
|
||||||
shr(val, if regval != 0 { regval as u8 } else { a.shamt });
|
|
||||||
}
|
}
|
||||||
|
|
||||||
// Adds the value of Src2 to Src1 and writes the result to a.dr
|
// Adds the value of Src2 to Src1 and writes the result to a.dr
|
||||||
Self::Add(a) => {
|
Self::Add(a) => {
|
||||||
*cpu.reg(a.dr) = add(cpu.get(a.sr1), cpu.get(a.sr2));
|
*cpu.reg(a.dr)? = add(cpu.get(a.sr1)?, cpu.get(a.sr2)?);
|
||||||
}
|
}
|
||||||
|
|
||||||
// Subtracts the value of Src2 from Src1 and writes the result to a.dr
|
// Subtracts the value of Src2 from Src1 and writes the result to a.dr
|
||||||
Self::Sub(a) => {
|
Self::Sub(a) => {
|
||||||
*cpu.reg(a.dr) = sub(cpu.get(a.sr1), cpu.get(a.sr2));
|
*cpu.reg(a.dr)? = sub(cpu.get(a.sr1)?, cpu.get(a.sr2)?);
|
||||||
}
|
}
|
||||||
|
|
||||||
Self::AddImmediate(a) => {
|
Self::AddImmediate(a) => {
|
||||||
*cpu.reg(a.r2) = add(cpu.get(a.r1), u32::from(a.immediate));
|
*cpu.reg(a.r2)? = add(cpu.get(a.r1)?, u32::from(a.immediate));
|
||||||
}
|
}
|
||||||
|
|
||||||
Self::SubImmediate(a) => {
|
Self::SubImmediate(a) => {
|
||||||
*cpu.reg(a.r2) = sub(cpu.get(a.r1), u32::from(a.immediate));
|
*cpu.reg(a.r2)? = sub(cpu.get(a.r1)?, u32::from(a.immediate));
|
||||||
}
|
}
|
||||||
|
|
||||||
// Performs bitwise AND on Src1 and Src2 storing the result in a.dr
|
// Performs bitwise AND on Src1 and Src2 storing the result in a.dr
|
||||||
Self::And(a) => *cpu.reg(a.dr) = and(cpu.get(a.sr1), cpu.get(a.sr2)),
|
Self::And(a) => *cpu.reg(a.dr)? = and(cpu.get(a.sr1)?, cpu.get(a.sr2)?),
|
||||||
|
|
||||||
// Performs bitwise OR on Src1 and Src2 storing the result in a.dr
|
// Performs bitwise OR on Src1 and Src2 storing the result in a.dr
|
||||||
Self::Or(a) => *cpu.reg(a.dr) = or(cpu.get(a.sr1), cpu.get(a.sr2)),
|
Self::Or(a) => *cpu.reg(a.dr)? = or(cpu.get(a.sr1)?, cpu.get(a.sr2)?),
|
||||||
|
|
||||||
// Performs bitwise NOT on Src storing the result in a.dr
|
// Performs bitwise NOT on Src storing the result in a.dr
|
||||||
Self::Not(a) => *cpu.reg(a.dr) = not(cpu.get(a.sr1)),
|
Self::Not(a) => *cpu.reg(a.dr)? = not(cpu.get(a.sr1)?),
|
||||||
|
|
||||||
// Performs bitwise XOR on Src1 and Src2 storing the result in a.dr
|
// Performs bitwise XOR on Src1 and Src2 storing the result in a.dr
|
||||||
Self::Xor(a) => *cpu.reg(a.dr) = xor(cpu.get(a.sr1), cpu.get(a.sr2)),
|
Self::Xor(a) => *cpu.reg(a.dr)? = xor(cpu.get(a.sr1)?, cpu.get(a.sr2)?),
|
||||||
|
|
||||||
// Performs bitwise NAND on Src1 and Src2 storing the result in a.dr
|
// Performs bitwise NAND on Src1 and Src2 storing the result in a.dr
|
||||||
Self::Nand(a) => *cpu.reg(a.dr) = nand(cpu.get(a.sr1), cpu.get(a.sr2)),
|
Self::Nand(a) => *cpu.reg(a.dr)? = nand(cpu.get(a.sr1)?, cpu.get(a.sr2)?),
|
||||||
|
|
||||||
// Performs bitwise NOR on Src1 and Src2 storing the result in a.dr
|
// Performs bitwise NOR on Src1 and Src2 storing the result in a.dr
|
||||||
Self::Nor(a) => *cpu.reg(a.dr) = nor(cpu.get(a.sr1), cpu.get(a.sr2)),
|
Self::Nor(a) => *cpu.reg(a.dr)? = nor(cpu.get(a.sr1)?, cpu.get(a.sr2)?),
|
||||||
|
|
||||||
// Performs bitwise XNOR on Src1 and Src2 storing the result in a.dr
|
// Performs bitwise XNOR on Src1 and Src2 storing the result in a.dr
|
||||||
Self::Xnor(a) => *cpu.reg(a.dr) = xnor(cpu.get(a.sr1), cpu.get(a.sr2)),
|
Self::Xnor(a) => *cpu.reg(a.dr)? = xnor(cpu.get(a.sr1)?, cpu.get(a.sr2)?),
|
||||||
|
|
||||||
// Compares the value of Reg1 to the value in Reg2. The results of the
|
// Compares the value of Reg1 to the value in Reg2. The results of the
|
||||||
// comparisons are set in the Status register.
|
// comparisons are set in the Status register.
|
||||||
Self::Compare(a) => {
|
Self::Compare(a) => {
|
||||||
cpu.cmp(cpu.get(a.sr1), cpu.get(a.sr2));
|
cpu.cmp(cpu.get(a.sr1)?, cpu.get(a.sr2)?);
|
||||||
}
|
}
|
||||||
|
|
||||||
// Initiates an interrupt with the given 8 bit interrupt code.
|
// Initiates an interrupt with the given 8 bit interrupt code.
|
||||||
@@ -383,12 +412,12 @@ impl Executable for Instruction {
|
|||||||
// - The return address is saved to the RET register.
|
// - The return address is saved to the RET register.
|
||||||
// - The stack base ptr is set to the kernel stack.
|
// - The stack base ptr is set to the kernel stack.
|
||||||
Self::Interrupt(interrupt_code) => {
|
Self::Interrupt(interrupt_code) => {
|
||||||
cpu.begin_interrupt(interrupt_code);
|
cpu.begin_interrupt(interrupt_code)?;
|
||||||
}
|
}
|
||||||
|
|
||||||
// Returns from an interrupt,
|
// Returns from an interrupt,
|
||||||
Self::IntReturn => {
|
Self::IntReturn => {
|
||||||
cpu.end_interrupt();
|
cpu.end_interrupt()?;
|
||||||
}
|
}
|
||||||
|
|
||||||
// Halts the processor.
|
// Halts the processor.
|
||||||
|
|||||||
@@ -18,19 +18,27 @@ fn test_nop_instruction() {
|
|||||||
);
|
);
|
||||||
|
|
||||||
assert_eq!(
|
assert_eq!(
|
||||||
cpu.registers.get(Register::Rg0),
|
cpu.registers
|
||||||
initial_state.get(Register::Rg0)
|
.get(Register::Rg0)
|
||||||
|
.expect("Failed to get register Rg0"),
|
||||||
|
initial_state
|
||||||
|
.get(Register::Rg0)
|
||||||
|
.expect("Failed to get register Rg0")
|
||||||
);
|
);
|
||||||
assert_eq!(
|
assert_eq!(
|
||||||
cpu.registers.get(Register::Acc),
|
cpu.registers
|
||||||
initial_state.get(Register::Acc)
|
.get(Register::Acc)
|
||||||
|
.expect("Failed to get register Acc"),
|
||||||
|
initial_state
|
||||||
|
.get(Register::Acc)
|
||||||
|
.expect("Failed to get register Acc")
|
||||||
);
|
);
|
||||||
}
|
}
|
||||||
|
|
||||||
#[test]
|
#[test]
|
||||||
fn test_mov_instruction() {
|
fn test_mov_instruction() {
|
||||||
let mut cpu = create_test_processor();
|
let mut cpu = create_test_processor();
|
||||||
*cpu.reg(Register::Rg1) = 0x1234_5678;
|
*cpu.reg(Register::Rg1).expect("Failed to get register Rg1") = 0x1234_5678;
|
||||||
|
|
||||||
let mov_instr = Instruction::Mov(RTypeArgs::new(
|
let mov_instr = Instruction::Mov(RTypeArgs::new(
|
||||||
Some(Register::Rg1),
|
Some(Register::Rg1),
|
||||||
@@ -42,13 +50,16 @@ fn test_mov_instruction() {
|
|||||||
mov_instr.execute(&mut cpu).expect(
|
mov_instr.execute(&mut cpu).expect(
|
||||||
"Emulator was slain by losing the game while attempting to execute instruction",
|
"Emulator was slain by losing the game while attempting to execute instruction",
|
||||||
);
|
);
|
||||||
assert_eq!(cpu.get(Register::Rg2), 0x1234_5678);
|
assert_eq!(
|
||||||
|
cpu.get(Register::Rg2).expect("Failed to get register Rg2"),
|
||||||
|
0x1234_5678
|
||||||
|
);
|
||||||
}
|
}
|
||||||
|
|
||||||
#[test]
|
#[test]
|
||||||
fn test_mov_signed_instruction() {
|
fn test_mov_signed_instruction() {
|
||||||
let mut cpu = create_test_processor();
|
let mut cpu = create_test_processor();
|
||||||
*cpu.reg(Register::Rg1) = 0x0000_00FF;
|
*cpu.reg(Register::Rg1).expect("Failed to get register Rg1") = 0x0000_00FF;
|
||||||
|
|
||||||
let mov_signed_instr = Instruction::MovSigned(RTypeArgs::new(
|
let mov_signed_instr = Instruction::MovSigned(RTypeArgs::new(
|
||||||
Some(Register::Rg1),
|
Some(Register::Rg1),
|
||||||
@@ -60,17 +71,18 @@ fn test_mov_signed_instruction() {
|
|||||||
mov_signed_instr.execute(&mut cpu).expect(
|
mov_signed_instr.execute(&mut cpu).expect(
|
||||||
"Emulator was slain by losing the game while attempting to execute instruction",
|
"Emulator was slain by losing the game while attempting to execute instruction",
|
||||||
);
|
);
|
||||||
assert_eq!(cpu.get(Register::Rg2), 0xFFFF_FFFF);
|
assert_eq!(
|
||||||
|
cpu.get(Register::Rg2).expect("Failed to get register Rg2"),
|
||||||
|
0xFFFF_FFFF
|
||||||
|
);
|
||||||
}
|
}
|
||||||
|
|
||||||
#[test]
|
#[test]
|
||||||
fn test_load_byte_instruction() {
|
fn test_load_byte_instruction() {
|
||||||
let mut cpu = create_test_processor();
|
let mut cpu = create_test_processor();
|
||||||
let addr = 0x100;
|
let addr = 0x100;
|
||||||
cpu.memory
|
cpu.memory.write_byte(addr, 0xAB);
|
||||||
.write_byte(addr, 0xAB)
|
*cpu.reg(Register::Rg1).expect("Failed to get register Rg1") = addr - 4;
|
||||||
.expect("Failed to write byte to memory");
|
|
||||||
*cpu.reg(Register::Rg1) = addr - 4;
|
|
||||||
|
|
||||||
let load_byte_instr = Instruction::LoadByte(ITypeArgs::new(
|
let load_byte_instr = Instruction::LoadByte(ITypeArgs::new(
|
||||||
4,
|
4,
|
||||||
@@ -81,17 +93,18 @@ fn test_load_byte_instruction() {
|
|||||||
load_byte_instr.execute(&mut cpu).expect(
|
load_byte_instr.execute(&mut cpu).expect(
|
||||||
"Emulator was slain by losing the game while attempting to execute instruction",
|
"Emulator was slain by losing the game while attempting to execute instruction",
|
||||||
);
|
);
|
||||||
assert_eq!(cpu.get(Register::Rg2), 0x0000_00AB);
|
assert_eq!(
|
||||||
|
cpu.get(Register::Rg2).expect("Failed to get register Rg2"),
|
||||||
|
0x0000_00AB
|
||||||
|
);
|
||||||
}
|
}
|
||||||
|
|
||||||
#[test]
|
#[test]
|
||||||
fn test_load_byte_signed_instruction() {
|
fn test_load_byte_signed_instruction() {
|
||||||
let mut cpu = create_test_processor();
|
let mut cpu = create_test_processor();
|
||||||
let addr = 0x100;
|
let addr = 0x100;
|
||||||
cpu.memory
|
cpu.memory.write_byte(addr, 0xFF);
|
||||||
.write_byte(addr, 0xFF)
|
*cpu.reg(Register::Rg1).expect("Failed to get register Rg1") = addr;
|
||||||
.expect("Failed to write byte to memory");
|
|
||||||
*cpu.reg(Register::Rg1) = addr;
|
|
||||||
|
|
||||||
let load_byte_signed_instr = Instruction::LoadByteSigned(ITypeArgs::new(
|
let load_byte_signed_instr = Instruction::LoadByteSigned(ITypeArgs::new(
|
||||||
0,
|
0,
|
||||||
@@ -102,7 +115,10 @@ fn test_load_byte_signed_instruction() {
|
|||||||
load_byte_signed_instr.execute(&mut cpu).expect(
|
load_byte_signed_instr.execute(&mut cpu).expect(
|
||||||
"Emulator was slain by losing the game while attempting to execute instruction",
|
"Emulator was slain by losing the game while attempting to execute instruction",
|
||||||
);
|
);
|
||||||
assert_eq!(cpu.get(Register::Rg2), 0xFFFF_FFFF);
|
assert_eq!(
|
||||||
|
cpu.get(Register::Rg2).expect("Failed to get register Rg2"),
|
||||||
|
0xFFFF_FFFF
|
||||||
|
);
|
||||||
}
|
}
|
||||||
|
|
||||||
#[test]
|
#[test]
|
||||||
@@ -112,7 +128,7 @@ fn test_load_halfword_instruction() {
|
|||||||
cpu.memory
|
cpu.memory
|
||||||
.write_word(addr, 0x1234_5678)
|
.write_word(addr, 0x1234_5678)
|
||||||
.expect("Failed to write word to memory");
|
.expect("Failed to write word to memory");
|
||||||
*cpu.reg(Register::Rg1) = addr;
|
*cpu.reg(Register::Rg1).expect("Failed to get register Rg1") = addr;
|
||||||
|
|
||||||
let load_halfword_instr = Instruction::LoadHalfword(ITypeArgs::new(
|
let load_halfword_instr = Instruction::LoadHalfword(ITypeArgs::new(
|
||||||
0,
|
0,
|
||||||
@@ -123,7 +139,10 @@ fn test_load_halfword_instruction() {
|
|||||||
load_halfword_instr.execute(&mut cpu).expect(
|
load_halfword_instr.execute(&mut cpu).expect(
|
||||||
"Emulator was slain by losing the game while attempting to execute instruction",
|
"Emulator was slain by losing the game while attempting to execute instruction",
|
||||||
);
|
);
|
||||||
assert_eq!(cpu.get(Register::Rg2), 0x0000_1234);
|
assert_eq!(
|
||||||
|
cpu.get(Register::Rg2).expect("Failed to get register Rg2"),
|
||||||
|
0x0000_1234
|
||||||
|
);
|
||||||
}
|
}
|
||||||
|
|
||||||
#[test]
|
#[test]
|
||||||
@@ -133,7 +152,7 @@ fn test_load_word_instruction() {
|
|||||||
cpu.memory
|
cpu.memory
|
||||||
.write_word(addr, 0x1234_5678)
|
.write_word(addr, 0x1234_5678)
|
||||||
.expect("Failed to write word to memory");
|
.expect("Failed to write word to memory");
|
||||||
*cpu.reg(Register::Rg1) = addr;
|
*cpu.reg(Register::Rg1).expect("Failed to get register Rg1") = addr;
|
||||||
|
|
||||||
let load_word_instr = Instruction::LoadWord(ITypeArgs::new(
|
let load_word_instr = Instruction::LoadWord(ITypeArgs::new(
|
||||||
0,
|
0,
|
||||||
@@ -144,15 +163,18 @@ fn test_load_word_instruction() {
|
|||||||
load_word_instr.execute(&mut cpu).expect(
|
load_word_instr.execute(&mut cpu).expect(
|
||||||
"Emulator was slain by losing the game while attempting to execute instruction",
|
"Emulator was slain by losing the game while attempting to execute instruction",
|
||||||
);
|
);
|
||||||
assert_eq!(cpu.get(Register::Rg2), 0x1234_5678);
|
assert_eq!(
|
||||||
|
cpu.get(Register::Rg2).expect("Failed to get register Rg2"),
|
||||||
|
0x1234_5678
|
||||||
|
);
|
||||||
}
|
}
|
||||||
|
|
||||||
#[test]
|
#[test]
|
||||||
fn test_store_byte_instruction() {
|
fn test_store_byte_instruction() {
|
||||||
let mut cpu = create_test_processor();
|
let mut cpu = create_test_processor();
|
||||||
let addr = 0x100;
|
let addr = 0x100;
|
||||||
*cpu.reg(Register::Rg1) = addr;
|
*cpu.reg(Register::Rg1).expect("Failed to get register Rg1") = addr;
|
||||||
*cpu.reg(Register::Rg2) = 0xAB;
|
*cpu.reg(Register::Rg2).expect("Failed to get register Rg2") = 0xAB;
|
||||||
|
|
||||||
let store_byte_instr = Instruction::StoreByte(ITypeArgs::new(
|
let store_byte_instr = Instruction::StoreByte(ITypeArgs::new(
|
||||||
0,
|
0,
|
||||||
@@ -163,15 +185,15 @@ fn test_store_byte_instruction() {
|
|||||||
store_byte_instr.execute(&mut cpu).expect(
|
store_byte_instr.execute(&mut cpu).expect(
|
||||||
"Emulator was slain by losing the game while attempting to execute instruction",
|
"Emulator was slain by losing the game while attempting to execute instruction",
|
||||||
);
|
);
|
||||||
assert_eq!(cpu.memory.read_byte(addr).expect("Emulator was slain by losing the game while attempting to execute instruction"), 0xAB);
|
assert_eq!(cpu.memory.read_byte(addr), 0xAB);
|
||||||
}
|
}
|
||||||
|
|
||||||
#[test]
|
#[test]
|
||||||
fn test_store_word_instruction() {
|
fn test_store_word_instruction() {
|
||||||
let mut cpu = create_test_processor();
|
let mut cpu = create_test_processor();
|
||||||
let addr = 0x100;
|
let addr = 0x100;
|
||||||
*cpu.reg(Register::Rg1) = addr;
|
*cpu.reg(Register::Rg1).expect("Failed to get register Rg1") = addr;
|
||||||
*cpu.reg(Register::Rg2) = 0x1234_5678;
|
*cpu.reg(Register::Rg2).expect("Failed to get register Rg2") = 0x1234_5678;
|
||||||
|
|
||||||
let store_word_instr = Instruction::StoreWord(ITypeArgs::new(
|
let store_word_instr = Instruction::StoreWord(ITypeArgs::new(
|
||||||
0,
|
0,
|
||||||
@@ -188,8 +210,8 @@ fn test_store_word_instruction() {
|
|||||||
#[test]
|
#[test]
|
||||||
fn test_add_instruction() {
|
fn test_add_instruction() {
|
||||||
let mut cpu = create_test_processor();
|
let mut cpu = create_test_processor();
|
||||||
*cpu.reg(Register::Rg1) = 15;
|
*cpu.reg(Register::Rg1).expect("Failed to get register Rg1") = 15;
|
||||||
*cpu.reg(Register::Rg2) = 25;
|
*cpu.reg(Register::Rg2).expect("Failed to get register Rg2") = 25;
|
||||||
|
|
||||||
let add_instr = Instruction::Add(RTypeArgs::new(
|
let add_instr = Instruction::Add(RTypeArgs::new(
|
||||||
Some(Register::Rg1),
|
Some(Register::Rg1),
|
||||||
@@ -201,14 +223,17 @@ fn test_add_instruction() {
|
|||||||
add_instr.execute(&mut cpu).expect(
|
add_instr.execute(&mut cpu).expect(
|
||||||
"Emulator was slain by losing the game while attempting to execute instruction",
|
"Emulator was slain by losing the game while attempting to execute instruction",
|
||||||
);
|
);
|
||||||
assert_eq!(cpu.get(Register::Rg3), 40);
|
assert_eq!(
|
||||||
|
cpu.get(Register::Rg3).expect("Failed to get register Rg3"),
|
||||||
|
40
|
||||||
|
);
|
||||||
}
|
}
|
||||||
|
|
||||||
#[test]
|
#[test]
|
||||||
fn test_sub_instruction() {
|
fn test_sub_instruction() {
|
||||||
let mut cpu = create_test_processor();
|
let mut cpu = create_test_processor();
|
||||||
*cpu.reg(Register::Rg1) = 50;
|
*cpu.reg(Register::Rg1).expect("Failed to get register Rg1") = 50;
|
||||||
*cpu.reg(Register::Rg2) = 20;
|
*cpu.reg(Register::Rg2).expect("Failed to get register Rg2") = 20;
|
||||||
|
|
||||||
let sub_instr = Instruction::Sub(RTypeArgs::new(
|
let sub_instr = Instruction::Sub(RTypeArgs::new(
|
||||||
Some(Register::Rg1),
|
Some(Register::Rg1),
|
||||||
@@ -220,14 +245,17 @@ fn test_sub_instruction() {
|
|||||||
sub_instr.execute(&mut cpu).expect(
|
sub_instr.execute(&mut cpu).expect(
|
||||||
"Emulator was slain by losing the game while attempting to execute instruction",
|
"Emulator was slain by losing the game while attempting to execute instruction",
|
||||||
);
|
);
|
||||||
assert_eq!(cpu.get(Register::Rg3), 30);
|
assert_eq!(
|
||||||
|
cpu.get(Register::Rg3).expect("Failed to get register Rg3"),
|
||||||
|
30
|
||||||
|
);
|
||||||
}
|
}
|
||||||
|
|
||||||
#[test]
|
#[test]
|
||||||
fn test_and_instruction() {
|
fn test_and_instruction() {
|
||||||
let mut cpu = create_test_processor();
|
let mut cpu = create_test_processor();
|
||||||
*cpu.reg(Register::Rg1) = 0b1100;
|
*cpu.reg(Register::Rg1).expect("Failed to get register Rg1") = 0b1100;
|
||||||
*cpu.reg(Register::Rg2) = 0b1010;
|
*cpu.reg(Register::Rg2).expect("Failed to get register Rg2") = 0b1010;
|
||||||
|
|
||||||
let and_instr = Instruction::And(RTypeArgs::new(
|
let and_instr = Instruction::And(RTypeArgs::new(
|
||||||
Some(Register::Rg1),
|
Some(Register::Rg1),
|
||||||
@@ -239,14 +267,17 @@ fn test_and_instruction() {
|
|||||||
and_instr.execute(&mut cpu).expect(
|
and_instr.execute(&mut cpu).expect(
|
||||||
"Emulator was slain by losing the game while attempting to execute instruction",
|
"Emulator was slain by losing the game while attempting to execute instruction",
|
||||||
);
|
);
|
||||||
assert_eq!(cpu.get(Register::Rg3), 0b1000);
|
assert_eq!(
|
||||||
|
cpu.get(Register::Rg3).expect("Failed to get register Rg3"),
|
||||||
|
0b1000
|
||||||
|
);
|
||||||
}
|
}
|
||||||
|
|
||||||
#[test]
|
#[test]
|
||||||
fn test_or_instruction() {
|
fn test_or_instruction() {
|
||||||
let mut cpu = create_test_processor();
|
let mut cpu = create_test_processor();
|
||||||
*cpu.reg(Register::Rg1) = 0b1100;
|
*cpu.reg(Register::Rg1).expect("Failed to get register Rg1") = 0b1100;
|
||||||
*cpu.reg(Register::Rg2) = 0b1010;
|
*cpu.reg(Register::Rg2).expect("Failed to get register Rg2") = 0b1010;
|
||||||
|
|
||||||
let or_instr = Instruction::Or(RTypeArgs::new(
|
let or_instr = Instruction::Or(RTypeArgs::new(
|
||||||
Some(Register::Rg1),
|
Some(Register::Rg1),
|
||||||
@@ -258,14 +289,17 @@ fn test_or_instruction() {
|
|||||||
or_instr.execute(&mut cpu).expect(
|
or_instr.execute(&mut cpu).expect(
|
||||||
"Emulator was slain by losing the game while attempting to execute instruction",
|
"Emulator was slain by losing the game while attempting to execute instruction",
|
||||||
);
|
);
|
||||||
assert_eq!(cpu.get(Register::Rg3), 0b1110);
|
assert_eq!(
|
||||||
|
cpu.get(Register::Rg3).expect("Failed to get register Rg3"),
|
||||||
|
0b1110
|
||||||
|
);
|
||||||
}
|
}
|
||||||
|
|
||||||
#[test]
|
#[test]
|
||||||
fn test_xor_instruction() {
|
fn test_xor_instruction() {
|
||||||
let mut cpu = create_test_processor();
|
let mut cpu = create_test_processor();
|
||||||
*cpu.reg(Register::Rg1) = 0b1100;
|
*cpu.reg(Register::Rg1).expect("Failed to get register Rg1") = 0b1100;
|
||||||
*cpu.reg(Register::Rg2) = 0b1010;
|
*cpu.reg(Register::Rg2).expect("Failed to get register Rg2") = 0b1010;
|
||||||
|
|
||||||
let xor_instr = Instruction::Xor(RTypeArgs::new(
|
let xor_instr = Instruction::Xor(RTypeArgs::new(
|
||||||
Some(Register::Rg1),
|
Some(Register::Rg1),
|
||||||
@@ -277,13 +311,16 @@ fn test_xor_instruction() {
|
|||||||
xor_instr.execute(&mut cpu).expect(
|
xor_instr.execute(&mut cpu).expect(
|
||||||
"Emulator was slain by losing the game while attempting to execute instruction",
|
"Emulator was slain by losing the game while attempting to execute instruction",
|
||||||
);
|
);
|
||||||
assert_eq!(cpu.get(Register::Rg3), 0b0110);
|
assert_eq!(
|
||||||
|
cpu.get(Register::Rg3).expect("Failed to get register Rg3"),
|
||||||
|
0b0110
|
||||||
|
);
|
||||||
}
|
}
|
||||||
|
|
||||||
#[test]
|
#[test]
|
||||||
fn test_not_instruction() {
|
fn test_not_instruction() {
|
||||||
let mut cpu = create_test_processor();
|
let mut cpu = create_test_processor();
|
||||||
*cpu.reg(Register::Rg1) = 0x0F0F_0F0F;
|
*cpu.reg(Register::Rg1).expect("Failed to get register Rg1") = 0x0F0F_0F0F;
|
||||||
|
|
||||||
let not_instr = Instruction::Not(RTypeArgs::new(
|
let not_instr = Instruction::Not(RTypeArgs::new(
|
||||||
Some(Register::Rg1),
|
Some(Register::Rg1),
|
||||||
@@ -295,14 +332,17 @@ fn test_not_instruction() {
|
|||||||
not_instr.execute(&mut cpu).expect(
|
not_instr.execute(&mut cpu).expect(
|
||||||
"Emulator was slain by losing the game while attempting to execute instruction",
|
"Emulator was slain by losing the game while attempting to execute instruction",
|
||||||
);
|
);
|
||||||
assert_eq!(cpu.get(Register::Rg2), 0xF0F0_F0F0);
|
assert_eq!(
|
||||||
|
cpu.get(Register::Rg2).expect("Failed to get register Rg2"),
|
||||||
|
0xF0F0_F0F0
|
||||||
|
);
|
||||||
}
|
}
|
||||||
|
|
||||||
#[test]
|
#[test]
|
||||||
fn test_compare_equal() {
|
fn test_compare_equal() {
|
||||||
let mut cpu = create_test_processor();
|
let mut cpu = create_test_processor();
|
||||||
*cpu.reg(Register::Rg1) = 42;
|
*cpu.reg(Register::Rg1).expect("Failed to get register Rg1") = 42;
|
||||||
*cpu.reg(Register::Rg2) = 42;
|
*cpu.reg(Register::Rg2).expect("Failed to get register Rg2") = 42;
|
||||||
|
|
||||||
let cmp_instr = Instruction::Compare(RTypeArgs::new(
|
let cmp_instr = Instruction::Compare(RTypeArgs::new(
|
||||||
Some(Register::Rg1),
|
Some(Register::Rg1),
|
||||||
@@ -315,16 +355,22 @@ fn test_compare_equal() {
|
|||||||
"Emulator was slain by losing the game while attempting to execute instruction",
|
"Emulator was slain by losing the game while attempting to execute instruction",
|
||||||
);
|
);
|
||||||
|
|
||||||
assert!(cpu.get_flag(Flag::Equal));
|
assert!(cpu.get_flag(Flag::Equal).expect("Failed to get flag Equal"));
|
||||||
assert!(!cpu.get_flag(Flag::GreaterThan));
|
assert!(
|
||||||
assert!(!cpu.get_flag(Flag::LessThan));
|
!cpu.get_flag(Flag::GreaterThan)
|
||||||
|
.expect("Failed to get flag GreaterThan")
|
||||||
|
);
|
||||||
|
assert!(
|
||||||
|
!cpu.get_flag(Flag::LessThan)
|
||||||
|
.expect("Failed to get flag LessThan")
|
||||||
|
);
|
||||||
}
|
}
|
||||||
|
|
||||||
#[test]
|
#[test]
|
||||||
fn test_compare_greater_than() {
|
fn test_compare_greater_than() {
|
||||||
let mut cpu = create_test_processor();
|
let mut cpu = create_test_processor();
|
||||||
*cpu.reg(Register::Rg1) = 50;
|
*cpu.reg(Register::Rg1).expect("Failed to get register Rg1") = 50;
|
||||||
*cpu.reg(Register::Rg2) = 30;
|
*cpu.reg(Register::Rg2).expect("Failed to get register Rg2") = 30;
|
||||||
|
|
||||||
let cmp_instr = Instruction::Compare(RTypeArgs::new(
|
let cmp_instr = Instruction::Compare(RTypeArgs::new(
|
||||||
Some(Register::Rg1),
|
Some(Register::Rg1),
|
||||||
@@ -337,16 +383,22 @@ fn test_compare_greater_than() {
|
|||||||
"Emulator was slain by losing the game while attempting to execute instruction",
|
"Emulator was slain by losing the game while attempting to execute instruction",
|
||||||
);
|
);
|
||||||
|
|
||||||
assert!(!cpu.get_flag(Flag::Equal));
|
assert!(!cpu.get_flag(Flag::Equal).expect("Failed to get flag Equal"));
|
||||||
assert!(cpu.get_flag(Flag::GreaterThan));
|
assert!(
|
||||||
assert!(!cpu.get_flag(Flag::LessThan));
|
cpu.get_flag(Flag::GreaterThan)
|
||||||
|
.expect("Failed to get flag GreaterThan")
|
||||||
|
);
|
||||||
|
assert!(
|
||||||
|
!cpu.get_flag(Flag::LessThan)
|
||||||
|
.expect("Failed to get flag LessThan")
|
||||||
|
);
|
||||||
}
|
}
|
||||||
|
|
||||||
#[test]
|
#[test]
|
||||||
fn test_compare_less_than() {
|
fn test_compare_less_than() {
|
||||||
let mut cpu = create_test_processor();
|
let mut cpu = create_test_processor();
|
||||||
*cpu.reg(Register::Rg1) = 20;
|
*cpu.reg(Register::Rg1).expect("Failed to get register Rg1") = 20;
|
||||||
*cpu.reg(Register::Rg2) = 30;
|
*cpu.reg(Register::Rg2).expect("Failed to get register Rg2") = 30;
|
||||||
|
|
||||||
let cmp_instr = Instruction::Compare(RTypeArgs::new(
|
let cmp_instr = Instruction::Compare(RTypeArgs::new(
|
||||||
Some(Register::Rg1),
|
Some(Register::Rg1),
|
||||||
@@ -359,15 +411,21 @@ fn test_compare_less_than() {
|
|||||||
"Emulator was slain by losing the game while attempting to execute instruction",
|
"Emulator was slain by losing the game while attempting to execute instruction",
|
||||||
);
|
);
|
||||||
|
|
||||||
assert!(!cpu.get_flag(Flag::Equal));
|
assert!(!cpu.get_flag(Flag::Equal).expect("Failed to get flag Equal"));
|
||||||
assert!(!cpu.get_flag(Flag::GreaterThan));
|
assert!(
|
||||||
assert!(cpu.get_flag(Flag::LessThan));
|
!cpu.get_flag(Flag::GreaterThan)
|
||||||
|
.expect("Failed to get flag GreaterThan")
|
||||||
|
);
|
||||||
|
assert!(
|
||||||
|
cpu.get_flag(Flag::LessThan)
|
||||||
|
.expect("Failed to get flag LessThan")
|
||||||
|
);
|
||||||
}
|
}
|
||||||
|
|
||||||
#[test]
|
#[test]
|
||||||
fn test_increment_instruction() {
|
fn test_increment_instruction() {
|
||||||
let mut cpu = create_test_processor();
|
let mut cpu = create_test_processor();
|
||||||
*cpu.reg(Register::Rg1) = 42;
|
*cpu.reg(Register::Rg1).expect("Failed to get register Rg1") = 42;
|
||||||
|
|
||||||
let inc_instr =
|
let inc_instr =
|
||||||
Instruction::Increment(RTypeArgs::new(Some(Register::Rg1), None, None, None));
|
Instruction::Increment(RTypeArgs::new(Some(Register::Rg1), None, None, None));
|
||||||
@@ -375,13 +433,16 @@ fn test_increment_instruction() {
|
|||||||
inc_instr.execute(&mut cpu).expect(
|
inc_instr.execute(&mut cpu).expect(
|
||||||
"Emulator was slain by losing the game while attempting to execute instruction",
|
"Emulator was slain by losing the game while attempting to execute instruction",
|
||||||
);
|
);
|
||||||
assert_eq!(cpu.get(Register::Rg1), 43);
|
assert_eq!(
|
||||||
|
cpu.get(Register::Rg1).expect("Failed to get register Rg1"),
|
||||||
|
43
|
||||||
|
);
|
||||||
}
|
}
|
||||||
|
|
||||||
#[test]
|
#[test]
|
||||||
fn test_decrement_instruction() {
|
fn test_decrement_instruction() {
|
||||||
let mut cpu = create_test_processor();
|
let mut cpu = create_test_processor();
|
||||||
*cpu.reg(Register::Rg1) = 42;
|
*cpu.reg(Register::Rg1).expect("Failed to get register Rg1") = 42;
|
||||||
|
|
||||||
let dec_instr =
|
let dec_instr =
|
||||||
Instruction::Decrement(RTypeArgs::new(Some(Register::Rg1), None, None, None));
|
Instruction::Decrement(RTypeArgs::new(Some(Register::Rg1), None, None, None));
|
||||||
@@ -389,13 +450,16 @@ fn test_decrement_instruction() {
|
|||||||
dec_instr.execute(&mut cpu).expect(
|
dec_instr.execute(&mut cpu).expect(
|
||||||
"Emulator was slain by losing the game while attempting to execute instruction",
|
"Emulator was slain by losing the game while attempting to execute instruction",
|
||||||
);
|
);
|
||||||
assert_eq!(cpu.get(Register::Rg1), 41);
|
assert_eq!(
|
||||||
|
cpu.get(Register::Rg1).expect("Failed to get register Rg1"),
|
||||||
|
41
|
||||||
|
);
|
||||||
}
|
}
|
||||||
|
|
||||||
#[test]
|
#[test]
|
||||||
fn test_shift_left_with_shamt() {
|
fn test_shift_left_with_shamt() {
|
||||||
let mut cpu = create_test_processor();
|
let mut cpu = create_test_processor();
|
||||||
*cpu.reg(Register::Rg1) = 0b1010;
|
*cpu.reg(Register::Rg1).expect("Failed to get register Rg1") = 0b1010;
|
||||||
|
|
||||||
let shl_instr = Instruction::ShiftLeft(RTypeArgs::new(
|
let shl_instr = Instruction::ShiftLeft(RTypeArgs::new(
|
||||||
Some(Register::Rg1),
|
Some(Register::Rg1),
|
||||||
@@ -407,13 +471,16 @@ fn test_shift_left_with_shamt() {
|
|||||||
shl_instr.execute(&mut cpu).expect(
|
shl_instr.execute(&mut cpu).expect(
|
||||||
"Emulator was slain by losing the game while attempting to execute instruction",
|
"Emulator was slain by losing the game while attempting to execute instruction",
|
||||||
);
|
);
|
||||||
assert_eq!(cpu.get(Register::Rg1), 0b10_1000);
|
assert_eq!(
|
||||||
|
cpu.get(Register::Rg1).expect("Failed to get register Rg1"),
|
||||||
|
0b10_1000
|
||||||
|
);
|
||||||
}
|
}
|
||||||
|
|
||||||
#[test]
|
#[test]
|
||||||
fn test_shift_right_with_shamt() {
|
fn test_shift_right_with_shamt() {
|
||||||
let mut cpu = create_test_processor();
|
let mut cpu = create_test_processor();
|
||||||
*cpu.reg(Register::Rg1) = 0b10_1000;
|
*cpu.reg(Register::Rg1).expect("Failed to get register Rg1") = 0b10_1000;
|
||||||
|
|
||||||
let shr_instr = Instruction::ShiftRight(RTypeArgs::new(
|
let shr_instr = Instruction::ShiftRight(RTypeArgs::new(
|
||||||
Some(Register::Rg1),
|
Some(Register::Rg1),
|
||||||
@@ -425,28 +492,30 @@ fn test_shift_right_with_shamt() {
|
|||||||
shr_instr.execute(&mut cpu).expect(
|
shr_instr.execute(&mut cpu).expect(
|
||||||
"Emulator was slain by losing the game while attempting to execute instruction",
|
"Emulator was slain by losing the game while attempting to execute instruction",
|
||||||
);
|
);
|
||||||
assert_eq!(cpu.get(Register::Rg1), 0b1010);
|
assert_eq!(
|
||||||
}
|
cpu.get(Register::Rg1).expect("Failed to get register Rg1"),
|
||||||
|
0b1010
|
||||||
#[test]
|
|
||||||
fn test_shift_left_with_register() {
|
|
||||||
let mut cpu = create_test_processor();
|
|
||||||
*cpu.reg(Register::Rg1) = 0b1010;
|
|
||||||
*cpu.reg(Register::Rg2) = 3;
|
|
||||||
|
|
||||||
let shl_instr = Instruction::ShiftLeft(RTypeArgs::new(
|
|
||||||
Some(Register::Rg1),
|
|
||||||
Some(Register::Rg2),
|
|
||||||
None,
|
|
||||||
None,
|
|
||||||
));
|
|
||||||
|
|
||||||
shl_instr.execute(&mut cpu).expect(
|
|
||||||
"Emulator was slain by losing the game while attempting to execute instruction",
|
|
||||||
);
|
);
|
||||||
assert_eq!(cpu.get(Register::Rg1), 0b101_0000);
|
|
||||||
}
|
}
|
||||||
|
|
||||||
|
// #[test]
|
||||||
|
// fn test_shift_left_with_register() {
|
||||||
|
// let mut cpu = create_test_processor();
|
||||||
|
// *cpu.reg(Register::Rg1).expect("Failed to get register Rg1") = 0b1010;
|
||||||
|
|
||||||
|
// let shl_instr =
|
||||||
|
// Instruction::ShiftLeft(RTypeArgs::new(Some(Register::Rg1), None, None,
|
||||||
|
// Some(3)));
|
||||||
|
|
||||||
|
// shl_instr.execute(&mut cpu).expect(
|
||||||
|
// "Emulator was slain by losing the game while attempting to execute
|
||||||
|
// instruction", );
|
||||||
|
// assert_eq!(
|
||||||
|
// cpu.get(Register::Rg1).expect("Failed to get register Rg1"),
|
||||||
|
// 0b101_0000
|
||||||
|
// );
|
||||||
|
// }
|
||||||
|
|
||||||
#[test]
|
#[test]
|
||||||
fn test_load_lower_immediate() {
|
fn test_load_lower_immediate() {
|
||||||
let mut cpu = create_test_processor();
|
let mut cpu = create_test_processor();
|
||||||
@@ -460,13 +529,16 @@ fn test_load_lower_immediate() {
|
|||||||
lli_instr.execute(&mut cpu).expect(
|
lli_instr.execute(&mut cpu).expect(
|
||||||
"Emulator was slain by losing the game while attempting to execute instruction",
|
"Emulator was slain by losing the game while attempting to execute instruction",
|
||||||
);
|
);
|
||||||
assert_eq!(cpu.get(Register::Rg1), 0x0000_1234);
|
assert_eq!(
|
||||||
|
cpu.get(Register::Rg1).expect("Failed to get register Rg1"),
|
||||||
|
0x0000_1234
|
||||||
|
);
|
||||||
}
|
}
|
||||||
|
|
||||||
#[test]
|
#[test]
|
||||||
fn test_load_upper_immediate() {
|
fn test_load_upper_immediate() {
|
||||||
let mut cpu = create_test_processor();
|
let mut cpu = create_test_processor();
|
||||||
*cpu.reg(Register::Rg1) = 0x0000_5678;
|
*cpu.reg(Register::Rg1).expect("Failed to get register Rg1") = 0x0000_5678;
|
||||||
|
|
||||||
let lui_instr = Instruction::LoadUpperImmediate(ITypeArgs::new(
|
let lui_instr = Instruction::LoadUpperImmediate(ITypeArgs::new(
|
||||||
0x1234,
|
0x1234,
|
||||||
@@ -477,29 +549,38 @@ fn test_load_upper_immediate() {
|
|||||||
lui_instr.execute(&mut cpu).expect(
|
lui_instr.execute(&mut cpu).expect(
|
||||||
"Emulator was slain by losing the game while attempting to execute instruction",
|
"Emulator was slain by losing the game while attempting to execute instruction",
|
||||||
);
|
);
|
||||||
assert_eq!(cpu.get(Register::Rg1), 0x1234_5678);
|
assert_eq!(
|
||||||
|
cpu.get(Register::Rg1).expect("Failed to get register Rg1"),
|
||||||
|
0x1234_5678
|
||||||
|
);
|
||||||
}
|
}
|
||||||
|
|
||||||
#[test]
|
#[test]
|
||||||
fn test_jump_unconditional() {
|
fn test_jump_unconditional() {
|
||||||
let mut cpu = create_test_processor();
|
let mut cpu = create_test_processor();
|
||||||
*cpu.reg(Register::Rg1) = 0x1000;
|
*cpu.reg(Register::Rg1).expect("Failed to get register Rg1") = 0x1000;
|
||||||
let initial_pc = cpu.get(Register::Pcx);
|
let initial_pc = cpu.get(Register::Pcx).expect("Failed to get register Pcx");
|
||||||
|
|
||||||
let jump_instr = Instruction::Jump(ITypeArgs::new(0x100, Some(Register::Rg1), None));
|
let jump_instr = Instruction::Jump(ITypeArgs::new(0x100, Some(Register::Rg1), None));
|
||||||
|
|
||||||
jump_instr.execute(&mut cpu).expect(
|
jump_instr.execute(&mut cpu).expect(
|
||||||
"Emulator was slain by losing the game while attempting to execute instruction",
|
"Emulator was slain by losing the game while attempting to execute instruction",
|
||||||
);
|
);
|
||||||
assert_eq!(cpu.get(Register::Pcx), 0x1100);
|
assert_eq!(
|
||||||
assert_ne!(cpu.get(Register::Pcx), initial_pc);
|
cpu.get(Register::Pcx).expect("Failed to get register Pcx"),
|
||||||
|
0x1100
|
||||||
|
);
|
||||||
|
assert_ne!(
|
||||||
|
cpu.get(Register::Pcx).expect("Failed to get register Pcx"),
|
||||||
|
initial_pc
|
||||||
|
);
|
||||||
}
|
}
|
||||||
|
|
||||||
#[test]
|
#[test]
|
||||||
fn test_jump_equal_when_flag_set() {
|
fn test_jump_equal_when_flag_set() {
|
||||||
let mut cpu = create_test_processor();
|
let mut cpu = create_test_processor();
|
||||||
cpu.set_flag(Flag::Equal, true);
|
cpu.set_flag(Flag::Equal, true);
|
||||||
*cpu.reg(Register::Rg1) = 0x1000;
|
*cpu.reg(Register::Rg1).expect("Failed to get register Rg1") = 0x1000;
|
||||||
|
|
||||||
let jump_eq_instr =
|
let jump_eq_instr =
|
||||||
Instruction::JumpEq(ITypeArgs::new(0x100, Some(Register::Rg1), None));
|
Instruction::JumpEq(ITypeArgs::new(0x100, Some(Register::Rg1), None));
|
||||||
@@ -507,15 +588,18 @@ fn test_jump_equal_when_flag_set() {
|
|||||||
jump_eq_instr.execute(&mut cpu).expect(
|
jump_eq_instr.execute(&mut cpu).expect(
|
||||||
"Emulator was slain by losing the game while attempting to execute instruction",
|
"Emulator was slain by losing the game while attempting to execute instruction",
|
||||||
);
|
);
|
||||||
assert_eq!(cpu.get(Register::Pcx), 0x1100);
|
assert_eq!(
|
||||||
|
cpu.get(Register::Pcx).expect("Failed to get register Pcx"),
|
||||||
|
0x1100
|
||||||
|
);
|
||||||
}
|
}
|
||||||
|
|
||||||
#[test]
|
#[test]
|
||||||
fn test_jump_equal_when_flag_not_set() {
|
fn test_jump_equal_when_flag_not_set() {
|
||||||
let mut cpu = create_test_processor();
|
let mut cpu = create_test_processor();
|
||||||
cpu.set_flag(Flag::Equal, false);
|
cpu.set_flag(Flag::Equal, false);
|
||||||
*cpu.reg(Register::Rg1) = 0x1000;
|
*cpu.reg(Register::Rg1).expect("Failed to get register Rg1") = 0x1000;
|
||||||
let initial_pc = cpu.get(Register::Pcx);
|
let initial_pc = cpu.get(Register::Pcx).expect("Failed to get register Pcx");
|
||||||
|
|
||||||
let jump_eq_instr =
|
let jump_eq_instr =
|
||||||
Instruction::JumpEq(ITypeArgs::new(0x100, Some(Register::Rg1), None));
|
Instruction::JumpEq(ITypeArgs::new(0x100, Some(Register::Rg1), None));
|
||||||
@@ -523,7 +607,10 @@ fn test_jump_equal_when_flag_not_set() {
|
|||||||
jump_eq_instr.execute(&mut cpu).expect(
|
jump_eq_instr.execute(&mut cpu).expect(
|
||||||
"Emulator was slain by losing the game while attempting to execute instruction",
|
"Emulator was slain by losing the game while attempting to execute instruction",
|
||||||
);
|
);
|
||||||
assert_eq!(cpu.get(Register::Pcx), initial_pc);
|
assert_eq!(
|
||||||
|
cpu.get(Register::Pcx).expect("Failed to get register Pcx"),
|
||||||
|
initial_pc
|
||||||
|
);
|
||||||
}
|
}
|
||||||
|
|
||||||
#[test]
|
#[test]
|
||||||
@@ -540,8 +627,8 @@ fn test_halt_instruction() {
|
|||||||
#[test]
|
#[test]
|
||||||
fn test_nand_instruction() {
|
fn test_nand_instruction() {
|
||||||
let mut cpu = create_test_processor();
|
let mut cpu = create_test_processor();
|
||||||
*cpu.reg(Register::Rg1) = 0b1100;
|
*cpu.reg(Register::Rg1).expect("Failed to get register Rg1") = 0b1100;
|
||||||
*cpu.reg(Register::Rg2) = 0b1010;
|
*cpu.reg(Register::Rg2).expect("Failed to get register Rg2") = 0b1010;
|
||||||
|
|
||||||
let nand_instr = Instruction::Nand(RTypeArgs::new(
|
let nand_instr = Instruction::Nand(RTypeArgs::new(
|
||||||
Some(Register::Rg1),
|
Some(Register::Rg1),
|
||||||
@@ -553,14 +640,17 @@ fn test_nand_instruction() {
|
|||||||
nand_instr.execute(&mut cpu).expect(
|
nand_instr.execute(&mut cpu).expect(
|
||||||
"Emulator was slain by losing the game while attempting to execute instruction",
|
"Emulator was slain by losing the game while attempting to execute instruction",
|
||||||
);
|
);
|
||||||
assert_eq!(cpu.get(Register::Rg3), !0b1000);
|
assert_eq!(
|
||||||
|
cpu.get(Register::Rg3).expect("Failed to get register Rg3"),
|
||||||
|
!0b1000
|
||||||
|
);
|
||||||
}
|
}
|
||||||
|
|
||||||
#[test]
|
#[test]
|
||||||
fn test_nor_instruction() {
|
fn test_nor_instruction() {
|
||||||
let mut cpu = create_test_processor();
|
let mut cpu = create_test_processor();
|
||||||
*cpu.reg(Register::Rg1) = 0b1100;
|
*cpu.reg(Register::Rg1).expect("Failed to get register Rg1") = 0b1100;
|
||||||
*cpu.reg(Register::Rg2) = 0b1010;
|
*cpu.reg(Register::Rg2).expect("Failed to get register Rg2") = 0b1010;
|
||||||
|
|
||||||
let nor_instr = Instruction::Nor(RTypeArgs::new(
|
let nor_instr = Instruction::Nor(RTypeArgs::new(
|
||||||
Some(Register::Rg1),
|
Some(Register::Rg1),
|
||||||
@@ -572,14 +662,17 @@ fn test_nor_instruction() {
|
|||||||
nor_instr.execute(&mut cpu).expect(
|
nor_instr.execute(&mut cpu).expect(
|
||||||
"Emulator was slain by losing the game while attempting to execute instruction",
|
"Emulator was slain by losing the game while attempting to execute instruction",
|
||||||
);
|
);
|
||||||
assert_eq!(cpu.get(Register::Rg3), !0b1110);
|
assert_eq!(
|
||||||
|
cpu.get(Register::Rg3).expect("Failed to get register Rg3"),
|
||||||
|
!0b1110
|
||||||
|
);
|
||||||
}
|
}
|
||||||
|
|
||||||
#[test]
|
#[test]
|
||||||
fn test_xnor_instruction() {
|
fn test_xnor_instruction() {
|
||||||
let mut cpu = create_test_processor();
|
let mut cpu = create_test_processor();
|
||||||
*cpu.reg(Register::Rg1) = 0b1100;
|
*cpu.reg(Register::Rg1).expect("Failed to get register Rg1") = 0b1100;
|
||||||
*cpu.reg(Register::Rg2) = 0b1010;
|
*cpu.reg(Register::Rg2).expect("Failed to get register Rg2") = 0b1010;
|
||||||
|
|
||||||
let xnor_instr = Instruction::Xnor(RTypeArgs::new(
|
let xnor_instr = Instruction::Xnor(RTypeArgs::new(
|
||||||
Some(Register::Rg1),
|
Some(Register::Rg1),
|
||||||
@@ -591,5 +684,8 @@ fn test_xnor_instruction() {
|
|||||||
xnor_instr.execute(&mut cpu).expect(
|
xnor_instr.execute(&mut cpu).expect(
|
||||||
"Emulator was slain by losing the game while attempting to execute instruction",
|
"Emulator was slain by losing the game while attempting to execute instruction",
|
||||||
);
|
);
|
||||||
assert_eq!(cpu.get(Register::Rg3), !0b0110);
|
assert_eq!(
|
||||||
|
cpu.get(Register::Rg3).expect("Failed to get register Rg3"),
|
||||||
|
!0b0110
|
||||||
|
);
|
||||||
}
|
}
|
||||||
|
|||||||
@@ -133,17 +133,25 @@ impl Component for ControlPanel {
|
|||||||
}
|
}
|
||||||
));
|
));
|
||||||
|
|
||||||
let pcx = state.reg_file.get(Register::Pcx);
|
let pcx = state
|
||||||
|
.reg_file
|
||||||
|
.get(Register::Pcx)
|
||||||
|
.expect("PCX should never be invalid");
|
||||||
let instructions = state.instructions;
|
let instructions = state.instructions;
|
||||||
|
|
||||||
ui.label(format!("Instructions: {instructions}"));
|
ui.label(format!("Instructions: {instructions}"));
|
||||||
ui.label(format!("PC: 0x{pcx:08X}"));
|
ui.label(format!("PC: 0x{pcx:08X}"));
|
||||||
|
|
||||||
let instruction = Instruction::decode(state.reg_file.get(Register::Cir))
|
let instruction = Instruction::decode(
|
||||||
.map_or_else(
|
state
|
||||||
|_| "Invalid Instruction".to_string(),
|
.reg_file
|
||||||
|instruction| instruction.to_string(),
|
.get(Register::Cir)
|
||||||
);
|
.expect("CIR should never be invalid"),
|
||||||
|
)
|
||||||
|
.map_or_else(
|
||||||
|
|_| "Invalid Instruction".to_string(),
|
||||||
|
|instruction| instruction.to_string(),
|
||||||
|
);
|
||||||
|
|
||||||
ui.label(format!("Instruction: {instruction}"));
|
ui.label(format!("Instruction: {instruction}"));
|
||||||
});
|
});
|
||||||
|
|||||||
@@ -5,7 +5,6 @@ use std::{
|
|||||||
path::{Path, PathBuf},
|
path::{Path, PathBuf},
|
||||||
};
|
};
|
||||||
|
|
||||||
use assembler::compiler_engine::CompilerEngine;
|
|
||||||
use common::prelude::Instruction;
|
use common::prelude::Instruction;
|
||||||
use egui::{Align, Context, Key, Layout, Ui};
|
use egui::{Align, Context, Key, Layout, Ui};
|
||||||
|
|
||||||
@@ -17,7 +16,7 @@ use crate::emulator::{
|
|||||||
ui::interface::Component,
|
ui::interface::Component,
|
||||||
};
|
};
|
||||||
|
|
||||||
// use assembler::prelude::*;
|
use assembler::prelude::*;
|
||||||
|
|
||||||
#[derive(Default)]
|
#[derive(Default)]
|
||||||
pub struct Editor {
|
pub struct Editor {
|
||||||
|
|||||||
@@ -61,7 +61,7 @@ impl Component for StackInspector {
|
|||||||
ui.label(format!(
|
ui.label(format!(
|
||||||
"{} [{}]",
|
"{} [{}]",
|
||||||
i,
|
i,
|
||||||
state.reg_file.get(Register::Spr) - i as u32 * 4
|
state.reg_file.get(Register::Spr).expect("SPR should never be invalid") - i as u32 * 4
|
||||||
));
|
));
|
||||||
ui.label(format!("0x{value:08X} ({value})"));
|
ui.label(format!("0x{value:08X} ({value})"));
|
||||||
ui.end_row();
|
ui.end_row();
|
||||||
|
|||||||
@@ -1,279 +0,0 @@
|
|||||||
|
|
||||||
|
|
||||||
```rust
|
|
||||||
// src/assembler/source.rs
|
|
||||||
#[derive(Debug, Clone, Copy, PartialEq, Eq)]
|
|
||||||
pub struct SourcePosition {
|
|
||||||
pub line: u32,
|
|
||||||
pub column: u32,
|
|
||||||
pub offset: usize,
|
|
||||||
}
|
|
||||||
|
|
||||||
#[derive(Debug, Clone, PartialEq, Eq)]
|
|
||||||
pub struct SourceSpan {
|
|
||||||
pub start: SourcePosition,
|
|
||||||
pub end: SourcePosition,
|
|
||||||
pub file_id: u64, // Hash of the file path
|
|
||||||
}
|
|
||||||
|
|
||||||
impl SourceSpan {
|
|
||||||
pub fn new(start: SourcePosition, end: SourcePosition, file_id: u64) -> Self {
|
|
||||||
Self { start, end, file_id }
|
|
||||||
}
|
|
||||||
|
|
||||||
pub fn single_char(pos: SourcePosition, file_id: u64) -> Self {
|
|
||||||
Self {
|
|
||||||
start: pos,
|
|
||||||
end: pos,
|
|
||||||
file_id,
|
|
||||||
}
|
|
||||||
}
|
|
||||||
}
|
|
||||||
2. Enhanced Token with Source Information
|
|
||||||
Update the Token type to include source positions:
|
|
||||||
|
|
||||||
```rust
|
|
||||||
// src/assembler/model.rs
|
|
||||||
pub struct Token {
|
|
||||||
pub kind: TokenKind,
|
|
||||||
pub span: SourceSpan,
|
|
||||||
pub raw: String, // Original source text
|
|
||||||
}
|
|
||||||
|
|
||||||
pub enum TokenKind {
|
|
||||||
// ... existing variants ...
|
|
||||||
}
|
|
||||||
3. Enhanced CodeModule Structure
|
|
||||||
Enhance the
|
|
||||||
CodeModule
|
|
||||||
struct to track source information:
|
|
||||||
|
|
||||||
```rust
|
|
||||||
// src/assembler/mod.rs
|
|
||||||
pub struct CodeModule {
|
|
||||||
pub path: PathBuf,
|
|
||||||
pub hash: u64,
|
|
||||||
pub source: String,
|
|
||||||
pub lines: Vec<usize>, // Line start offsets for quick lookup
|
|
||||||
pub tokens: Vec<Token>,
|
|
||||||
pub nodes: Vec<Node>,
|
|
||||||
pub dependencies: Vec<CodeModule>,
|
|
||||||
}
|
|
||||||
|
|
||||||
impl CodeModule {
|
|
||||||
pub fn new(path: PathBuf, source: String) -> Self {
|
|
||||||
let hash = quick_hash(&path);
|
|
||||||
let lines = source.lines()
|
|
||||||
.scan(0, |offset, line| {
|
|
||||||
let start = *offset;
|
|
||||||
*offset += line.len() + 1; // +1 for newline
|
|
||||||
Some(start)
|
|
||||||
})
|
|
||||||
.collect();
|
|
||||||
|
|
||||||
Self {
|
|
||||||
path,
|
|
||||||
hash,
|
|
||||||
source,
|
|
||||||
lines,
|
|
||||||
tokens: Vec::new(),
|
|
||||||
nodes: Vec::new(),
|
|
||||||
dependencies: Vec::new(),
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
pub fn position_from_offset(&self, offset: usize) -> (u32, u32) {
|
|
||||||
match self.lines.binary_search(&offset) {
|
|
||||||
Ok(line) => (line as u32 + 1, 1),
|
|
||||||
Err(0) => (1, offset as u32 + 1),
|
|
||||||
Err(line) => {
|
|
||||||
let line_start = self.lines[line - 1];
|
|
||||||
(line as u32, (offset - line_start + 1) as u32)
|
|
||||||
}
|
|
||||||
}
|
|
||||||
}
|
|
||||||
}
|
|
||||||
4. Enhanced Lexer with Source Positions
|
|
||||||
Update the lexer to track source positions:
|
|
||||||
|
|
||||||
```rust
|
|
||||||
// src/assembler/lexer.rs
|
|
||||||
pub fn lex(module: &mut CodeModule) -> Result<(), AssembleError> {
|
|
||||||
let source = &module.source;
|
|
||||||
let mut tokens = Vec::new();
|
|
||||||
let mut pos = 0;
|
|
||||||
let mut line_start = 0;
|
|
||||||
let mut line = 1;
|
|
||||||
|
|
||||||
while pos < source.len() {
|
|
||||||
let c = source[pos..].chars().next().unwrap();
|
|
||||||
|
|
||||||
if c == '\n' {
|
|
||||||
line += 1;
|
|
||||||
line_start = pos + 1;
|
|
||||||
pos += 1;
|
|
||||||
continue;
|
|
||||||
}
|
|
||||||
|
|
||||||
if c.is_whitespace() {
|
|
||||||
pos += 1;
|
|
||||||
continue;
|
|
||||||
}
|
|
||||||
|
|
||||||
let token_start = pos;
|
|
||||||
// ... existing token parsing logic ...
|
|
||||||
|
|
||||||
// When creating a token:
|
|
||||||
let start_pos = SourcePosition {
|
|
||||||
line,
|
|
||||||
column: (token_start - line_start + 1) as u32,
|
|
||||||
offset: token_start,
|
|
||||||
};
|
|
||||||
|
|
||||||
// Update pos based on token length
|
|
||||||
let token_length = /* calculate token length */;
|
|
||||||
pos += token_length;
|
|
||||||
|
|
||||||
let end_pos = SourcePosition {
|
|
||||||
line,
|
|
||||||
column: (pos - line_start + 1) as u32,
|
|
||||||
offset: pos,
|
|
||||||
};
|
|
||||||
|
|
||||||
tokens.push(Token {
|
|
||||||
kind: token_kind,
|
|
||||||
span: SourceSpan::new(start_pos, end_pos, module.hash),
|
|
||||||
raw: source[token_start..pos].to_string(),
|
|
||||||
});
|
|
||||||
}
|
|
||||||
|
|
||||||
module.tokens = tokens;
|
|
||||||
Ok(())
|
|
||||||
}
|
|
||||||
5. Enhanced Error Reporting
|
|
||||||
Create a structured error type with source context:
|
|
||||||
|
|
||||||
```rust
|
|
||||||
// src/assembler/error.rs
|
|
||||||
#[derive(Debug)]
|
|
||||||
pub struct AssemblerError {
|
|
||||||
pub kind: ErrorKind,
|
|
||||||
pub span: SourceSpan,
|
|
||||||
pub message: String,
|
|
||||||
pub context: Vec<String>,
|
|
||||||
}
|
|
||||||
|
|
||||||
impl AssemblerError {
|
|
||||||
pub fn new(kind: ErrorKind, span: SourceSpan, message: impl Into<String>) -> Self {
|
|
||||||
Self {
|
|
||||||
kind,
|
|
||||||
span,
|
|
||||||
message: message.into(),
|
|
||||||
context: Vec::new(),
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
pub fn with_context(mut self, context: impl Into<String>) -> Self {
|
|
||||||
self.context.push(context.into());
|
|
||||||
self
|
|
||||||
}
|
|
||||||
|
|
||||||
pub fn format(&self, module: &CodeModule) -> String {
|
|
||||||
let (line, col) = module.position_from_offset(self.span.start.offset);
|
|
||||||
let line_content = module.source.lines().nth(line as usize - 1).unwrap_or("");
|
|
||||||
|
|
||||||
let mut output = format!(
|
|
||||||
"{}:{}:{}: {}\n",
|
|
||||||
module.path.display(),
|
|
||||||
line,
|
|
||||||
col,
|
|
||||||
self.message
|
|
||||||
);
|
|
||||||
|
|
||||||
// Add source line with caret
|
|
||||||
output.push_str(&format!("{}\n", line_content));
|
|
||||||
output.push_str(&" ".repeat(col as usize - 1));
|
|
||||||
output.push_str("^\n");
|
|
||||||
|
|
||||||
// Add context if any
|
|
||||||
for ctx in &self.context {
|
|
||||||
output.push_str(&format!(" = note: {}\n", ctx));
|
|
||||||
}
|
|
||||||
|
|
||||||
output
|
|
||||||
}
|
|
||||||
}
|
|
||||||
6. Integration with Compilation Pipeline
|
|
||||||
Update the compilation pipeline to use the enhanced types:
|
|
||||||
|
|
||||||
```rust
|
|
||||||
// src/assembler/mod.rs
|
|
||||||
pub fn assemble(src: &Path) -> Result<Vec<Instruction>, AssemblerError> {
|
|
||||||
let source = std::fs::read_to_string(src)
|
|
||||||
.map_err(|e| AssemblerError::io_error(src, e))?;
|
|
||||||
|
|
||||||
let mut module = CodeModule::new(src.to_path_buf(), source);
|
|
||||||
|
|
||||||
// Lexing
|
|
||||||
lexer::lex(&mut module)?;
|
|
||||||
|
|
||||||
// Parsing
|
|
||||||
parser::parse(&mut module)?;
|
|
||||||
|
|
||||||
// Resolution
|
|
||||||
resolver::resolve(&mut module)?;
|
|
||||||
|
|
||||||
// Code generation
|
|
||||||
codegen::generate(&module)
|
|
||||||
}
|
|
||||||
7. Logging Integration
|
|
||||||
Enhance the logging system to include source context:
|
|
||||||
|
|
||||||
```rust
|
|
||||||
// src/util/logging.rs
|
|
||||||
pub trait Loggable {
|
|
||||||
fn log(&self, level: LogLevel, message: impl std::fmt::Display);
|
|
||||||
fn log_with_span(&self, level: LogLevel, span: &SourceSpan, message: impl std::fmt::Display);
|
|
||||||
}
|
|
||||||
|
|
||||||
impl Loggable for CodeModule {
|
|
||||||
fn log_with_span(&self, level: LogLevel, span: &SourceSpan, message: impl std::fmt::Display) {
|
|
||||||
if span.file_id != self.hash {
|
|
||||||
if let Some(dep) = self.find_dependency(span.file_id) {
|
|
||||||
return dep.log_with_span(level, span, message);
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
let (line, col) = self.position_from_offset(span.start.offset);
|
|
||||||
let line_content = self.source.lines().nth(line as usize - 1).unwrap_or("");
|
|
||||||
|
|
||||||
log::log!(
|
|
||||||
level,
|
|
||||||
"{}:{}:{}: {}\n {}\n {}{}",
|
|
||||||
self.path.display(),
|
|
||||||
line,
|
|
||||||
col,
|
|
||||||
message,
|
|
||||||
line_content,
|
|
||||||
" ".repeat(col as usize - 1),
|
|
||||||
"^"
|
|
||||||
);
|
|
||||||
}
|
|
||||||
}
|
|
||||||
8. Usage Example
|
|
||||||
Here's how you'd use this in practice:
|
|
||||||
|
|
||||||
```rust
|
|
||||||
// In your parser or code that needs to report errors
|
|
||||||
fn parse_token(&mut self, module: &CodeModule) -> Result<Token, AssemblerError> {
|
|
||||||
// ...
|
|
||||||
if !is_valid_token(&token) {
|
|
||||||
return Err(AssemblerError::new(
|
|
||||||
ErrorKind::SyntaxError,
|
|
||||||
token.span,
|
|
||||||
"Invalid token"
|
|
||||||
).with_context("Expected a valid instruction or directive"));
|
|
||||||
}
|
|
||||||
// ...
|
|
||||||
}
|
|
||||||
```
|
|
||||||
@@ -2,10 +2,10 @@
|
|||||||
// a simple brainf##k interpreter,
|
// a simple brainf##k interpreter,
|
||||||
// because I already wrote a compiler lol.
|
// because I already wrote a compiler lol.
|
||||||
|
|
||||||
include print "./lib/print.dsa"
|
include print "./lib/io/print.dsa"
|
||||||
|
|
||||||
// "print hello world"
|
// "print hello world"
|
||||||
db program "++++++++++++++++++++++++++++++++++++++++++++
|
db program: "++++++++++++++++++++++++++++++++++++++++++++
|
||||||
>++++++++++++++++++++++++++++++++
|
>++++++++++++++++++++++++++++++++
|
||||||
>++++++++++++++++
|
>++++++++++++++++
|
||||||
>
|
>
|
||||||
@@ -35,10 +35,10 @@ db program "++++++++++++++++++++++++++++++++++++++++++++
|
|||||||
]
|
]
|
||||||
<<++..."
|
<<++..."
|
||||||
|
|
||||||
db error "Invalid Instruction!"
|
db error: "Invalid Instruction!"
|
||||||
dw stack 0x10000
|
dw stack: 0x10000
|
||||||
dw input 0x30000
|
dw input: 0x30000
|
||||||
resb data 1024
|
resb data: 1024
|
||||||
|
|
||||||
// set up a stack so we can call functions
|
// set up a stack so we can call functions
|
||||||
_init_stack:
|
_init_stack:
|
||||||
|
|||||||
@@ -0,0 +1,34 @@
|
|||||||
|
include print "../io/print.dsa"
|
||||||
|
|
||||||
|
dw idt: 0xFFFF0000
|
||||||
|
|
||||||
|
setup_idt:
|
||||||
|
push bpr
|
||||||
|
mov spr, bpr
|
||||||
|
|
||||||
|
// load the IDT into the IDR
|
||||||
|
ldw idt, idr
|
||||||
|
|
||||||
|
mov bpr, spr
|
||||||
|
pop bpr
|
||||||
|
irt
|
||||||
|
|
||||||
|
setup_hard_fault_handler:
|
||||||
|
push bpr
|
||||||
|
mov spr, bpr
|
||||||
|
|
||||||
|
lwi handle_hard_fault, rg0
|
||||||
|
stw rg0, idr, 4
|
||||||
|
|
||||||
|
mov bpr, spr
|
||||||
|
pop bpr
|
||||||
|
irt
|
||||||
|
|
||||||
|
dw hard_fault_err: "FATAL: Illegal Instruction or Memory Access!"
|
||||||
|
handle_hard_fault:
|
||||||
|
call print::reset
|
||||||
|
lwi hard_fault_err, rg0
|
||||||
|
push rg0
|
||||||
|
call print::print
|
||||||
|
pop zero
|
||||||
|
hlt
|
||||||
@@ -1,18 +0,0 @@
|
|||||||
fib_n:
|
|
||||||
pop ret
|
|
||||||
pop rg0 // n
|
|
||||||
|
|
||||||
lli 0, rg1
|
|
||||||
lli 1, rg2
|
|
||||||
|
|
||||||
start:
|
|
||||||
add rg1, rg2, acc
|
|
||||||
push rg1
|
|
||||||
mov rg2, rg1
|
|
||||||
mov acc, rg2
|
|
||||||
|
|
||||||
cmp rg0, zero
|
|
||||||
dec rg0
|
|
||||||
|
|
||||||
jgt start
|
|
||||||
jmp 4, ret
|
|
||||||
@@ -0,0 +1,244 @@
|
|||||||
|
// lib:
|
||||||
|
// print.dsa
|
||||||
|
|
||||||
|
// usage:
|
||||||
|
//
|
||||||
|
// include print "<relative path>""
|
||||||
|
//
|
||||||
|
// usage for print:
|
||||||
|
// push (register containing address of string)
|
||||||
|
// push pcx
|
||||||
|
// jmp print::print
|
||||||
|
//
|
||||||
|
// usage for reset:
|
||||||
|
// push pcx
|
||||||
|
// jmp print::reset
|
||||||
|
//
|
||||||
|
// usage for clear:
|
||||||
|
// push pcx
|
||||||
|
// jmp print::clear
|
||||||
|
//
|
||||||
|
// usage for print_byte:
|
||||||
|
// push (register containing byte)
|
||||||
|
// push pcx
|
||||||
|
// jmp print::print_byte
|
||||||
|
//
|
||||||
|
// usage for print_word:
|
||||||
|
// push (register containing word)
|
||||||
|
// push pcx
|
||||||
|
// jmp print::print_word
|
||||||
|
//
|
||||||
|
|
||||||
|
include maths "../maths/core.dsa"
|
||||||
|
|
||||||
|
dw display: 0x20000
|
||||||
|
dw current: 0x20000
|
||||||
|
|
||||||
|
// ------------------------------------------
|
||||||
|
// prints the string at addr(arg[0]) to the screen.
|
||||||
|
print:
|
||||||
|
push bpr
|
||||||
|
mov spr, bpr
|
||||||
|
|
||||||
|
ldw bpr, rg0, 8
|
||||||
|
ldw current, rg1
|
||||||
|
|
||||||
|
_print_loop:
|
||||||
|
ldb rg0, acc
|
||||||
|
stb acc, rg1
|
||||||
|
|
||||||
|
addi rg0, 1
|
||||||
|
addi rg1, 1
|
||||||
|
|
||||||
|
cmp acc, zero
|
||||||
|
jne _print_loop
|
||||||
|
jmp _end
|
||||||
|
|
||||||
|
// ------------------------------------------
|
||||||
|
// prints the value of arg[0] to the screen.
|
||||||
|
print_word:
|
||||||
|
// initialise
|
||||||
|
push bpr
|
||||||
|
mov spr, bpr
|
||||||
|
|
||||||
|
// load byte into acc
|
||||||
|
ldw bpr, rg0, 8
|
||||||
|
ldw current, rg1
|
||||||
|
|
||||||
|
addi rg1, 3
|
||||||
|
|
||||||
|
stb rg0, rg1
|
||||||
|
subi rg1, 1
|
||||||
|
shr rg0, 8
|
||||||
|
stb rg0, rg1
|
||||||
|
subi rg1, 1
|
||||||
|
shr rg0, 8
|
||||||
|
stb rg0, rg1
|
||||||
|
subi rg1, 1
|
||||||
|
shr rg0, 8
|
||||||
|
stb rg0, rg1
|
||||||
|
|
||||||
|
addi rg1, 4
|
||||||
|
jmp _end
|
||||||
|
|
||||||
|
// ------------------------------------------
|
||||||
|
// prints the last byte of arg[0] to the screen.
|
||||||
|
print_byte:
|
||||||
|
push bpr
|
||||||
|
mov spr, bpr
|
||||||
|
|
||||||
|
ldw bpr, rg0, 8
|
||||||
|
ldw current, rg1
|
||||||
|
|
||||||
|
stb rg0, rg1
|
||||||
|
addi rg1, 1
|
||||||
|
jmp _end
|
||||||
|
|
||||||
|
// ------------------------------------------
|
||||||
|
// prints the value of arg[0] to the screen in hex.
|
||||||
|
print_hex_word:
|
||||||
|
push bpr
|
||||||
|
mov spr, bpr
|
||||||
|
|
||||||
|
ldw current, rg1
|
||||||
|
|
||||||
|
ldb bpr, rg0, 8
|
||||||
|
push rg0
|
||||||
|
call _print_hex_byte
|
||||||
|
addi spr, 4
|
||||||
|
|
||||||
|
ldb bpr, rg0, 9
|
||||||
|
push rg0
|
||||||
|
call _print_hex_byte
|
||||||
|
addi spr, 4
|
||||||
|
|
||||||
|
ldb bpr, rg0, 10
|
||||||
|
push rg0
|
||||||
|
call _print_hex_byte
|
||||||
|
addi spr, 4
|
||||||
|
|
||||||
|
ldb bpr, rg0, 11
|
||||||
|
push rg0
|
||||||
|
call _print_hex_byte
|
||||||
|
addi spr, 4
|
||||||
|
|
||||||
|
jmp _end
|
||||||
|
|
||||||
|
// ------------------------------------------
|
||||||
|
// prints the last byte of arg[0] to the screen in hex.
|
||||||
|
print_hex_byte:
|
||||||
|
push bpr
|
||||||
|
mov spr, bpr
|
||||||
|
|
||||||
|
ldw bpr, rg0, 8
|
||||||
|
ldw current, rg1
|
||||||
|
|
||||||
|
call _print_hex_byte
|
||||||
|
jmp _end
|
||||||
|
|
||||||
|
// function body
|
||||||
|
_print_hex_byte:
|
||||||
|
// mask to get lower nibble
|
||||||
|
lli 0xF, rg2
|
||||||
|
// save rg0 state
|
||||||
|
push rg0
|
||||||
|
|
||||||
|
shr rg0, 4
|
||||||
|
and rg0, rg2, rg0
|
||||||
|
call _print_hex_nibble
|
||||||
|
pop rg0
|
||||||
|
|
||||||
|
and rg0, rg2, rg0
|
||||||
|
call _print_hex_nibble
|
||||||
|
return
|
||||||
|
|
||||||
|
// print a hex digit
|
||||||
|
_print_hex_nibble:
|
||||||
|
lli 10, rg3
|
||||||
|
cmp rg0, rg3
|
||||||
|
jlt _print_hex_nibble_number
|
||||||
|
addi rg0, 0x37, rg0
|
||||||
|
stb rg0, rg1
|
||||||
|
addi rg1, 1
|
||||||
|
return
|
||||||
|
|
||||||
|
// helper function.
|
||||||
|
_print_hex_nibble_number:
|
||||||
|
addi rg0, 0x30, rg0
|
||||||
|
stb rg0, rg1
|
||||||
|
addi rg1, 1
|
||||||
|
return
|
||||||
|
|
||||||
|
// ------------------------------------------
|
||||||
|
// print whitespace
|
||||||
|
print_whitespace:
|
||||||
|
push bpr
|
||||||
|
mov spr, bpr
|
||||||
|
|
||||||
|
ldw current, rg1
|
||||||
|
lli 0x20, rg0
|
||||||
|
stb rg0, rg1
|
||||||
|
addi rg1, 1
|
||||||
|
jmp _end
|
||||||
|
|
||||||
|
// ------------------------------------------
|
||||||
|
// print newline
|
||||||
|
print_newline:
|
||||||
|
push bpr
|
||||||
|
mov spr, bpr
|
||||||
|
|
||||||
|
// load variables into registers
|
||||||
|
ldw display, rg0
|
||||||
|
ldw current, rg1
|
||||||
|
|
||||||
|
// get the offset from the display base
|
||||||
|
sub rg1, rg0, rg0
|
||||||
|
|
||||||
|
lwi 80, rg2
|
||||||
|
pusha 3
|
||||||
|
push rg0
|
||||||
|
push rg2
|
||||||
|
call maths::divmod
|
||||||
|
pop zero // result
|
||||||
|
pop rg3 // remainder
|
||||||
|
popa 3
|
||||||
|
|
||||||
|
sub rg1, rg3, rg2
|
||||||
|
addi rg2, 80, rg1
|
||||||
|
|
||||||
|
// _end saves the display state
|
||||||
|
jmp _end
|
||||||
|
|
||||||
|
// ------------------------------------------
|
||||||
|
// resets the cursor position on the screen to 0x20000. (0,0)
|
||||||
|
reset:
|
||||||
|
push bpr
|
||||||
|
mov spr, bpr
|
||||||
|
ldw display, rg1
|
||||||
|
jmp _end
|
||||||
|
|
||||||
|
// ------------------------------------------
|
||||||
|
// clears the screen
|
||||||
|
clear:
|
||||||
|
push bpr
|
||||||
|
mov spr, bpr
|
||||||
|
// display size = 2000 bytes / 500 words
|
||||||
|
lli 500 rg0
|
||||||
|
ldw display, rg1
|
||||||
|
|
||||||
|
_clear_loop:
|
||||||
|
dec rg0
|
||||||
|
stw zero, rg1
|
||||||
|
addi rg1, 4
|
||||||
|
cmp rg0, zero
|
||||||
|
jgt _clear_loop
|
||||||
|
jmp _end
|
||||||
|
|
||||||
|
// ------------------------------------------
|
||||||
|
// return
|
||||||
|
_end:
|
||||||
|
stw rg1, current
|
||||||
|
|
||||||
|
mov bpr, spr
|
||||||
|
pop bpr
|
||||||
|
return
|
||||||
@@ -0,0 +1,60 @@
|
|||||||
|
// multiply.dsa
|
||||||
|
// usage:
|
||||||
|
//
|
||||||
|
// include multiply "<relative path>"
|
||||||
|
//
|
||||||
|
// usage for multiply:
|
||||||
|
// push (arg1)
|
||||||
|
// push (arg0)
|
||||||
|
// call multiply::multiply
|
||||||
|
// pop (arg0)
|
||||||
|
// pop (arg1)
|
||||||
|
|
||||||
|
multiply:
|
||||||
|
push bpr
|
||||||
|
mov spr, bpr
|
||||||
|
|
||||||
|
ldw bpr, rg0, 8 // load op 2
|
||||||
|
ldw bpr, rg1, 12 // load op 1
|
||||||
|
|
||||||
|
_multiply_loop:
|
||||||
|
add rg2, rg0, rg2
|
||||||
|
dec rg1
|
||||||
|
|
||||||
|
cmp rg1, zero
|
||||||
|
jgt _multiply_loop
|
||||||
|
|
||||||
|
_multiply_end:
|
||||||
|
stw rg2, bpr, 8
|
||||||
|
|
||||||
|
mov bpr, spr
|
||||||
|
pop bpr
|
||||||
|
return
|
||||||
|
|
||||||
|
divmod:
|
||||||
|
push bpr
|
||||||
|
mov spr, bpr
|
||||||
|
|
||||||
|
ldw bpr, rg1, 8 // load op 2
|
||||||
|
ldw bpr, rg0, 12 // load op 1
|
||||||
|
|
||||||
|
lli 0, rg3
|
||||||
|
|
||||||
|
_divmod_loop:
|
||||||
|
cmp rg0, rg1
|
||||||
|
jlt _divmod_end
|
||||||
|
|
||||||
|
sub rg0, rg1, rg0
|
||||||
|
inc rg3
|
||||||
|
|
||||||
|
jmp _divmod_loop
|
||||||
|
|
||||||
|
_divmod_end:
|
||||||
|
// store div in first arg
|
||||||
|
// store mod in second arg
|
||||||
|
stw rg3, bpr, 8
|
||||||
|
stw rg0, bpr, 12
|
||||||
|
|
||||||
|
mov bpr, spr
|
||||||
|
pop bpr
|
||||||
|
return
|
||||||
@@ -0,0 +1,31 @@
|
|||||||
|
include print "../io/print.dsa"
|
||||||
|
|
||||||
|
fib_n:
|
||||||
|
push bpr
|
||||||
|
mov spr, bpr
|
||||||
|
|
||||||
|
ldw bpr, rg0, 8 // load arg
|
||||||
|
mov rg1, rg2
|
||||||
|
lwi 1, rg1
|
||||||
|
|
||||||
|
start:
|
||||||
|
add rg1, rg2, rg3
|
||||||
|
|
||||||
|
pusha 4
|
||||||
|
push rg1
|
||||||
|
call print::print_hex_byte
|
||||||
|
call print::print_newline
|
||||||
|
pop zero
|
||||||
|
popa 4
|
||||||
|
|
||||||
|
mov rg2, rg1
|
||||||
|
mov rg3, rg2
|
||||||
|
|
||||||
|
dec rg0
|
||||||
|
cmp rg0, zero
|
||||||
|
jgt start
|
||||||
|
|
||||||
|
stw rg1, bpr, 8
|
||||||
|
mov bpr, spr
|
||||||
|
pop bpr
|
||||||
|
return
|
||||||
@@ -1,30 +0,0 @@
|
|||||||
// multiply.dsa
|
|
||||||
// usage:
|
|
||||||
//
|
|
||||||
// include multiply "<relative path>"
|
|
||||||
//
|
|
||||||
// usage for multiply:
|
|
||||||
// push (arg1)
|
|
||||||
// push (arg0)
|
|
||||||
// call multiply::multiply
|
|
||||||
// pop (arg0)
|
|
||||||
// pop (arg1)
|
|
||||||
|
|
||||||
multiply:
|
|
||||||
push bpr
|
|
||||||
mov spr, bpr
|
|
||||||
|
|
||||||
ldw bpr, rg0, 8 // load op 1
|
|
||||||
ldw bpr, rg1, 12 // load op 2
|
|
||||||
|
|
||||||
start:
|
|
||||||
add acc, rg0, acc
|
|
||||||
dec rg1
|
|
||||||
|
|
||||||
cmp rg1, zero
|
|
||||||
jgt start
|
|
||||||
|
|
||||||
end:
|
|
||||||
mov bpr, spr
|
|
||||||
pop bpr
|
|
||||||
return
|
|
||||||
@@ -1,115 +0,0 @@
|
|||||||
// lib:
|
|
||||||
// print.dsa
|
|
||||||
|
|
||||||
// usage:
|
|
||||||
//
|
|
||||||
// include print "<relative path>""
|
|
||||||
//
|
|
||||||
// usage for print:
|
|
||||||
// push (register containing address of string)
|
|
||||||
// push pcx
|
|
||||||
// jmp print::print
|
|
||||||
//
|
|
||||||
// usage for reset:
|
|
||||||
// push pcx
|
|
||||||
// jmp print::reset
|
|
||||||
//
|
|
||||||
// usage for clear:
|
|
||||||
// push pcx
|
|
||||||
// jmp print::clear
|
|
||||||
//
|
|
||||||
// usage for print_byte:
|
|
||||||
// push (register containing byte)
|
|
||||||
// push pcx
|
|
||||||
// jmp print::print_byte
|
|
||||||
//
|
|
||||||
// usage for print_word:
|
|
||||||
// push (register containing word)
|
|
||||||
// push pcx
|
|
||||||
// jmp print::print_word
|
|
||||||
//
|
|
||||||
|
|
||||||
dw display: 0x20000
|
|
||||||
dw current: 0x20000
|
|
||||||
|
|
||||||
// ------------------------------------------
|
|
||||||
// prints the string at addr(arg[0]) to the screen.
|
|
||||||
print:
|
|
||||||
push bpr
|
|
||||||
mov spr, bpr
|
|
||||||
|
|
||||||
ldw bpr, rg0, 8
|
|
||||||
ldw current, rg1
|
|
||||||
|
|
||||||
_print_loop:
|
|
||||||
ldb rg0, acc
|
|
||||||
stb acc, rg1
|
|
||||||
|
|
||||||
addi rg0, 1
|
|
||||||
addi rg1, 1
|
|
||||||
|
|
||||||
cmp acc, zero
|
|
||||||
jne _print_loop
|
|
||||||
jmp _end
|
|
||||||
|
|
||||||
// ------------------------------------------
|
|
||||||
// prints the value of arg[0] to the screen.
|
|
||||||
print_word:
|
|
||||||
// initialise
|
|
||||||
push bpr
|
|
||||||
mov spr, bpr
|
|
||||||
|
|
||||||
// load byte into acc
|
|
||||||
ldw bpr, rg0, 8
|
|
||||||
ldw current, rg1
|
|
||||||
|
|
||||||
stw rg0, rg1
|
|
||||||
addi rg1, 4
|
|
||||||
jmp _end
|
|
||||||
|
|
||||||
// ------------------------------------------
|
|
||||||
// prints the last byte of arg[0] to the screen.
|
|
||||||
print_byte:
|
|
||||||
push bpr
|
|
||||||
mov spr, bpr
|
|
||||||
|
|
||||||
ldw bpr, rg0, 8
|
|
||||||
ldw current, rg1
|
|
||||||
|
|
||||||
stb rg0, rg1
|
|
||||||
addi rg1, 1
|
|
||||||
jmp _end
|
|
||||||
|
|
||||||
// ------------------------------------------
|
|
||||||
// resets the cursor position on the screen to 0x20000. (0,0)
|
|
||||||
reset:
|
|
||||||
push bpr
|
|
||||||
mov spr, bpr
|
|
||||||
ldw display, rg1
|
|
||||||
jmp _end
|
|
||||||
|
|
||||||
// ------------------------------------------
|
|
||||||
// clears the screen
|
|
||||||
clear:
|
|
||||||
push bpr
|
|
||||||
mov spr, bpr
|
|
||||||
// display size = 2000 bytes / 500 words
|
|
||||||
lli 500 rg0
|
|
||||||
ldw display, rg1
|
|
||||||
|
|
||||||
_clear_loop:
|
|
||||||
dec rg0
|
|
||||||
stw zero, rg1
|
|
||||||
addi rg1, 4
|
|
||||||
cmp rg0, zero
|
|
||||||
jgt _clear_loop
|
|
||||||
jmp _end
|
|
||||||
|
|
||||||
// ------------------------------------------
|
|
||||||
// return
|
|
||||||
_end:
|
|
||||||
stw rg1, current
|
|
||||||
|
|
||||||
mov bpr, spr
|
|
||||||
pop bpr
|
|
||||||
return
|
|
||||||
@@ -0,0 +1,80 @@
|
|||||||
|
include fib: "./lib/maths/fib.dsa"
|
||||||
|
include maths: "./lib/maths/core.dsa"
|
||||||
|
include print: "./lib/io/print.dsa"
|
||||||
|
|
||||||
|
dw idt: 0xFFFF0000
|
||||||
|
dw stack: 0x10000
|
||||||
|
init:
|
||||||
|
// setup interrupt handlers
|
||||||
|
ldw idt, idr
|
||||||
|
lwi handle_hard_fault, rg0
|
||||||
|
stw rg0, idr, 4
|
||||||
|
// set up a stack.
|
||||||
|
ldw stack, bpr
|
||||||
|
mov bpr, spr
|
||||||
|
|
||||||
|
dw string: "hello world"
|
||||||
|
start:
|
||||||
|
|
||||||
|
lwi 37, rg0
|
||||||
|
lwi 12, rg1
|
||||||
|
push rg0
|
||||||
|
push rg1
|
||||||
|
call maths::divmod
|
||||||
|
pop rg0 // result
|
||||||
|
pop rg1 // remainder
|
||||||
|
|
||||||
|
push rg1
|
||||||
|
push rg0
|
||||||
|
call print::print_hex_byte
|
||||||
|
call print::print_whitespace
|
||||||
|
pop zero
|
||||||
|
call print::print_hex_byte
|
||||||
|
call print::print_newline
|
||||||
|
|
||||||
|
lwi string, rg0
|
||||||
|
//lwi 10, rg0
|
||||||
|
pusha 4
|
||||||
|
push rg0
|
||||||
|
call print::print
|
||||||
|
//call fib::fib_n
|
||||||
|
pop zero
|
||||||
|
call print::print_newline
|
||||||
|
popa 4
|
||||||
|
|
||||||
|
pusha 4
|
||||||
|
push rg0
|
||||||
|
call print::print
|
||||||
|
//call fib::fib_n
|
||||||
|
pop zero
|
||||||
|
call print::print_newline
|
||||||
|
popa 4
|
||||||
|
|
||||||
|
pusha 4
|
||||||
|
push rg0
|
||||||
|
call print::print
|
||||||
|
//call fib::fib_n
|
||||||
|
pop zero
|
||||||
|
call print::print_newline
|
||||||
|
popa 4
|
||||||
|
|
||||||
|
pusha 4
|
||||||
|
push rg0
|
||||||
|
call print::print
|
||||||
|
//call fib::fib_n
|
||||||
|
pop zero
|
||||||
|
call print::print_newline
|
||||||
|
popa 4
|
||||||
|
|
||||||
|
hlt
|
||||||
|
|
||||||
|
// fault handler in case we fail DSA.
|
||||||
|
dw hard_fault_err: "FATAL: Illegal Instruction or Memory Access!"
|
||||||
|
handle_hard_fault:
|
||||||
|
call print::clear
|
||||||
|
call print::reset
|
||||||
|
lwi hard_fault_err, rg0
|
||||||
|
push rg0
|
||||||
|
call print::print
|
||||||
|
pop zero
|
||||||
|
hlt
|
||||||
@@ -1,18 +0,0 @@
|
|||||||
include print "./lib/print.dsa"
|
|
||||||
|
|
||||||
dw stack: 0x10000
|
|
||||||
db string: "Hello world"
|
|
||||||
|
|
||||||
init:
|
|
||||||
// set up a stack.
|
|
||||||
ldw stack, bpr
|
|
||||||
mov bpr, spr
|
|
||||||
|
|
||||||
start:
|
|
||||||
lwi string, rg1
|
|
||||||
|
|
||||||
push rg1
|
|
||||||
call print::print
|
|
||||||
pop rg1
|
|
||||||
|
|
||||||
hlt
|
|
||||||
@@ -0,0 +1,80 @@
|
|||||||
|
include print "./lib/io/print.dsa"
|
||||||
|
|
||||||
|
dw idt: 0xFFFF0000
|
||||||
|
dw stack: 0x10000
|
||||||
|
init:
|
||||||
|
// setup interrupt handlers
|
||||||
|
ldw idt, idr
|
||||||
|
lwi handle_hard_fault, rg0
|
||||||
|
stw rg0, idr, 4
|
||||||
|
// set up a stack.
|
||||||
|
ldw stack, bpr
|
||||||
|
mov bpr, spr
|
||||||
|
|
||||||
|
|
||||||
|
db string: "I won, the game!"
|
||||||
|
db hexbyte: 0xab
|
||||||
|
dw hexword: 0x1234abcd
|
||||||
|
db replace: "I lost"
|
||||||
|
|
||||||
|
start:
|
||||||
|
// test print string
|
||||||
|
lwi string, rg0
|
||||||
|
push rg0
|
||||||
|
call print::print
|
||||||
|
pop zero
|
||||||
|
|
||||||
|
// test print hex byte.
|
||||||
|
ldb hexbyte, rg0
|
||||||
|
push rg0
|
||||||
|
call print::print_hex_byte
|
||||||
|
pop zero
|
||||||
|
|
||||||
|
// test print hex word.
|
||||||
|
ldw hexword, rg0
|
||||||
|
push rg0
|
||||||
|
call print::print_hex_word
|
||||||
|
pop zero
|
||||||
|
|
||||||
|
// test print char
|
||||||
|
lli 0x40, rg0 // print @
|
||||||
|
push rg0
|
||||||
|
call print::print_byte
|
||||||
|
pop zero
|
||||||
|
|
||||||
|
// test newline
|
||||||
|
call print::print_newline
|
||||||
|
|
||||||
|
lwi string rg0
|
||||||
|
push rg0
|
||||||
|
call print::print
|
||||||
|
|
||||||
|
// test print word
|
||||||
|
lwi 0x31323334, rg0 // print 1234
|
||||||
|
push rg0
|
||||||
|
call print::print_word
|
||||||
|
pop zero
|
||||||
|
|
||||||
|
// test reset cursor pos
|
||||||
|
call print::reset
|
||||||
|
|
||||||
|
// test print string at reset pos
|
||||||
|
lwi replace, rg0
|
||||||
|
push rg0
|
||||||
|
call print::print
|
||||||
|
pop zero
|
||||||
|
|
||||||
|
hlt
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
|
// fault handler in case we fail DSA.
|
||||||
|
dw hard_fault_err: "FATAL: Illegal Instruction or Memory Access!"
|
||||||
|
handle_hard_fault:
|
||||||
|
call print::clear
|
||||||
|
call print::reset
|
||||||
|
lwi hard_fault_err, rg0
|
||||||
|
push rg0
|
||||||
|
call print::print
|
||||||
|
pop zero
|
||||||
|
hlt
|
||||||
Binary file not shown.
Reference in New Issue
Block a user