Compare commits

...

2 Commits

Author SHA1 Message Date
core 65f375dd97
panic hook 2024-01-21 01:42:39 -05:00
core 7fdc97b619
lexer v2 2024-01-21 01:42:38 -05:00
17 changed files with 586 additions and 321 deletions

View File

@ -2,8 +2,10 @@
<module type="EMPTY_MODULE" version="4"> <module type="EMPTY_MODULE" version="4">
<component name="NewModuleRootManager"> <component name="NewModuleRootManager">
<content url="file://$MODULE_DIR$"> <content url="file://$MODULE_DIR$">
<sourceFolder url="file://$MODULE_DIR$/kabel-rs/src" isTestSource="false" />
<sourceFolder url="file://$MODULE_DIR$/kabel/src" isTestSource="false" /> <sourceFolder url="file://$MODULE_DIR$/kabel/src" isTestSource="false" />
<sourceFolder url="file://$MODULE_DIR$/libkabel/src" isTestSource="false" /> <sourceFolder url="file://$MODULE_DIR$/libkabel/src" isTestSource="false" />
<excludeFolder url="file://$MODULE_DIR$/kabel-rs/target" />
<excludeFolder url="file://$MODULE_DIR$/target" /> <excludeFolder url="file://$MODULE_DIR$/target" />
</content> </content>
<orderEntry type="inheritedJdk" /> <orderEntry type="inheritedJdk" />

7
Cargo.lock generated
View File

@ -40,6 +40,12 @@ version = "0.3.3"
source = "registry+https://github.com/rust-lang/crates.io-index" source = "registry+https://github.com/rust-lang/crates.io-index"
checksum = "d77f7ec81a6d05a3abb01ab6eb7590f6083d08449fe5a1c8b1e620283546ccb7" checksum = "d77f7ec81a6d05a3abb01ab6eb7590f6083d08449fe5a1c8b1e620283546ccb7"
[[package]]
name = "hex"
version = "0.4.3"
source = "registry+https://github.com/rust-lang/crates.io-index"
checksum = "7f24254aa9a54b5c858eaee2f5bccdb46aaf0e486a595ed5fd8f86ba55232a70"
[[package]] [[package]]
name = "is-terminal" name = "is-terminal"
version = "0.4.10" version = "0.4.10"
@ -56,6 +62,7 @@ name = "kabel"
version = "0.1.0" version = "0.1.0"
dependencies = [ dependencies = [
"colored", "colored",
"hex",
"is-terminal", "is-terminal",
"libkabel", "libkabel",
"tracing-subscriber", "tracing-subscriber",

View File

@ -12,3 +12,4 @@ libkabel = { version = "0.1", path = "../libkabel", features = ["pretty-emitter"
is-terminal = "0.4" is-terminal = "0.4"
tracing-subscriber = "0.3" tracing-subscriber = "0.3"
colored = "2" colored = "2"
hex = "0.4"

View File

@ -1,26 +1,46 @@
use std::env; use colored::Colorize;
use std::error::Error;
use std::fs::File;
use std::io::{self, Read};
use libkabel::diagnostics::emitters::Emitter; use libkabel::diagnostics::emitters::Emitter;
use libkabel::error::KError; use libkabel::error::KError;
use libkabel::formatter::print_tts;
use libkabel::lexer::token::Token; use libkabel::lexer::token::Token;
use colored::Colorize; use libkabel::source::SourceFile;
use std::error::Error;
use std::io;
use std::{env, fs};
use std::fmt::Write;
fn main() -> Result<(), Box<dyn Error>> { fn main() -> Result<(), Box<dyn Error>> {
std::panic::set_hook(Box::new(|i| {
eprintln!("{}", "----- Kabel has crashed! -----".red());
eprintln!("{} {} {}", "--".red(), "THIS IS NOT YOUR FAULT".bold().red(), "--".red());
eprintln!("{}", "Please report the following Error ID to the Kabel developers, along with your program's complete source code.".red());
let mut panic_info = String::new();
write!(panic_info, "{i}").unwrap();
let error_id = hex::encode(panic_info);
eprintln!("{}{}", "Error ID: ".red(), error_id.italic().red());
eprintln!("{}", "Please, either:".red());
eprintln!("{}", "- Open an issue at https://git.e3t.cc/tm85/kabel, or".red());
eprintln!("{}", "- E-Mail the developers at kabel@e3t.cc".red());
eprintln!("{} {} {}", "-- Remember:".red(), "THIS IS NOT YOUR FAULT".bold().red(), "--".red());
eprintln!("{}", "----- Kabel has crashed! -----".red());
}));
let argv: Vec<String> = env::args().collect(); let argv: Vec<String> = env::args().collect();
if argv.len() != 2 { if argv.len() != 2 {
println!("Usage: {} <file.kab>", &argv[0]); println!("Usage: {} <file.kab>", &argv[0]);
std::process::exit(1); std::process::exit(1);
} }
let mut source_fd = match File::open(&argv[1]) { let text_source = match fs::read_to_string(&argv[1]) {
Err(e) if e.kind() == io::ErrorKind::NotFound => { Err(e) if e.kind() == io::ErrorKind::NotFound => {
std::process::exit(1); std::process::exit(1);
} }
Err(e) => { Err(e) => {
eprintln!( eprintln!(
"error: Tried opening file `{}' and got unexpected error: {}", "error: Tried reading file `{}' and got unexpected error: {}",
argv[1], argv[1],
e.kind() e.kind()
); );
@ -31,26 +51,42 @@ fn main() -> Result<(), Box<dyn Error>> {
tracing_subscriber::fmt::init(); tracing_subscriber::fmt::init();
let mut text_source = String::new(); let source = SourceFile::new(text_source, argv[1].clone());
source_fd.read_to_string(&mut text_source)?;
// Lex! // Lex!
let lexed: Vec<Token> = match libkabel::lexer::lexer(&text_source) { let lexed: Vec<Token> = match libkabel::lexer::lexer(source) {
Err(e) => { Err(e) => {
match e { match e {
KError::InternalError(e) => { KError::InternalError(e) => {
eprintln!("{} {}", eprintln!(
"error: Internal Kabel error!".red(), "{} {}",
"THIS IS NOT YOUR FAULT.".bold().red()); "error: Internal Kabel error!".red(),
eprintln!("{}", "error: Please report this error to the kabel developers along with your".red()); "THIS IS NOT YOUR FAULT.".bold().red()
eprintln!("{}", "fail: program's complete source code. Either"); );
eprintln!("{}", "fail: - Open an Issue at https://git.e3t.cc/tm85/kabel, or".red()); eprintln!(
eprintln!("{}", "fail: - E-Mail the developers at kabel@e3t.cc".red()); "{}",
"error: Please report this error to the kabel developers along with your"
.red()
);
eprintln!("{}", "fail: program's complete source code. Either".red());
eprintln!(
"{}",
"fail: - Open an Issue at https://git.e3t.cc/tm85/kabel, or".red()
);
eprintln!(
"{}",
"fail: - E-Mail the developers at kabel@e3t.cc".red()
);
eprintln!("{} {:?}", "fail: Error message follows:".red(), e); eprintln!("{} {:?}", "fail: Error message follows:".red(), e);
} }
KError::UserError(diags) => { KError::UserError(diags, src_map) => {
//eprintln!("{}", libkabel::diagnostics::emitters::basic::BasicEmitter::emit(diags, text_source)); //eprintln!("{}", libkabel::diagnostics::emitters::basic::BasicEmitter::emit(diags, text_source));
eprintln!("{}", libkabel::diagnostics::emitters::pretty::PrettyEmitter::emit(diags, text_source, argv[1].clone())); eprintln!(
"{}",
libkabel::diagnostics::emitters::pretty::PrettyEmitter::emit(
diags, src_map
)
);
} }
} }
std::process::exit(1); std::process::exit(1);
@ -58,7 +94,7 @@ fn main() -> Result<(), Box<dyn Error>> {
Ok(lexed) => lexed, Ok(lexed) => lexed,
}; };
println!("{:#?}", lexed); print_tts(&lexed);
Ok(()) Ok(())
} }

View File

@ -1,5 +1,6 @@
use crate::diagnostics::Diagnostic;
use crate::diagnostics::emitters::Emitter; use crate::diagnostics::emitters::Emitter;
use crate::diagnostics::Diagnostic;
use crate::source::SourceFile;
use std::fmt::Write; use std::fmt::Write;
pub struct BasicEmitter; pub struct BasicEmitter;
@ -7,7 +8,7 @@ pub struct BasicEmitter;
impl Emitter for BasicEmitter { impl Emitter for BasicEmitter {
type Output = String; type Output = String;
fn emit(diag: Vec<Diagnostic>, _source: String, _source_name: String) -> Self::Output { fn emit(diag: Vec<Diagnostic>, _source: SourceFile) -> Self::Output {
let mut output = String::new(); let mut output = String::new();
for msg in diag { for msg in diag {
@ -16,4 +17,4 @@ impl Emitter for BasicEmitter {
output output
} }
} }

View File

@ -1,11 +1,11 @@
use crate::diagnostics::Diagnostic; use crate::diagnostics::Diagnostic;
use crate::source::SourceFile;
pub mod basic; pub mod basic;
#[cfg(feature = "pretty-emitter")] #[cfg(feature = "pretty-emitter")]
pub mod pretty; pub mod pretty;
pub(crate) mod util;
pub trait Emitter { pub trait Emitter {
type Output; type Output;
fn emit(diag: Vec<Diagnostic>, source: String, source_name: String) -> Self::Output; fn emit(diag: Vec<Diagnostic>, source: SourceFile) -> Self::Output;
} }

View File

@ -1,19 +1,18 @@
use crate::diagnostics::{Diagnostic, DiagnosticType};
use crate::diagnostics::emitters::Emitter; use crate::diagnostics::emitters::Emitter;
use std::fmt::Write; use crate::diagnostics::{Diagnostic, DiagnosticType};
use crate::source::SourceFile;
use colored::{ColoredString, Colorize}; use colored::{ColoredString, Colorize};
use crate::diagnostics::emitters::util::{get_line, pos_to_line_col}; use std::fmt::Write;
pub struct PrettyEmitter; pub struct PrettyEmitter;
impl Emitter for PrettyEmitter { impl Emitter for PrettyEmitter {
type Output = String; type Output = String;
fn emit(diag: Vec<Diagnostic>, source: String, source_name: String) -> Self::Output { fn emit(diag: Vec<Diagnostic>, source_map: SourceFile) -> Self::Output {
let mut output = String::new(); let mut output = String::new();
for msg in diag { for msg in diag {
match msg.diag_type { match msg.diag_type {
DiagnosticType::Error => { DiagnosticType::Error => {
write!(output, "{}", "error".bold().red()).unwrap(); write!(output, "{}", "error".bold().red()).unwrap();
@ -21,7 +20,9 @@ impl Emitter for PrettyEmitter {
DiagnosticType::Warning => { DiagnosticType::Warning => {
write!(output, "{}", "warning".bold().yellow()).unwrap(); write!(output, "{}", "warning".bold().yellow()).unwrap();
} }
_ => { continue; } _ => {
continue;
}
} }
writeln!(output, ": {}", msg.message.bold()).unwrap(); writeln!(output, ": {}", msg.message.bold()).unwrap();
@ -29,8 +30,8 @@ impl Emitter for PrettyEmitter {
let mut biggest_line_no = 0; let mut biggest_line_no = 0;
for span in &msg.spans { for span in &msg.spans {
let (s_line, _) = pos_to_line_col(span.span.start, &source); let ((s_line, _), (e_line, _)) = source_map.span_position(&span.span);
let (e_line, _) = pos_to_line_col(span.span.start, &source);
if s_line > biggest_line_no { if s_line > biggest_line_no {
biggest_line_no = s_line; biggest_line_no = s_line;
} }
@ -42,28 +43,49 @@ impl Emitter for PrettyEmitter {
let line_no_padding = biggest_line_no.to_string().len(); let line_no_padding = biggest_line_no.to_string().len();
for labeled_span in &msg.spans { for labeled_span in &msg.spans {
let (line, start_col) = pos_to_line_col(labeled_span.span.start, &source); let ((line, start_col), (_, end_col)) =
let (_, end_col) = pos_to_line_col(labeled_span.span.end, &source); source_map.span_position(&labeled_span.span);
writeln!(output, "{}{} {}:{}:{}", " ".repeat(line_no_padding), "-->".bright_blue().bold(), source_name, line, start_col).unwrap(); writeln!(
output,
"{}{} {}:{}:{}",
" ".repeat(line_no_padding),
"-->".bright_blue().bold(),
source_map.filename(),
line + 1,
start_col + 1
)
.unwrap();
let line_hdr_padding = line.to_string().len() + 1; let line_hdr_padding = line.to_string().len() + 1;
writeln!(output, "{}{}", " ".repeat(line_hdr_padding), "|".bright_blue().bold()).unwrap(); writeln!(
writeln!(output, "{}{} {} {}", line.to_string().bright_blue().bold(), " ".repeat(line_no_padding - line.to_string().len()), "|".bright_blue().bold(), get_line(line-1, &source).unwrap_or("<line unavailable>")).unwrap(); output,
"{}{}",
" ".repeat(line_hdr_padding),
"|".bright_blue().bold()
)
.unwrap();
writeln!(
output,
"{}{} {} {}",
(line + 1).to_string().bright_blue().bold(),
" ".repeat(line_no_padding - line.to_string().len()),
"|".bright_blue().bold(),
source_map.line_at(line).unwrap_or("<line unavailable>")
)
.unwrap();
let mut end_char = match labeled_span.span_type { let mut end_char = match labeled_span.span_type {
DiagnosticType::Error => '^'.to_string().bold().red(), DiagnosticType::Error => '^'.to_string().bold().red(),
DiagnosticType::Warning => '^'.to_string().bold().yellow(), DiagnosticType::Warning => '^'.to_string().bold().yellow(),
DiagnosticType::Help => { DiagnosticType::Help | DiagnosticType::Hint => {
if labeled_span.label.is_some() { if labeled_span.label.is_some() {
'-'.to_string().bold().bright_blue() '-'.to_string().bold().bright_blue()
} else { } else {
'~'.to_string().bold().bright_blue() '~'.to_string().bold().bright_blue()
} }
}, }
DiagnosticType::SecondaryError => { DiagnosticType::SecondaryError => {
if labeled_span.label.is_some() { if labeled_span.label.is_some() {
'-'.to_string().bold().red() '-'.to_string().bold().red()
@ -77,13 +99,12 @@ impl Emitter for PrettyEmitter {
(_, None) => ColoredString::from(""), (_, None) => ColoredString::from(""),
(DiagnosticType::Error, Some(e)) => e.bold().red(), (DiagnosticType::Error, Some(e)) => e.bold().red(),
(DiagnosticType::Warning, Some(e)) => e.bold().yellow(), (DiagnosticType::Warning, Some(e)) => e.bold().yellow(),
(DiagnosticType::Help, Some(e)) => e.bold().bright_blue(), (DiagnosticType::Help, Some(e)) | (DiagnosticType::Hint, Some(e)) => {
(DiagnosticType::SecondaryError, Some(e)) => e.bold().red() e.bold().bright_blue()
}
(DiagnosticType::SecondaryError, Some(e)) => e.bold().red(),
}; };
println!("{} {}", labeled_span.span.start, labeled_span.span.end);
println!("{} {}", end_col, start_col);
let underline_length = if end_col == start_col { let underline_length = if end_col == start_col {
end_char = "".into(); end_char = "".into();
1 1
@ -95,14 +116,50 @@ impl Emitter for PrettyEmitter {
let underline = match labeled_span.span_type { let underline = match labeled_span.span_type {
DiagnosticType::Error => "^".repeat(underline_length).to_string().bold().red(), DiagnosticType::Error => "^".repeat(underline_length).to_string().bold().red(),
DiagnosticType::Warning => "^".repeat(underline_length).to_string().bold().yellow(), DiagnosticType::Warning => {
DiagnosticType::Help => "~".repeat(underline_length).to_string().bold().bright_blue(), "^".repeat(underline_length).to_string().bold().yellow()
DiagnosticType::SecondaryError => "~".repeat(underline_length).to_string().bold().red() }
DiagnosticType::Help | DiagnosticType::Hint => "~"
.repeat(underline_length)
.to_string()
.bold()
.bright_blue(),
DiagnosticType::SecondaryError => {
"~".repeat(underline_length).to_string().bold().red()
}
}; };
writeln!(output, "{}{} {}{}{} {}", " ".repeat(line_hdr_padding), "|".bright_blue().bold(), " ".repeat(start_col-1), underline, end_char, message).unwrap(); writeln!(
output,
"{}{}{}{}{} {}",
" ".repeat(line_hdr_padding),
"|".bright_blue().bold(),
" ".repeat(start_col),
underline,
end_char,
message
)
.unwrap();
writeln!(output).unwrap(); writeln!(output).unwrap();
} }
for hint in &msg.hints {
/*
error:
hint:
help:
warning:
*/
let hdr = match hint.hint_type {
DiagnosticType::Error => "error: ".bold().red(),
DiagnosticType::Warning => "warning: ".bold().yellow(),
DiagnosticType::Help => "help: ".bright_blue().bold(),
DiagnosticType::Hint => "hint: ".bold(),
DiagnosticType::SecondaryError => "error: ".bold().red(),
};
writeln!(output, "{}{}", hdr, hint.message).unwrap();
}
} }
output output

View File

@ -1,20 +0,0 @@
pub fn pos_to_line_col(pos: usize, source: &str) -> (usize, usize) {
let mut line = 1;
let mut col = 1;
for (n, c) in source.chars().enumerate() {
if c == '\n' {
line += 1;
col = 1;
} else {
col += 1;
}
if n == pos {
break;
}
}
(line, col)
}
pub fn get_line(line: usize, source: &str) -> Option<&str> {
source.split('\n').nth(line)
}

View File

@ -0,0 +1,111 @@
#[macro_export]
macro_rules! diag {
(error,$m:expr,$( $span:expr )*) => {
$crate::diagnostics::Diagnostic {
diag_type: $crate::diagnostics::DiagnosticType::Error,
message: $m.to_string(),
spans: vec![
$( $span )*
],
hints: vec![]
}
};
(warn,$m:expr,$( $span:expr )*) => {
$crate::diagnostics::Diagnostic {
diag_type: $crate::diagnostics::DiagnosticType::Warning,
message: $m.to_string(),
spans: vec![
$( $span )*
],
hints: vec![]
}
};
}
#[macro_export]
macro_rules! span {
(at: $at:expr) => {
$crate::diagnostics::span::Span::new($at, $at)
};
(from: $from:expr, to: $to:expr) => {
$crate::diagnostics::span::Span::new($from, $to)
};
}
#[macro_export]
macro_rules! assemble_label {
($ty:expr,$span:expr,$msg:expr) => {
$crate::diagnostics::SpanWithLabel {
span_type: $ty,
span: $span,
label: $msg,
}
};
}
#[macro_export]
macro_rules! label_span {
(type: error,$span:expr) => {
$crate::assemble_label!($crate::diagnostics::DiagnosticType::Error, $span, None)
};
(type: error,$span:expr,$msg:expr) => {
$crate::assemble_label!(
$crate::diagnostics::DiagnosticType::Error,
$span,
Some($msg.to_string())
)
};
(type: secondary_error,$span:expr) => {
$crate::assemble_label!(
$crate::diagnostics::DiagnosticType::SecondaryError,
$span,
None
)
};
(type: secondary_error,$span:expr,$msg:expr) => {
$crate::assemble_label!(
$crate::diagnostics::DiagnosticType::SecondaryError,
$span,
Some($msg.to_string())
)
};
(type: warning,$span:expr) => {
$crate::assemble_label!($crate::diagnostics::DiagnosticType::Warning, $span, None)
};
(type: warning,$span:expr,$msg:expr) => {
$crate::assemble_label!(
$crate::diagnostics::DiagnosticType::Warning,
$span,
Some($msg.to_string())
)
};
(type: help,$span:expr) => {
$crate::assemble_label!($crate::diagnostics::DiagnosticType::Help, $span, None)
};
(type: help,$span:expr,$msg:expr) => {
$crate::assemble_label!(
$crate::diagnostics::DiagnosticType::Help,
$span,
Some($msg.to_string())
)
};
}
#[macro_export]
macro_rules! hint {
(help: $msg:expr) => {
$crate::diagnostics::DiagnosticHint {
hint_type: $crate::diagnostics::DiagnosticType::Help,
message: $msg.to_string(),
}
};
(hint: $msg:expr) => {
$crate::diagnostics::DiagnosticHint {
hint_type: $crate::diagnostics::DiagnosticType::Hint,
message: $msg.to_string(),
}
};
}

View File

@ -1,13 +1,16 @@
use crate::diagnostics::span::Span; use crate::diagnostics::span::Span;
pub mod span;
pub mod emitters; pub mod emitters;
pub mod span;
#[macro_use]
pub mod macros;
#[derive(Debug, Clone, PartialEq, Eq)] #[derive(Debug, Clone, PartialEq, Eq)]
pub struct Diagnostic { pub struct Diagnostic {
pub diag_type: DiagnosticType, pub diag_type: DiagnosticType,
pub spans: Vec<SpanWithLabel>, pub spans: Vec<SpanWithLabel>,
pub message: String, pub message: String,
pub hints: Vec<DiagnosticHint>,
} }
#[derive(Debug, Clone, Copy, PartialEq, Eq)] #[derive(Debug, Clone, Copy, PartialEq, Eq)]
@ -15,7 +18,8 @@ pub enum DiagnosticType {
Error, Error,
Warning, Warning,
Help, Help,
SecondaryError Hint,
SecondaryError,
} }
#[derive(Debug, Clone, PartialEq, Eq)] #[derive(Debug, Clone, PartialEq, Eq)]
@ -23,4 +27,22 @@ pub struct SpanWithLabel {
pub span: Span, pub span: Span,
pub span_type: DiagnosticType, pub span_type: DiagnosticType,
pub label: Option<String>, pub label: Option<String>,
} }
#[derive(Debug, Clone, PartialEq, Eq)]
pub struct DiagnosticHint {
pub hint_type: DiagnosticType,
pub message: String,
}
impl Diagnostic {
pub fn with_hint(mut self, hint: DiagnosticHint) -> Self {
self.hints.push(hint);
Self {
diag_type: self.diag_type,
spans: self.spans,
message: self.message,
hints: self.hints,
}
}
}

View File

@ -1,11 +1,11 @@
#[derive(Debug, Clone, PartialEq, Eq, Copy)] #[derive(Debug, Clone, PartialEq, Eq, Copy)]
pub struct Span { pub struct Span {
pub start: usize, pub start: usize,
pub end: usize pub end: usize,
} }
impl Span { impl Span {
pub fn new(start: usize, end: usize) -> Self { pub fn new(start: usize, end: usize) -> Self {
Self { start, end } Self { start, end }
} }
} }

View File

@ -1,10 +1,11 @@
use crate::diagnostics::Diagnostic; use crate::diagnostics::Diagnostic;
use crate::source::SourceFile;
#[derive(Debug, Clone, PartialEq, Eq)] #[derive(Debug, Clone, PartialEq, Eq)]
pub enum KError { pub enum KError {
InternalError(InternalError), InternalError(InternalError),
UserError(Vec<Diagnostic>) UserError(Vec<Diagnostic>, SourceFile),
} }
#[derive(Debug, Clone, PartialEq, Eq)] #[derive(Debug, Clone, PartialEq, Eq)]
pub enum InternalError {} pub enum InternalError {}

11
libkabel/src/formatter.rs Normal file
View File

@ -0,0 +1,11 @@
use crate::lexer::token::Token;
use std::fmt::Write;
use tracing::debug;
pub fn print_tts(tokens: &[Token]) {
let mut out = String::new();
for token in tokens {
write!(out, "{:?} ", token.tt).unwrap();
}
debug!("{out}");
}

View File

@ -1,225 +1,152 @@
use token::{ArithOperator, Bracket, Literal, Statement, Token};
use tracing::debug;
use crate::diagnostics::{Diagnostic, DiagnosticType, SpanWithLabel};
use crate::diagnostics::span::Span;
use crate::error::KError; use crate::error::KError;
use crate::lexer::token::{Token, TokenType};
use crate::source::SourceFile;
use crate::{diag, hint, label_span, span};
#[macro_use]
pub mod token; pub mod token;
#[derive(Debug)] pub fn lexer(mut source: SourceFile) -> Result<Vec<Token>, KError> {
enum State { let mut tokens = vec![];
Stringing, let mut errors = vec![];
Commenting,
Numbering,
BuildingToken,
}
pub fn lexer(text_source: &str) -> Result<Vec<Token>, KError> { 'main: while let Some(c) = source.next() {
debug!("lexing!"); match c {
'(' => tokens.push(token!(at: source.pos(), TokenType::LeftParenthesis)),
')' => tokens.push(token!(at: source.pos(), TokenType::RightParenthesis)),
let mut current_token = String::new(); '-' => tokens.push(token!(at: source.pos(), TokenType::Minus)),
let mut lexed = Vec::new(); '+' => tokens.push(token!(at: source.pos(), TokenType::Plus)),
let mut state: State = State::BuildingToken; '*' => tokens.push(token!(at: source.pos(), TokenType::Star)),
let mut chars = text_source.chars().peekable(); ',' => tokens.push(token!(at: source.pos(), TokenType::Comma)),
let mut pos: usize = 0; ';' => tokens.push(token!(at: source.pos(), TokenType::Semicolon)),
let mut span_start: usize = 0; ':' => tokens.push(token!(at: source.pos(), TokenType::Colon)),
'=' => tokens.push(token!(at: source.pos(), TokenType::Equals)),
while let Some(c) = chars.next() { n1 if n1.is_ascii_digit() => {
pos += 1; source.start_token();
let mut num_lit = String::from(n1);
match state { while let Some(c) = source.peek() {
State::Commenting => { if c.is_ascii_digit() {
// Stop commenting at end of line num_lit.push(source.next().expect("unreachable"))
if c == '\n' {
state = State::BuildingToken;
}
}
State::Stringing => {
// If next char is an unescaped quote
// TODO: when possible, make this 1 `if'. Ability to
// do that remains unimplemented, hence the stupid copied
// code below.
if c != '\n' {
if let Some(c_peek) = chars.peek() {
if c != '\\' && *c_peek == '\"' {
chars.next();
pos += 1;
current_token.push(c);
let tok_cpy = current_token.clone();
lexed.push(Token::Literal(Span::new(span_start, pos), Literal::Str(tok_cpy)));
state = State::BuildingToken;
current_token = String::new();
} else {
current_token.push(c);
}
} else { } else {
return Err(KError::UserError(vec![ break;
Diagnostic {
diag_type: DiagnosticType::Error,
message: "unterminated string literal".to_string(),
spans: vec![
SpanWithLabel {
span: Span::new(span_start-1, span_start-1),
span_type: DiagnosticType::SecondaryError,
label: Some("string began here".to_string())
},
SpanWithLabel {
span: Span::new(pos, pos),
span_type: DiagnosticType::Error,
label: Some("expected end quote here".to_string())
}
]
}
]));
} }
} else { }
return Err(KError::UserError(vec![
Diagnostic { if source.peek() == Some('.') {
diag_type: DiagnosticType::Error, if let Some(two) = source.peek_two() {
message: "unterminated string literal".to_string(), if two.is_ascii_digit() {
spans: vec![ num_lit.push(source.next().expect("unreachable"));
SpanWithLabel { while let Some(c) = source.peek() {
span: Span::new(span_start-1, span_start-1), if c.is_ascii_digit() {
span_type: DiagnosticType::SecondaryError, num_lit.push(source.next().expect("unreachable"))
label: Some("string began here".to_string()) } else {
}, break;
SpanWithLabel {
span: Span::new(pos, pos),
span_type: DiagnosticType::Error,
label: Some("expected end quote here".to_string())
} }
]
}
]));
}
}
State::Numbering => {
current_token.push(c);
// If next char isn't numeric, is at end of this number literal
if let Some(c_peek) = chars.peek() {
if !c_peek.is_ascii_digit() {
let num = match current_token.parse::<f64>() {
Ok(n) => n,
Err(_) => {
debug!("{} {}", span_start, pos);
return Err(KError::UserError(vec![
Diagnostic {
message: "invalid numeric literal".to_string(),
diag_type: DiagnosticType::Error,
spans: vec![
SpanWithLabel {
span: Span::new(span_start, pos),
span_type: DiagnosticType::Error,
label: Some("this is not a valid numeric literal".to_string()),
}
],
}
]));
} }
}; }
}
}
lexed.push(Token::Literal( // try to parse the lit
Span::new(span_start, pos), let val: f64 = match num_lit.parse() {
Literal::Num(num) Ok(val) => val,
)); Err(_) => {
state = State::BuildingToken; errors.push(diag!(error, "Invalid numeric literal", label_span!(type: error, source.end_token(), "this is not a valid numeric literal")));
current_token = String::new(); break 'main;
}
};
tokens.push(token!(span: source.end_token(), TokenType::NumericLiteral(val)));
}
c1 if c1.is_ascii_alphabetic() || c1 == '_' => {
source.start_token();
let mut ident = String::from(c1);
while let Some(c) = source.peek() {
if c.is_ascii_alphanumeric() || c == '_' {
ident.push(source.next().expect("unreachable"));
} else {
break;
}
}
let span = source.end_token();
tokens.push(match ident.as_str() {
"to" => token!(span: span, TokenType::To),
"with" => token!(span: span, TokenType::With),
"for" => token!(span: span, TokenType::For),
"in" => token!(span: span, TokenType::In),
_ => token!(span: span, TokenType::Identifier(ident)),
})
}
'\"' => {
source.start_token();
let mut string_lit = String::new();
while let Some(c) = source.peek() {
if c != '\"' {
string_lit.push(source.next().expect("unreachable"));
} else {
source.next(); // consume the "
break;
}
}
let span = source.end_token();
tokens.push(token!(span: span, TokenType::StringLiteral(string_lit)));
}
'#' => {
// read until end of while
while let Some(c2) = source.next() {
if c2 == '\n' {
break;
} }
} }
} }
State::BuildingToken => { w if w.is_whitespace() => {}
if c == '\"' { unknown => {
state = State::Stringing; let mut err = diag!(
current_token = String::new(); error,
// We don't need to push c because it's the quote delimiter, format!("Unexpected character `{unknown}`"),
// which has already served its purpose as an indicator label_span!(type: error, span!(at: source.pos()), "here")
span_start = pos; );
continue;
} else if c.is_ascii_digit() { if let Some(tkn) = tokens.last() {
state = State::Numbering; match tkn.tt {
current_token = c.to_string(); TokenType::NumericLiteral(_) => {
span_start = pos; err = err
continue; .with_hint(hint!(help: "last token detected was a numeric literal"))
.with_hint(
hint!(help: "this is most likely an invalid numeric literal"),
);
if unknown == '.' {
err = err.with_hint(hint!(hint: "unexpected character was a `.`, did you forget to add a 0 at the end (e.g. `5.` instead of `5.0`)?"));
}
}
_ => {}
}
} }
// Known meaningful tokens errors.push(err);
// fatal error - exit loop
if current_token.is_empty() { break;
span_start = pos;
}
current_token.push(c);
match current_token.as_str() {
"\n" => {
continue;
}
"#" => {
state = State::Commenting;
current_token = String::new();
}
";" => {
lexed.push(Token::Terminator(Span::new(span_start, pos)));
current_token = String::new();
}
"if " => {
lexed.push(Token::Statement(Span::new(span_start, pos), Statement::Conditional));
current_token = String::new();
}
"to " => {
lexed.push(Token::Statement(Span::new(span_start, pos), Statement::FunctionDef));
current_token = String::new();
}
"for " => {
lexed.push(Token::Statement(Span::new(span_start, pos), Statement::ForLoop));
current_token = String::new();
}
"while " => {
lexed.push(Token::Statement(Span::new(span_start, pos), Statement::WhileLoop));
current_token = String::new();
}
"(" => {
lexed.push(Token::Bracket(Span::new(span_start, pos), Bracket::Open));
current_token = String::new();
}
")" => {
lexed.push(Token::Bracket(Span::new(span_start, pos), Bracket::Close));
current_token = String::new();
}
"*" => {
lexed.push(Token::ArithOperator(Span::new(span_start, pos), ArithOperator::Multiply));
current_token = String::new();
}
"/" => {
lexed.push(Token::ArithOperator(Span::new(span_start, pos), ArithOperator::Divide));
current_token = String::new();
}
"+" => {
lexed.push(Token::ArithOperator(Span::new(span_start, pos), ArithOperator::Add));
current_token = String::new();
}
"-" => {
lexed.push(Token::ArithOperator(Span::new(span_start, pos), ArithOperator::Subtract));
current_token = String::new();
}
"^" => {
lexed.push(Token::ArithOperator(Span::new(span_start, pos), ArithOperator::Exponentiate));
current_token = String::new();
}
"%" => {
lexed.push(Token::ArithOperator(Span::new(span_start, pos), ArithOperator::Reduce));
current_token = String::new();
}
_ => {}
}
} }
} }
debug!("{} {:?} {} {:?}", &c, &state, &current_token, &lexed);
} }
Ok(lexed) if !errors.is_empty() {
Err(KError::UserError(errors, source))
} else {
Ok(tokens)
}
} }

View File

@ -1,51 +1,82 @@
use crate::diagnostics::span::Span; use crate::diagnostics::span::Span;
use crate::variables; use std::fmt::{Display, Formatter};
// parts of Token #[derive(Debug, PartialEq, Clone)]
pub struct Token {
#[derive(Debug)] pub tt: TokenType,
pub enum ArithOperator { pub span: Span,
Add,
Subtract,
Multiply,
Divide,
Exponentiate,
Reduce,
} }
#[derive(Debug)] #[derive(Debug, PartialEq, Clone)]
pub enum BooleanOperator { pub enum TokenType {
And, LeftParenthesis, // (
Or, RightParenthesis, // )
Comma, // ,
Minus, // -
Plus, // +
Star, // *
Semicolon,
Colon,
Equals,
To,
With,
For,
In,
Identifier(String),
NumericLiteral(f64),
StringLiteral(String),
} }
#[derive(Debug)] impl Display for Token {
pub enum Literal { fn fmt(&self, f: &mut Formatter<'_>) -> std::fmt::Result {
Str(String), write!(f, "{}", self.tt)
Num(f64), }
} }
#[derive(Debug)] impl Display for TokenType {
pub enum Statement { fn fmt(&self, f: &mut Formatter<'_>) -> std::fmt::Result {
Conditional, match self {
ForLoop, TokenType::LeftParenthesis => write!(f, "("),
WhileLoop, TokenType::RightParenthesis => write!(f, ")"),
FunctionDef, TokenType::Comma => write!(f, ","),
TokenType::Minus => write!(f, "-"),
TokenType::Plus => write!(f, "+"),
TokenType::Star => write!(f, "*"),
TokenType::Semicolon => writeln!(f, ";"),
TokenType::To => write!(f, "to"),
TokenType::Identifier(i) => write!(f, "{i}"),
TokenType::Colon => write!(f, ":"),
TokenType::Equals => write!(f, "="),
TokenType::NumericLiteral(val) => write!(f, "{val}"),
TokenType::StringLiteral(val) => write!(f, "\"{val}\""),
TokenType::With => write!(f, "with"),
TokenType::For => write!(f, "for"),
TokenType::In => write!(f, "in"),
}
}
} }
#[derive(Debug)] macro_rules! token {
pub enum Bracket { (start: $start:expr, end: $end:expr, $tt:expr) => {
Open, $crate::lexer::token::Token {
Close, tt: $tt,
} span: $crate::diagnostics::span::Span::new($start, $end),
}
#[derive(Debug)] };
pub enum Token { (at: $at:expr, $tt:expr) => {
Literal(Span, Literal), $crate::lexer::token::Token {
ArithOperator(Span, ArithOperator), tt: $tt,
Statement(Span, Statement), span: $crate::diagnostics::span::Span::new($at, $at),
Bracket(Span, Bracket), }
Variable(Span, variables::Variable), };
Terminator(Span), (span: $span:expr, $tt:expr) => {
$crate::lexer::token::Token {
tt: $tt,
span: $span,
}
};
} }

View File

@ -1,5 +1,7 @@
pub mod modules;
pub mod variables;
pub mod diagnostics; pub mod diagnostics;
pub mod error;
pub mod formatter;
pub mod lexer; pub mod lexer;
pub mod error; pub mod modules;
pub mod source;
pub mod variables;

76
libkabel/src/source.rs Normal file
View File

@ -0,0 +1,76 @@
use crate::diagnostics::span::Span;
#[derive(PartialEq, Eq, Clone, Debug)]
pub struct SourceFile {
inner_original: String,
pos: usize,
current_token_start_pos: Option<usize>,
name: String,
}
impl SourceFile {
pub fn new(source: String, name: String) -> Self {
SourceFile {
inner_original: source,
pos: 0,
current_token_start_pos: None,
name,
}
}
pub fn next(&mut self) -> Option<char> {
self.pos += 1;
self.inner_original.chars().nth(self.pos - 1)
}
pub fn peek(&self) -> Option<char> {
self.inner_original.chars().nth(self.pos)
}
pub fn peek_two(&self) -> Option<char> {
self.inner_original.chars().nth(self.pos + 1)
}
pub fn pos(&self) -> usize {
self.pos
}
pub fn start_token(&mut self) {
self.current_token_start_pos = Some(self.pos)
}
pub fn end_token(&mut self) -> Span {
if let Some(start) = self.current_token_start_pos {
self.current_token_start_pos = None;
Span::new(start, self.pos)
} else {
panic!("tried to end a token when none was started");
}
}
pub fn position_of(&self, pos: &usize) -> (usize, usize) {
let mut line = 0;
let mut col = 0;
for (n, c) in self.inner_original.chars().enumerate() {
if c == '\n' {
line += 1;
col = 0;
} else {
col += 1;
}
if n == *pos {
break;
}
}
(line, col)
}
pub fn span_position(&self, span: &Span) -> ((usize, usize), (usize, usize)) {
(self.position_of(&span.start), self.position_of(&span.end))
}
pub fn line_at(&self, line: usize) -> Option<&str> {
self.inner_original.split('\n').nth(line)
}
pub fn filename(&self) -> &str {
&self.name
}
}