schala/schala-lang/language/src/lib.rs

336 lines
11 KiB
Rust
Raw Normal View History

2018-07-16 03:40:35 -07:00
#![feature(trace_macros)]
#![feature(custom_attribute)]
//#![feature(unrestricted_attribute_tokens)]
2018-04-03 23:24:13 -07:00
#![feature(slice_patterns, box_patterns, box_syntax)]
2018-11-11 18:04:44 -08:00
//! `schala-lang` is where the Schala programming language is actually implemented.
//! It defines the `Schala` type, which contains the state for a Schala REPL, and implements
//! `ProgrammingLanguageInterface` and the chain of compiler passes for it.
2018-03-23 18:43:43 -07:00
extern crate itertools;
#[macro_use]
extern crate lazy_static;
#[macro_use]
extern crate maplit;
extern crate schala_repl;
2018-05-02 02:14:36 -07:00
#[macro_use]
2018-10-19 09:57:35 -07:00
extern crate schala_lang_codegen;
2019-02-23 00:34:44 -08:00
extern crate ena;
2018-03-23 18:43:43 -07:00
2019-05-21 02:06:34 -07:00
use stopwatch::Stopwatch;
2019-05-27 15:06:50 -07:00
use std::time::Duration;
use std::cell::RefCell;
use std::rc::Rc;
2019-05-26 04:16:40 -07:00
use std::collections::HashSet;
use itertools::Itertools;
use schala_repl::{ProgrammingLanguageInterface,
ComputationRequest, ComputationResponse,
LangMetaRequest, LangMetaResponse, GlobalOutputStats,
2019-05-25 19:31:41 -07:00
DebugResponse, DebugAsk};
/// Shorthand for heap-allocating an expression: `bx!(e)` expands to `Box::new(e)`.
macro_rules! bx {
    ($value:expr) => {
        Box::new($value)
    };
}
2019-02-17 03:36:12 -08:00
#[macro_use]
mod util;
#[macro_use]
mod typechecking;
mod tokenizing;
2018-06-04 19:25:40 -07:00
mod ast;
mod parsing;
mod symbol_table;
2019-02-17 03:36:12 -08:00
mod builtin;
2018-06-04 19:12:48 -07:00
mod reduced_ast;
mod eval;
/// All the state necessary to parse and execute a Schala program are stored in this struct.
2018-11-11 18:04:44 -08:00
/// `state` represents the execution state for the AST-walking interpreter, the other fields
/// should be self-explanatory.
pub struct Schala {
2019-01-06 01:58:16 -08:00
source_reference: SourceReference,
state: eval::State<'static>,
symbol_table: Rc<RefCell<symbol_table::SymbolTable>>,
2018-11-08 20:30:17 -08:00
type_context: typechecking::TypeContext<'static>,
2018-10-20 14:27:00 -07:00
active_parser: Option<parsing::Parser>,
}
2018-09-22 00:24:27 -07:00
impl Schala {
2019-03-19 19:26:05 -07:00
fn handle_docs(&self, source: String) -> LangMetaResponse {
LangMetaResponse::Docs {
2019-05-14 11:15:12 -07:00
doc_string: format!("Schala item `{}` : <<Schala-lang documentation not yet implemented>>", source)
2019-03-19 19:26:05 -07:00
}
}
2018-09-22 00:24:27 -07:00
}
2018-07-16 03:40:35 -07:00
impl Schala {
2018-11-11 18:04:44 -08:00
/// Creates a new Schala environment *without* any prelude.
2018-06-03 18:43:31 -07:00
fn new_blank_env() -> Schala {
let symbols = Rc::new(RefCell::new(symbol_table::SymbolTable::new()));
Schala {
2019-01-06 01:58:16 -08:00
source_reference: SourceReference::new(),
symbol_table: symbols.clone(),
state: eval::State::new(symbols),
2018-11-06 13:44:52 -08:00
type_context: typechecking::TypeContext::new(),
2018-10-20 14:27:00 -07:00
active_parser: None,
}
}
2018-06-03 18:43:31 -07:00
2018-11-11 18:04:44 -08:00
/// Creates a new Schala environment with the standard prelude, which is defined as ordinary
/// Schala code in the file `prelude.schala`
2018-06-03 18:43:31 -07:00
pub fn new() -> Schala {
2018-11-05 20:55:03 -08:00
let prelude = include_str!("prelude.schala");
2018-06-03 18:43:31 -07:00
let mut s = Schala::new_blank_env();
2019-03-14 00:15:13 -07:00
2019-05-26 04:16:40 -07:00
let request = ComputationRequest { source: prelude, debug_requests: HashSet::default() };
2019-03-14 00:15:13 -07:00
s.run_computation(request);
2018-06-03 18:43:31 -07:00
s
}
2019-03-27 02:20:43 -07:00
2019-05-25 19:31:41 -07:00
fn handle_debug_immediate(&self, request: DebugAsk) -> DebugResponse {
use DebugAsk::*;
2019-05-25 19:31:41 -07:00
match request {
Timing => DebugResponse { ask: Timing, value: format!("Invalid") },
ByStage { stage_name } => match &stage_name[..] {
"symbol-table" => {
let value = self.symbol_table.borrow().debug_symbol_table();
DebugResponse {
ask: ByStage { stage_name: format!("symbol-table") },
value
}
},
s => {
DebugResponse {
ask: ByStage { stage_name: s.to_string() },
value: format!("Not-implemented")
}
}
}
2019-03-27 02:20:43 -07:00
}
}
}
2019-03-14 00:15:13 -07:00
/// Tokenizing pass: turns source text into a token stream.
///
/// When a debug artifact is requested, every token (rendered with its metadata) is recorded
/// as one comma-separated string. If any token carries an error, the pass fails with the
/// debug-formatted list of all error messages; otherwise the tokens are returned.
fn tokenizing(
    input: &str,
    _handle: &mut Schala,
    comp: Option<&mut PassDebugArtifact>,
) -> Result<Vec<tokenizing::Token>, String> {
    let tokens = tokenizing::tokenize(input);

    if let Some(sink) = comp {
        let rendered = tokens.iter().map(|tok| tok.to_string_with_metadata()).join(", ");
        sink.add_artifact(rendered);
    }

    let errors: Vec<String> = tokens.iter().filter_map(|tok| tok.get_error()).collect();
    if !errors.is_empty() {
        return Err(format!("{:?}", errors));
    }
    Ok(tokens)
}
2019-03-14 00:15:13 -07:00
fn parsing(input: Vec<tokenizing::Token>, handle: &mut Schala, comp: Option<&mut PassDebugArtifact>) -> Result<ast::AST, String> {
2019-01-07 13:00:37 -08:00
use crate::parsing::Parser;
2018-10-20 14:27:00 -07:00
let mut parser = match handle.active_parser.take() {
None => Parser::new(input),
Some(parser) => parser
};
let ast = parser.parse();
2019-06-19 03:27:18 -07:00
let trace = parser.format_parse_trace();
2019-06-14 00:23:32 -07:00
comp.map(|comp| {
2019-06-19 03:27:18 -07:00
let debug_info = match comp.parsing.as_ref().unwrap_or(&ParsingDebugType::CompactAST) {
ParsingDebugType::CompactAST => format!("{:?}", ast),
ParsingDebugType::ExpandedAST => format!("{:#?}", ast),
ParsingDebugType::Trace => format!("{}", trace[0]) //TODO fix this
2018-07-04 19:46:36 -07:00
};
2019-06-19 03:27:18 -07:00
comp.add_artifact(debug_info);
});
2019-01-07 01:52:31 -08:00
ast.map_err(|err| format_parse_error(err, handle))
}
/// Renders a parse error as a multi-line message: the error text, then the offending source
/// line prefixed by its line number, then a `^` marker placed `char_num` columns in.
///
/// The source line is looked up in `handle.source_reference` by the error token's
/// `line_num`; the gutter is padded to the width of the printed line number.
fn format_parse_error(error: parsing::ParseError, handle: &mut Schala) -> String {
    let line_num = error.token.line_num;
    let column = error.token.char_num;

    let source_line = handle.source_reference.get_line(line_num);
    let caret = format!("{}^", " ".repeat(column));
    let gutter = " ".repeat(line_num.to_string().chars().count());

    format!(
        "\n{msg}\n{gutter} |\n{num} | {line}\n{gutter} | {caret}\n",
        msg = error.msg,
        gutter = gutter,
        num = line_num,
        line = source_line,
        caret = caret
    )
}
2019-03-14 00:15:13 -07:00
/// Symbol-table pass: registers the AST's top-level symbols in the shared symbol table.
///
/// On success the AST is passed through unchanged; on failure the error message from
/// `add_top_level_symbols` is returned. The symbol-table dump is only built when a debug
/// artifact was actually requested, as the other passes do for their artifacts.
fn symbol_table(
    input: ast::AST,
    handle: &mut Schala,
    comp: Option<&mut PassDebugArtifact>,
) -> Result<ast::AST, String> {
    // The mutable borrow is a temporary and is released at the end of this statement,
    // before the table is borrowed again for the debug dump below.
    handle.symbol_table.borrow_mut().add_top_level_symbols(&input)?;

    if let Some(comp) = comp {
        let debug = handle.symbol_table.borrow().debug_symbol_table();
        comp.add_artifact(debug);
    }
    Ok(input)
}
2019-03-14 00:15:13 -07:00
/// Type-checking pass: runs the type checker over the AST.
///
/// The outcome is only reported through the debug artifact (the inferred type, or
/// `Type error: <msg>`). A type error does not fail the pass: the AST is always passed
/// through as `Ok`.
fn typechecking(
    input: ast::AST,
    handle: &mut Schala,
    comp: Option<&mut PassDebugArtifact>,
) -> Result<ast::AST, String> {
    let outcome = handle.type_context.typecheck(&input);

    if let Some(sink) = comp {
        let summary = match outcome {
            Ok(ty) => ty.to_string(),
            Err(err) => format!("Type error: {}", err.msg),
        };
        sink.add_artifact(summary);
    }

    Ok(input)
}
2019-03-14 00:15:13 -07:00
/// AST-reduction pass: lowers the AST to a `ReducedAST` using the current symbol table.
///
/// When a debug artifact is requested, the `Debug` rendering of the reduced AST is recorded.
/// This pass always returns `Ok`.
fn ast_reducing(
    input: ast::AST,
    handle: &mut Schala,
    comp: Option<&mut PassDebugArtifact>,
) -> Result<reduced_ast::ReducedAST, String> {
    let table = handle.symbol_table.borrow();
    let reduced = input.reduce(&table);

    if let Some(sink) = comp {
        sink.add_artifact(format!("{:?}", reduced));
    }
    Ok(reduced)
}
2019-03-14 00:15:13 -07:00
/// Evaluation pass: runs the reduced AST through the AST-walking interpreter.
///
/// When a debug artifact is requested, the interpreter state is dumped *before* evaluation.
/// The individual evaluation outputs are joined with newlines; the first error among them,
/// if any, becomes the result of the pass.
fn eval(
    input: reduced_ast::ReducedAST,
    handle: &mut Schala,
    comp: Option<&mut PassDebugArtifact>,
) -> Result<String, String> {
    if let Some(sink) = comp {
        sink.add_artifact(handle.state.debug_print());
    }

    // NOTE(review): the meaning of the `true` flag is defined by `eval::State::evaluate`,
    // which is not visible here.
    let lines = handle
        .state
        .evaluate(input, true)
        .into_iter()
        .collect::<Result<Vec<String>, String>>()?;
    Ok(lines.join("\n"))
}
2018-05-09 02:02:17 -07:00
2019-01-10 00:31:37 -08:00
/// Keeps the lines of the most recently loaded source text so that individual lines can be
/// quoted later (e.g. in error messages).
struct SourceReference {
    /// `None` until a source has been loaded; afterwards one entry per source line.
    lines: Option<Vec<String>>,
}

impl SourceReference {
    /// Creates a reference with no source loaded.
    fn new() -> SourceReference {
        SourceReference { lines: None }
    }

    /// Replaces any previously stored source with the lines of `source`.
    fn load_new_source(&mut self, source: &str) {
        //TODO this is a lot of heap allocations - maybe there's a way to make it more efficient?
        let owned_lines: Vec<String> = source.lines().map(String::from).collect();
        self.lines = Some(owned_lines);
    }

    /// Returns a copy of the line at zero-based index `line`, or the placeholder
    /// `"NO LINE FOUND"` when no source is loaded or the index is out of range.
    fn get_line(&self, line: usize) -> String {
        match self.lines.as_ref().and_then(|stored| stored.get(line)) {
            Some(text) => text.clone(),
            None => String::from("NO LINE FOUND"),
        }
    }
}
2019-06-19 03:27:18 -07:00
/// Selects what the parsing pass records as its debug artifact.
enum ParsingDebugType {
/// The parse result rendered with compact `{:?}` formatting.
CompactAST,
/// The parse result rendered with pretty-printed `{:#?}` formatting.
ExpandedAST,
/// An entry from the parser's formatted parse trace instead of the AST.
Trace
}
2019-05-27 15:06:50 -07:00
#[derive(Default)]
2019-03-14 00:15:13 -07:00
struct PassDebugArtifact {
2019-06-19 03:27:18 -07:00
parsing: Option<ParsingDebugType>,
2019-05-27 15:06:50 -07:00
artifacts: Vec<String>
2019-06-19 03:27:18 -07:00
2019-03-14 00:15:13 -07:00
}
impl PassDebugArtifact {
fn add_artifact(&mut self, artifact: String) {
2019-05-27 15:06:50 -07:00
self.artifacts.push(artifact)
2019-03-14 00:15:13 -07:00
}
}
2019-05-25 20:09:11 -07:00
/// Names of the compiler passes, in the order in which they run.
fn stage_names() -> Vec<&'static str> {
    const STAGES: [&str; 6] = [
        "tokenizing",
        "parsing",
        "symbol-table",
        "typechecking",
        "ast-reduction",
        "ast-walking-evaluation",
    ];
    STAGES.to_vec()
}
2019-05-27 15:06:50 -07:00
impl ProgrammingLanguageInterface for Schala {
fn get_language_name(&self) -> String { format!("Schala") }
fn get_source_file_suffix(&self) -> String { format!("schala") }
fn run_computation(&mut self, request: ComputationRequest) -> ComputationResponse {
struct PassToken<'a> {
schala: &'a mut Schala,
stage_durations: &'a mut Vec<(String, Duration)>,
sw: &'a Stopwatch,
2019-05-28 03:41:49 -07:00
debug_requests: &'a HashSet<DebugAsk>,
debug_responses: &'a mut Vec<DebugResponse>,
}
fn output_wrapper<Input, Output, F>(n: usize, func: F, input: Input, tok: &mut PassToken) -> Result<Output, String>
where F: Fn(Input, &mut Schala, Option<&mut PassDebugArtifact>) -> Result<Output, String>
2019-05-27 15:06:50 -07:00
{
let stage_names = stage_names();
2019-06-18 18:11:17 -07:00
let ask = DebugAsk::ByStage { stage_name: stage_names[n].to_string() };
2019-06-19 03:27:18 -07:00
let mut debug_artifact = tok.debug_requests.get(&ask).map(|_|
PassDebugArtifact {
parsing: if stage_names[n] == "parsing" { Some(ParsingDebugType::CompactAST) } else { None },
..Default::default()
}
);
let output = func(input, tok.schala, debug_artifact.as_mut());
2019-06-18 18:11:17 -07:00
tok.stage_durations.push((stage_names[n].to_string(), tok.sw.elapsed()));
2019-05-28 03:41:49 -07:00
if let Some(artifact) = debug_artifact {
for value in artifact.artifacts.into_iter() {
2019-06-18 18:11:17 -07:00
let resp = DebugResponse { ask: ask.clone(), value };
2019-05-28 03:41:49 -07:00
tok.debug_responses.push(resp);
}
}
2019-05-27 15:06:50 -07:00
output
}
let ComputationRequest { source, debug_requests } = request;
self.source_reference.load_new_source(source);
2019-05-21 02:06:34 -07:00
let sw = Stopwatch::start_new();
2019-05-25 20:09:11 -07:00
let mut stage_durations = Vec::new();
2019-05-28 03:41:49 -07:00
let mut debug_responses = Vec::new();
let mut tok = PassToken { schala: self, stage_durations: &mut stage_durations, sw: &sw, debug_requests: &debug_requests, debug_responses: &mut debug_responses };
2019-05-25 20:09:11 -07:00
2019-05-27 15:06:50 -07:00
let main_output: Result<String, String> = Ok(source)
.and_then(|source| output_wrapper(0, tokenizing, source, &mut tok))
.and_then(|tokens| output_wrapper(1, parsing, tokens, &mut tok))
.and_then(|ast| output_wrapper(2, symbol_table, ast, &mut tok))
.and_then(|ast| output_wrapper(3, typechecking, ast, &mut tok))
.and_then(|ast| output_wrapper(4, ast_reducing, ast, &mut tok))
.and_then(|reduced_ast| output_wrapper(5, eval, reduced_ast, &mut tok));
2019-05-21 02:46:07 -07:00
let total_duration = sw.elapsed();
2019-05-21 02:06:34 -07:00
let global_output_stats = GlobalOutputStats {
2019-05-25 20:09:11 -07:00
total_duration, stage_durations
2019-05-21 02:06:34 -07:00
};
ComputationResponse {
main_output,
2019-05-21 02:06:34 -07:00
global_output_stats,
2019-05-28 03:41:49 -07:00
debug_responses,
}
}
2019-03-19 19:26:05 -07:00
fn request_meta(&mut self, request: LangMetaRequest) -> LangMetaResponse {
match request {
2019-05-25 20:09:11 -07:00
LangMetaRequest::StageNames => LangMetaResponse::StageNames(stage_names().iter().map(|s| s.to_string()).collect()),
2019-03-19 19:26:05 -07:00
LangMetaRequest::Docs { source } => self.handle_docs(source),
2019-03-27 02:20:43 -07:00
LangMetaRequest::ImmediateDebug(debug_request) =>
LangMetaResponse::ImmediateDebug(self.handle_debug_immediate(debug_request)),
2019-03-19 19:26:05 -07:00
LangMetaRequest::Custom { .. } => LangMetaResponse::Custom { kind: format!("not-implemented"), value: format!("") }
}
}
}