schala/schala-lang/language/src/schala.rs

219 lines
7.4 KiB
Rust
Raw Normal View History

2021-10-19 20:50:43 -07:00
use schala_repl::{
ComputationRequest, ComputationResponse, GlobalOutputStats, LangMetaRequest, LangMetaResponse,
ProgrammingLanguageInterface,
};
2021-10-27 00:39:08 -07:00
use stopwatch::Stopwatch;
use crate::{
error::SchalaError, parsing, reduced_ir, symbol_table, tokenizing, tree_walk_eval, type_inference,
2021-10-27 00:39:08 -07:00
};
/// All the state necessary to parse and execute a Schala program are stored in this struct.
pub struct Schala<'a> {
2021-10-19 20:50:43 -07:00
/// Holds a reference to the original source code, parsed into line and character
source_reference: SourceReference,
//state: eval::State<'static>,
2021-10-19 20:50:43 -07:00
/// Keeps track of symbols and scopes
symbol_table: symbol_table::SymbolTable,
/// Contains information for type-checking
type_context: type_inference::TypeContext,
2021-10-19 20:50:43 -07:00
/// Schala Parser
active_parser: parsing::Parser,
/// Execution state for AST-walking interpreter
eval_state: tree_walk_eval::State<'a>,
2021-11-02 23:34:14 -07:00
timings: Vec<(&'static str, std::time::Duration)>,
}
/*
impl Schala {
2021-10-19 20:50:43 -07:00
//TODO implement documentation for language items
/*
fn handle_docs(&self, source: String) -> LangMetaResponse {
LangMetaResponse::Docs {
doc_string: format!("Schala item `{}` : <<Schala-lang documentation not yet implemented>>", source)
}
}
2021-10-19 20:50:43 -07:00
*/
}
*/
impl<'a> Schala<'a> {
2021-10-19 20:50:43 -07:00
/// Creates a new Schala environment *without* any prelude.
fn new_blank_env() -> Schala<'a> {
2021-10-19 20:50:43 -07:00
Schala {
source_reference: SourceReference::new(),
symbol_table: symbol_table::SymbolTable::new(),
type_context: type_inference::TypeContext::new(),
2021-10-19 20:50:43 -07:00
active_parser: parsing::Parser::new(),
eval_state: tree_walk_eval::State::new(),
2021-11-02 23:34:14 -07:00
timings: Vec::new(),
2021-10-19 20:50:43 -07:00
}
}
2021-10-13 23:45:54 -07:00
2021-10-19 20:50:43 -07:00
/// Creates a new Schala environment with the standard prelude, which is defined as ordinary
/// Schala code in the file `prelude.schala`
#[allow(clippy::new_without_default)]
pub fn new() -> Schala<'a> {
2021-10-19 20:50:43 -07:00
let prelude = include_str!("../source-files/prelude.schala");
let mut env = Schala::new_blank_env();
let response = env.run_pipeline(prelude, SchalaConfig::default());
2021-10-19 20:50:43 -07:00
if let Err(err) = response {
panic!("Error in prelude, panicking: {}", err.display());
}
env
}
2021-10-13 23:45:54 -07:00
2021-10-19 20:50:43 -07:00
/// This is where the actual action of interpreting/compilation happens.
/// Note: this should eventually use a query-based system for parallelization, cf.
/// https://rustc-dev-guide.rust-lang.org/overview.html
fn run_pipeline(&mut self, source: &str, config: SchalaConfig) -> Result<String, SchalaError> {
2021-11-02 23:34:14 -07:00
self.timings = vec![];
let sw = Stopwatch::start_new();
2021-10-19 20:50:43 -07:00
// 1st stage - tokenization
// TODO tokenize should return its own error type
let tokens = tokenizing::tokenize(source);
if let Some(err) = SchalaError::from_tokens(&tokens) {
return Err(err);
}
//2nd stage - parsing
self.active_parser.add_new_tokens(tokens);
let ast = self
.active_parser
.parse()
.map_err(|err| SchalaError::from_parse_error(err, &self.source_reference))?;
2021-11-02 23:34:14 -07:00
self.timings.push(("parsing", sw.elapsed()));
2021-10-19 20:50:43 -07:00
2021-11-02 23:34:14 -07:00
let sw = Stopwatch::start_new();
2021-10-19 20:50:43 -07:00
//Perform all symbol table work
2021-10-27 15:39:09 -07:00
self.symbol_table
.process_ast(&ast, &mut self.type_context)
.map_err(SchalaError::from_symbol_table)?;
2021-10-19 20:50:43 -07:00
2021-11-02 23:34:14 -07:00
self.timings.push(("symbol_table", sw.elapsed()));
2021-10-19 20:50:43 -07:00
// Typechecking
// TODO typechecking not working
//let _overall_type = self.type_context.typecheck(&ast).map_err(SchalaError::from_type_error);
2021-10-19 20:50:43 -07:00
2021-11-02 23:34:14 -07:00
let sw = Stopwatch::start_new();
2021-10-29 22:03:34 -07:00
let reduced_ir = reduced_ir::reduce(&ast, &self.symbol_table, &self.type_context);
2021-11-02 23:34:14 -07:00
self.timings.push(("reduced_ir", sw.elapsed()));
2021-11-02 23:34:14 -07:00
let sw = Stopwatch::start_new();
let evaluation_outputs = self.eval_state.evaluate(reduced_ir, &self.type_context, config.repl);
2021-11-02 23:34:14 -07:00
self.timings.push(("tree-walking-evaluation", sw.elapsed()));
let text_output: Result<Vec<String>, String> = evaluation_outputs.into_iter().collect();
let text_output: Result<Vec<String>, SchalaError> =
text_output.map_err(|err| SchalaError::from_string(err, Stage::Evaluation));
let eval_output: String =
text_output.map(|v| Iterator::intersperse(v.into_iter(), "\n".to_owned()).collect())?;
Ok(eval_output)
2021-10-19 20:50:43 -07:00
}
}
/// Represents lines of source code: the most recently loaded source text together with the
/// byte offsets of its newline characters, so individual lines can be recovered.
pub(crate) struct SourceReference {
    /// The text given to the most recent `load_new_source` call, or `None` before the first one.
    last_source: Option<String>,
    /// Offsets in *bytes* (not chars) of each newline character in `last_source`, ascending.
    newline_offsets: Vec<usize>,
}

impl SourceReference {
    /// Creates an empty reference with no source loaded.
    fn new() -> SourceReference {
        SourceReference { last_source: None, newline_offsets: vec![] }
    }

    /// Replaces the stored source with `source` and recomputes the newline offsets.
    fn load_new_source(&mut self, source: &str) {
        // Offsets from a previously loaded source must not leak into the new one.
        self.newline_offsets.clear();
        self.newline_offsets.extend(
            source.bytes().enumerate().filter(|&(_, byte)| byte == b'\n').map(|(offset, _)| offset),
        );
        self.last_source = Some(source.to_string());
    }

    /// Returns the text of line number `line` of the stored source, without its trailing
    /// newline.
    ///
    /// NOTE(review): `line` is treated as a zero-based index (line 0 is the text before the
    /// first newline) — confirm this matches the line numbers callers pass in.
    ///
    /// Returns an empty string when no source has been loaded or when `line` is past the last
    /// line, rather than panicking.
    pub fn get_line(&self, line: usize) -> String {
        let source = match self.last_source.as_deref() {
            Some(source) => source,
            None => return String::new(),
        };

        // A line starts right after the previous line's newline; line 0 starts at byte 0.
        let start = match line.checked_sub(1) {
            None => 0,
            Some(previous) => match self.newline_offsets.get(previous) {
                Some(newline) => newline + 1,
                None => return String::new(),
            },
        };
        // A line ends at its own newline, or at the end of the source for the last line.
        let end = self.newline_offsets.get(line).copied().unwrap_or(source.len());

        // Both bounds sit next to an ASCII `\n` byte (or at the ends of the string), so they
        // are always valid UTF-8 char boundaries and this slice cannot panic.
        source[start..end].to_string()
    }
}
2021-10-14 04:11:53 -07:00
/// Names a phase of the interpreter pipeline. In this file it is used to tag errors, e.g.
/// `SchalaError::from_string(err, Stage::Evaluation)`.
// Not every variant is constructed in this file, hence the `dead_code` allowance.
#[allow(dead_code)]
#[derive(Clone, Copy, Debug)]
pub(crate) enum Stage {
    Tokenizing,
    Parsing,
    Symbols,
    ScopeResolution,
    Typechecking,
    AstReduction,
    Evaluation,
}
/// Returns the stage names reported in response to `LangMetaRequest::StageNames`.
///
/// NOTE(review): these names are not the same strings as the labels `run_pipeline` records
/// in `timings` ("parsing", "symbol_table", "reduced_ir", "tree-walking-evaluation") —
/// confirm whether consumers expect the two sets to line up.
fn stage_names() -> Vec<&'static str> {
    vec![
        "tokenizing",
        "parsing",
        "symbol-table",
        "typechecking",
        "ast-reduction",
        "ast-walking-evaluation",
    ]
}
/// Per-request configuration for the Schala pipeline; this is the `Config` type of the
/// `ProgrammingLanguageInterface` implementation for `Schala`.
#[derive(Clone, Default)]
pub struct SchalaConfig {
    /// Forwarded as the last argument to the evaluator's `evaluate` call. Defaults to `false`.
    /// Presumably signals that code is being run from an interactive REPL — TODO confirm.
    pub repl: bool,
}
impl<'a> ProgrammingLanguageInterface for Schala<'a> {
2021-10-21 10:45:14 -07:00
//TODO flesh out Config
type Config = SchalaConfig;
2021-10-19 20:50:43 -07:00
fn language_name() -> String {
"Schala".to_owned()
}
fn source_file_suffix() -> String {
"schala".to_owned()
}
2021-10-27 00:39:08 -07:00
fn run_computation(&mut self, request: ComputationRequest<Self::Config>) -> ComputationResponse {
let ComputationRequest { source, debug_requests: _, config: _ } = request;
2021-10-19 20:50:43 -07:00
self.source_reference.load_new_source(source);
let sw = Stopwatch::start_new();
let main_output =
self.run_pipeline(source, request.config).map_err(|schala_err| schala_err.display());
2021-11-02 23:34:14 -07:00
let total_duration = sw.elapsed();
2021-10-19 20:50:43 -07:00
2021-11-02 23:34:14 -07:00
let stage_durations: Vec<_> = std::mem::replace(&mut self.timings, vec![])
.into_iter()
.map(|(label, duration)| (label.to_string(), duration))
.collect();
let global_output_stats = GlobalOutputStats { total_duration, stage_durations };
2021-10-19 20:50:43 -07:00
2021-10-27 00:39:08 -07:00
ComputationResponse { main_output, global_output_stats, debug_responses: vec![] }
2021-10-13 23:45:54 -07:00
}
2021-10-19 20:50:43 -07:00
fn request_meta(&mut self, request: LangMetaRequest) -> LangMetaResponse {
match request {
2021-10-27 00:39:08 -07:00
LangMetaRequest::StageNames =>
LangMetaResponse::StageNames(stage_names().iter().map(|s| s.to_string()).collect()),
_ => LangMetaResponse::Custom { kind: "not-implemented".to_string(), value: "".to_string() },
2021-10-19 20:50:43 -07:00
}
}
}