diff --git a/Cargo.lock b/Cargo.lock index 77339f6fd7..0db81d7831 100644 --- a/Cargo.lock +++ b/Cargo.lock @@ -1242,6 +1242,18 @@ name = "lazycell" version = "1.2.1" source = "registry+https://github.com/rust-lang/crates.io-index" +[[package]] +name = "lexical-core" +version = "0.4.1" +source = "registry+https://github.com/rust-lang/crates.io-index" +dependencies = [ + "cfg-if 0.1.9 (registry+https://github.com/rust-lang/crates.io-index)", + "rustc_version 0.2.3 (registry+https://github.com/rust-lang/crates.io-index)", + "ryu 0.2.8 (registry+https://github.com/rust-lang/crates.io-index)", + "stackvector 1.0.6 (registry+https://github.com/rust-lang/crates.io-index)", + "static_assertions 0.2.5 (registry+https://github.com/rust-lang/crates.io-index)", +] + [[package]] name = "libc" version = "0.2.58" @@ -1522,21 +1534,23 @@ dependencies = [ ] [[package]] -name = "nom-trace" -version = "0.1.0" -source = "git+https://github.com/pythondude325/nom-trace.git#02f45edd3aa4ca9c82addb9c9a22e81044536e99" +name = "nom" +version = "5.0.0-beta2" +source = "registry+https://github.com/rust-lang/crates.io-index" dependencies = [ - "nom 4.2.3 (registry+https://github.com/rust-lang/crates.io-index)", + "lexical-core 0.4.1 (registry+https://github.com/rust-lang/crates.io-index)", + "memchr 2.2.0 (registry+https://github.com/rust-lang/crates.io-index)", + "version_check 0.1.5 (registry+https://github.com/rust-lang/crates.io-index)", ] [[package]] name = "nom_locate" version = "0.3.1" -source = "registry+https://github.com/rust-lang/crates.io-index" +source = "git+https://github.com/wycats/nom_locate.git?branch=nom5#9383cc779b23a746ff68cc7094d9ed7baaa661b2" dependencies = [ "bytecount 0.3.2 (registry+https://github.com/rust-lang/crates.io-index)", "memchr 2.2.0 (registry+https://github.com/rust-lang/crates.io-index)", - "nom 4.2.3 (registry+https://github.com/rust-lang/crates.io-index)", + "nom 5.0.0-beta2 (registry+https://github.com/rust-lang/crates.io-index)", ] [[package]] @@ -1575,9 +1589,8 @@ dependencies = [ "log 0.4.6 (registry+https://github.com/rust-lang/crates.io-index)", "logos 0.10.0-rc2 (registry+https://github.com/rust-lang/crates.io-index)", "logos-derive 0.10.0-rc2 (registry+https://github.com/rust-lang/crates.io-index)", - "nom 4.2.3 (registry+https://github.com/rust-lang/crates.io-index)", - "nom-trace 0.1.0 (git+https://github.com/pythondude325/nom-trace.git)", - "nom_locate 0.3.1 (registry+https://github.com/rust-lang/crates.io-index)", + "nom 5.0.0-beta2 (registry+https://github.com/rust-lang/crates.io-index)", + "nom_locate 0.3.1 (git+https://github.com/wycats/nom_locate.git?branch=nom5)", "ordered-float 1.0.2 (registry+https://github.com/rust-lang/crates.io-index)", "pancurses 0.16.1 (registry+https://github.com/rust-lang/crates.io-index)", "pretty 0.5.2 (registry+https://github.com/rust-lang/crates.io-index)", @@ -1589,7 +1602,7 @@ dependencies = [ "regex 1.1.7 (registry+https://github.com/rust-lang/crates.io-index)", "reqwest 0.9.18 (registry+https://github.com/rust-lang/crates.io-index)", "roxmltree 0.6.1 (registry+https://github.com/rust-lang/crates.io-index)", - "rustyline 5.0.0 (git+https://github.com/kkawakam/rustyline.git)", + "rustyline 5.0.0 (registry+https://github.com/rust-lang/crates.io-index)", "serde 1.0.92 (registry+https://github.com/rust-lang/crates.io-index)", "serde-hjson 0.9.0 (registry+https://github.com/rust-lang/crates.io-index)", "serde_derive 1.0.92 (registry+https://github.com/rust-lang/crates.io-index)", @@ -2319,7 +2332,7 @@ dependencies = [ [[package]] name = "rustyline" version = "5.0.0" -source = "git+https://github.com/kkawakam/rustyline.git#70e45caf47b699e43bec0d2fb722aae2cdad602f" +source = "registry+https://github.com/rust-lang/crates.io-index" dependencies = [ "dirs 2.0.1 (registry+https://github.com/rust-lang/crates.io-index)", "libc 0.2.58 (registry+https://github.com/rust-lang/crates.io-index)", @@ -2573,6 +2586,20 @@ name = "stable_deref_trait" version = "1.1.1" source = "registry+https://github.com/rust-lang/crates.io-index" +[[package]] +name = "stackvector" +version = "1.0.6" +source = "registry+https://github.com/rust-lang/crates.io-index" +dependencies = [ + "rustc_version 0.2.3 (registry+https://github.com/rust-lang/crates.io-index)", + "unreachable 1.0.0 (registry+https://github.com/rust-lang/crates.io-index)", +] + +[[package]] +name = "static_assertions" +version = "0.2.5" +source = "registry+https://github.com/rust-lang/crates.io-index" + [[package]] name = "string" version = "0.2.0" @@ -3019,6 +3046,14 @@ name = "unicode-xid" version = "0.1.0" source = "registry+https://github.com/rust-lang/crates.io-index" +[[package]] +name = "unreachable" +version = "1.0.0" +source = "registry+https://github.com/rust-lang/crates.io-index" +dependencies = [ + "void 1.0.2 (registry+https://github.com/rust-lang/crates.io-index)", +] + [[package]] name = "url" version = "1.7.2" @@ -3335,6 +3370,7 @@ dependencies = [ "checksum lazy_static 0.2.11 (registry+https://github.com/rust-lang/crates.io-index)" = "76f033c7ad61445c5b347c7382dd1237847eb1bce590fe50365dcb33d546be73" "checksum lazy_static 1.3.0 (registry+https://github.com/rust-lang/crates.io-index)" = "bc5729f27f159ddd61f4df6228e827e86643d4d3e7c32183cb30a1c08f604a14" "checksum lazycell 1.2.1 (registry+https://github.com/rust-lang/crates.io-index)" = "b294d6fa9ee409a054354afc4352b0b9ef7ca222c69b8812cbea9e7d2bf3783f" +"checksum lexical-core 0.4.1 (registry+https://github.com/rust-lang/crates.io-index)" = "9d224b31f370c8dfc0dea1932d9e6bd451e65aef6f5f2318846664c04b42a796" "checksum libc 0.2.58 (registry+https://github.com/rust-lang/crates.io-index)" = "6281b86796ba5e4366000be6e9e18bf35580adf9e63fbe2294aadb587613a319" "checksum libgit2-sys 0.8.1 (registry+https://github.com/rust-lang/crates.io-index)" = "941a41e23f77323b8c9d2ee118aec9ee39dfc176078c18b4757d3bad049d9ff7" "checksum libssh2-sys 0.2.11 (registry+https://github.com/rust-lang/crates.io-index)" = "126a1f4078368b163bfdee65fbab072af08a1b374a5551b21e87ade27b1fbf9d" @@ -3365,8 +3401,8 @@ dependencies = [ "checksum nix 0.14.1 (registry+https://github.com/rust-lang/crates.io-index)" = "6c722bee1037d430d0f8e687bbdbf222f27cc6e4e68d5caf630857bb2b6dbdce" "checksum nodrop 0.1.13 (registry+https://github.com/rust-lang/crates.io-index)" = "2f9667ddcc6cc8a43afc9b7917599d7216aa09c463919ea32c59ed6cac8bc945" "checksum nom 4.2.3 (registry+https://github.com/rust-lang/crates.io-index)" = "2ad2a91a8e869eeb30b9cb3119ae87773a8f4ae617f41b1eb9c154b2905f7bd6" -"checksum nom-trace 0.1.0 (git+https://github.com/pythondude325/nom-trace.git)" = "" -"checksum nom_locate 0.3.1 (registry+https://github.com/rust-lang/crates.io-index)" = "6a47c112b3861d81f7fbf73892b9271af933af32bd5dee6889aa3c3fa9caed7e" +"checksum nom 5.0.0-beta2 (registry+https://github.com/rust-lang/crates.io-index)" = "cfa215de9f747c2b3290ceee185976eb6ffc936087e19d810b57ba3ff85ae28c" +"checksum nom_locate 0.3.1 (git+https://github.com/wycats/nom_locate.git?branch=nom5)" = "" "checksum num 0.2.0 (registry+https://github.com/rust-lang/crates.io-index)" = "cf4825417e1e1406b3782a8ce92f4d53f26ec055e3622e1881ca8e9f5f9e08db" "checksum num-complex 0.2.3 (registry+https://github.com/rust-lang/crates.io-index)" = "fcb0cf31fb3ff77e6d2a6ebd6800df7fdcd106f2ad89113c9130bcd07f93dffc" "checksum num-integer 0.1.41 (registry+https://github.com/rust-lang/crates.io-index)" = "b85e541ef8255f6cf42bbfe4ef361305c6c135d10919ecc26126c4e5ae94bc09" @@ -3442,7 +3478,7 @@ dependencies = [ "checksum rustc-demangle 0.1.15 (registry+https://github.com/rust-lang/crates.io-index)" = "a7f4dccf6f4891ebcc0c39f9b6eb1a83b9bf5d747cb439ec6fba4f3b977038af" "checksum rustc-hash 1.0.1 (registry+https://github.com/rust-lang/crates.io-index)" = "7540fc8b0c49f096ee9c961cda096467dce8084bec6bdca2fc83895fd9b28cb8" "checksum rustc_version 0.2.3 (registry+https://github.com/rust-lang/crates.io-index)" = "138e3e0acb6c9fb258b19b67cb8abd63c00679d2851805ea151465464fe9030a" -"checksum rustyline 5.0.0 (git+https://github.com/kkawakam/rustyline.git)" = "" +"checksum rustyline 5.0.0 (registry+https://github.com/rust-lang/crates.io-index)" = "67e12e40e0240de07f0dab4f4dd01bdb15d74dc977026d4ba91666c41c679ade" "checksum ryu 0.2.8 (registry+https://github.com/rust-lang/crates.io-index)" = "b96a9549dc8d48f2c283938303c4b5a77aa29bfbc5b54b084fb1630408899a8f" "checksum safemem 0.3.0 (registry+https://github.com/rust-lang/crates.io-index)" = "8dca453248a96cb0749e36ccdfe2b0b4e54a61bfef89fb97ec621eb8e0a93dd9" "checksum same-file 1.0.4 (registry+https://github.com/rust-lang/crates.io-index)" = "8f20c4be53a8a1ff4c1f1b2bd14570d2f634628709752f0702ecdd2b3f9a5267" @@ -3474,6 +3510,8 @@ dependencies = [ "checksum slab 0.4.2 (registry+https://github.com/rust-lang/crates.io-index)" = "c111b5bd5695e56cffe5129854aa230b39c93a305372fdbb2668ca2394eea9f8" "checksum smallvec 0.6.10 (registry+https://github.com/rust-lang/crates.io-index)" = "ab606a9c5e214920bb66c458cd7be8ef094f813f20fe77a54cc7dbfff220d4b7" "checksum stable_deref_trait 1.1.1 (registry+https://github.com/rust-lang/crates.io-index)" = "dba1a27d3efae4351c8051072d619e3ade2820635c3958d826bfea39d59b54c8" +"checksum stackvector 1.0.6 (registry+https://github.com/rust-lang/crates.io-index)" = "1c4725650978235083241fab0fdc8e694c3de37821524e7534a1a9061d1068af" +"checksum static_assertions 0.2.5 (registry+https://github.com/rust-lang/crates.io-index)" = "c19be23126415861cb3a23e501d34a708f7f9b2183c5252d690941c2e69199d5" "checksum string 0.2.0 (registry+https://github.com/rust-lang/crates.io-index)" = "d0bbfb8937e38e34c3444ff00afb28b0811d9554f15c5ad64d12b0308d1d1995" "checksum strsim 0.7.0 (registry+https://github.com/rust-lang/crates.io-index)" = "bb4f380125926a99e52bc279241539c018323fab05ad6368b56f93d9369ff550" "checksum strsim 0.8.0 (registry+https://github.com/rust-lang/crates.io-index)" = "8ea5119cdb4c55b55d432abb513a0429384878c15dde60cc77b1c99de1a95a6a" @@ -3521,6 +3559,7 @@ dependencies = [ "checksum unicode-segmentation 1.3.0 (registry+https://github.com/rust-lang/crates.io-index)" = "1967f4cdfc355b37fd76d2a954fb2ed3871034eb4f26d60537d88795cfc332a9" "checksum unicode-width 0.1.5 (registry+https://github.com/rust-lang/crates.io-index)" = "882386231c45df4700b275c7ff55b6f3698780a650026380e72dabe76fa46526" "checksum unicode-xid 0.1.0 (registry+https://github.com/rust-lang/crates.io-index)" = "fc72304796d0818e357ead4e000d19c9c174ab23dc11093ac919054d20a6a7fc" +"checksum unreachable 1.0.0 (registry+https://github.com/rust-lang/crates.io-index)" = "382810877fe448991dfc7f0dd6e3ae5d58088fd0ea5e35189655f84e6814fa56" "checksum url 1.7.2 (registry+https://github.com/rust-lang/crates.io-index)" = "dd4e7c0d531266369519a4aa4f399d748bd37043b00bde1e4ff1f60a120b355a" "checksum utf8-ranges 1.0.3 (registry+https://github.com/rust-lang/crates.io-index)" = "9d50aa7650df78abf942826607c62468ce18d9019673d4a2ebe1865dbb96ffde" "checksum utf8parse 0.1.1 (registry+https://github.com/rust-lang/crates.io-index)" = "8772a4ccbb4e89959023bc5b7cb8623a795caa7092d99f3aa9501b9484d4557d" diff --git a/Cargo.toml b/Cargo.toml index ba0b3b98f9..1d48b667c5 100644 --- a/Cargo.toml +++ b/Cargo.toml @@ -10,7 +10,7 @@ edition = "2018" [dependencies] #rustyline = "4.1.0" -rustyline = { git ="https://github.com/kkawakam/rustyline.git" } +rustyline = "5.0.0" sysinfo = "0.8.5" chrono = { version = "0.4.6", features = ["serde"] } chrono-tz = "0.5.1" @@ -19,7 +19,7 @@ prettytable-rs = "0.8.0" itertools = "0.8.0" ansi_term = "0.11.0" conch-parser = "0.1.1" -nom = "4.2.3" +nom = "5.0.0-beta2" dunce = "1.0.0" indexmap = { version = "1.0.2", features = ["serde-1"] } chrono-humanize = "0.0.11" @@ -61,11 +61,10 @@ clipboard = "0.5" reqwest = "0.9" roxmltree = "0.6.0" pretty = "0.5.2" -nom_locate = "0.3.1" +nom_locate = { git = "https://github.com/wycats/nom_locate.git", branch = "nom5" } derive_more = "0.15.0" enum-utils = "0.1.0" unicode-xid = "0.1.0" -nom-trace = { version = "0.1.0", git = "https://github.com/pythondude325/nom-trace.git" } serde_ini = "0.2.0" subprocess = "0.1.18" sys-info = "0.5.7" diff --git a/src/cli.rs b/src/cli.rs index 1dbba22c02..82dc18f7c9 100644 --- a/src/cli.rs +++ b/src/cli.rs @@ -11,14 +11,14 @@ use crate::commands::classified::{ use crate::context::Context; crate use crate::errors::ShellError; use crate::evaluate::Scope; +use crate::parser::parse2::span::Spanned; +use crate::parser::parse2::{PipelineElement, TokenNode}; +use crate::parser::registry; use crate::git::current_branch; use crate::object::Value; -use crate::parser::ast::{Expression, Leaf, RawExpression}; -use crate::parser::lexer::Spanned; -use crate::parser::{Args, Pipeline}; -use log::debug; +use log::{debug, trace}; use rustyline::error::ReadlineError; use rustyline::{self, ColorMode, Config, Editor}; @@ -62,19 +62,21 @@ pub async fn cli() -> Result<(), Box> { command("from-xml", from_xml::from_xml), command("from-yaml", from_yaml::from_yaml), command("get", get::get), - command("open", open::open), command("enter", enter::enter), command("exit", exit::exit), command("lines", lines::lines), command("pick", pick::pick), command("split-column", split_column::split_column), command("split-row", split_row::split_row), + command("lines", lines::lines), command("reject", reject::reject), command("trim", trim::trim), command("to-array", to_array::to_array), command("to-ini", to_ini::to_ini), command("to-json", to_json::to_json), command("to-toml", to_toml::to_toml), + command("sort-by", sort_by::sort_by), + Arc::new(Open), Arc::new(Where), Arc::new(Config), Arc::new(SkipWhile), @@ -159,7 +161,7 @@ pub async fn cli() -> Result<(), Box> { let host = context.host.lock().unwrap(); let writer = host.err_termcolor(); line.push_str(" "); - let files = crate::parser::span::Files::new(line); + let files = crate::parser::Files::new(line); language_reporting::emit( &mut writer.lock(), @@ -258,7 +260,7 @@ async fn process_line(readline: Result, ctx: &mut Context debug!("=== Parsed ==="); debug!("{:#?}", result); - let mut pipeline = classify_pipeline(&result, ctx)?; + let mut pipeline = classify_pipeline(&result, ctx, &line)?; match pipeline.commands.last() { Some(ClassifiedCommand::Sink(_)) => {} @@ -266,9 +268,9 @@ async fn process_line(readline: Result, ctx: &mut Context _ => pipeline.commands.push(ClassifiedCommand::Sink(SinkCommand { command: sink("autoview", autoview::autoview), name_span: None, - args: Args { - positional: vec![], - named: indexmap::IndexMap::new(), + args: registry::Args { + positional: None, + named: None, }, })), } @@ -371,14 +373,15 @@ async fn process_line(readline: Result, ctx: &mut Context } fn classify_pipeline( - pipeline: &Pipeline, + pipeline: &TokenNode, context: &Context, + source: &str, ) -> Result { - let commands: Result, _> = pipeline - .commands + let pipeline = pipeline.as_pipeline()?; + + let commands: Result, ShellError> = pipeline .iter() - .cloned() - .map(|item| classify_command(&item, context)) + .map(|item| classify_command(&item, context, source)) .collect(); Ok(ClassifiedPipeline { @@ -387,85 +390,69 @@ fn classify_pipeline( } fn classify_command( - command: &Expression, + command: &PipelineElement, context: &Context, + source: &str, ) -> Result { - // let command_name = &command.name[..]; - // let args = &command.args; + let call = command.call(); - if let Expression { - expr: RawExpression::Call(call), - .. - } = command - { - match (&call.name, &call.args) { - ( - Expression { - expr: RawExpression::Leaf(Leaf::Bare(name)), - span, - }, - args, - ) => match context.has_command(&name.to_string()) { + match call { + call if call.head().is_bare() => { + let head = call.head(); + let name = head.source(source); + + match context.has_command(name) { true => { - let command = context.get_command(&name.to_string()); + let command = context.get_command(name); let config = command.config(); let scope = Scope::empty(); - let args = match args { - Some(args) => config.evaluate_args(args.iter(), &scope)?, - None => Args::default(), - }; + trace!("classifying {:?}", config); + + let args = config.evaluate_args(call, context, &scope, source)?; Ok(ClassifiedCommand::Internal(InternalCommand { command, - name_span: Some(span.clone()), + name_span: Some(head.span().clone()), args, })) } - false => match context.has_sink(&name.to_string()) { + false => match context.has_sink(name) { true => { - let command = context.get_sink(&name.to_string()); + let command = context.get_sink(name); let config = command.config(); let scope = Scope::empty(); - let args = match args { - Some(args) => config.evaluate_args(args.iter(), &scope)?, - None => Args::default(), - }; + let args = config.evaluate_args(call, context, &scope, source)?; Ok(ClassifiedCommand::Sink(SinkCommand { command, - name_span: Some(span.clone()), + name_span: Some(head.span().clone()), args, })) } false => { - let arg_list_strings: Vec> = match args { + let arg_list_strings: Vec> = match call.children() { + //Some(args) => args.iter().map(|i| i.as_external_arg(source)).collect(), Some(args) => args .iter() - .map(|i| Spanned::from_item(i.as_external_arg(), i.span)) + .map(|i| Spanned::from_item(i.as_external_arg(source), i.span())) .collect(), None => vec![], }; Ok(ClassifiedCommand::External(ExternalCommand { name: name.to_string(), - name_span: Some(span.clone()), + name_span: Some(head.span().clone()), args: arg_list_strings, })) } }, - }, - - (_, None) => Err(ShellError::string( - "Unimplemented command that is just an expression (1)", - )), - (_, Some(_)) => Err(ShellError::string("Unimplemented dynamic command")), + } } - } else { - Err(ShellError::string(&format!( - "Unimplemented command that is just an expression (2) -- {:?}", - command - ))) + + _ => Err(ShellError::unimplemented( + "classify_command on command whose head is not bare", + )), } } diff --git a/src/commands.rs b/src/commands.rs index 2923d449ff..3454a0c01d 100644 --- a/src/commands.rs +++ b/src/commands.rs @@ -41,6 +41,6 @@ crate mod where_; crate use command::command; crate use config::Config; - +crate use open::Open; crate use where_::Where; crate use skip_while::SkipWhile; diff --git a/src/commands/cd.rs b/src/commands/cd.rs index 380c7d5832..bf6d581e9b 100644 --- a/src/commands/cd.rs +++ b/src/commands/cd.rs @@ -10,7 +10,8 @@ pub fn cd(args: CommandArgs) -> Result { match latest.obj { Value::Filesystem => { let cwd = latest.path().to_path_buf(); - let path = match args.positional.first() { + + let path = match args.nth(0) { None => match dirs::home_dir() { Some(o) => o, _ => { @@ -26,10 +27,10 @@ pub fn cd(args: CommandArgs) -> Result { match dunce::canonicalize(cwd.join(&target).as_path()) { Ok(p) => p, Err(_) => { - return Err(ShellError::maybe_labeled_error( + return Err(ShellError::labeled_error( "Can not change to directory", "directory not found", - Some(args.positional[0].span.clone()), + v.span.clone(), )); } } @@ -40,11 +41,11 @@ pub fn cd(args: CommandArgs) -> Result { match env::set_current_dir(&path) { Ok(_) => {} Err(_) => { - if args.positional.len() > 0 { - return Err(ShellError::maybe_labeled_error( + if args.len() > 0 { + return Err(ShellError::labeled_error( "Can not change to directory", "directory not found", - Some(args.positional[0].span.clone()), + args.nth(0).unwrap().span.clone(), )); } else { return Err(ShellError::string("Can not change to directory")); @@ -56,7 +57,7 @@ pub fn cd(args: CommandArgs) -> Result { } _ => { let mut stream = VecDeque::new(); - match args.positional.first() { + match args.nth(0) { None => { stream.push_back(ReturnValue::change_cwd(PathBuf::from("/"))); } diff --git a/src/commands/classified.rs b/src/commands/classified.rs index bb476187ee..65c5ed8753 100644 --- a/src/commands/classified.rs +++ b/src/commands/classified.rs @@ -1,15 +1,16 @@ use crate::commands::command::Sink; -use crate::parser::ast::Expression; -use crate::parser::lexer::{Span, Spanned}; -use crate::parser::registry::Args; +use crate::parser::parse2::span::Spanned; +use crate::parser::{registry::Args, Span, TokenNode}; use crate::prelude::*; use bytes::{BufMut, BytesMut}; use futures::stream::StreamExt; use futures_codec::{Decoder, Encoder, Framed}; +use log::{log_enabled, trace}; use std::io::{Error, ErrorKind}; use std::path::PathBuf; use std::sync::Arc; use subprocess::Exec; + /// A simple `Codec` implementation that splits up data into lines. pub struct LinesCodec {} @@ -80,7 +81,7 @@ crate struct ClassifiedPipeline { crate enum ClassifiedCommand { #[allow(unused)] - Expr(Expression), + Expr(TokenNode), Internal(InternalCommand), Sink(SinkCommand), External(ExternalCommand), @@ -110,18 +111,31 @@ impl InternalCommand { context: &mut Context, input: ClassifiedInputStream, ) -> Result { - let mut result = context.run_command( - self.command, - self.name_span.clone(), - self.args, - input.objects, - )?; + let objects = if log_enabled!(log::Level::Trace) { + trace!("->"); + trace!("{}", self.command.name()); + trace!("{:?}", self.args.debug()); + let objects: Vec<_> = input.objects.collect().await; + trace!( + "input = {:#?}", + objects.iter().map(|o| o.debug()).collect::>(), + ); + VecDeque::from(objects).boxed() + } else { + input.objects + }; + + let mut result = + context.run_command(self.command, self.name_span.clone(), self.args, objects)?; + let env = context.env.clone(); + let mut stream = VecDeque::new(); while let Some(item) = result.next().await { match item { ReturnValue::Value(Value::Error(err)) => { return Err(*err); } + ReturnValue::Action(action) => match action { CommandAction::ChangePath(path) => { context.env.lock().unwrap().back_mut().map(|x| { @@ -177,10 +191,12 @@ impl ExternalCommand { ) -> Result { let inputs: Vec = input.objects.collect().await; + trace!("{:?} -> {}", inputs, self.name); + let mut arg_string = format!("{}", self.name); for arg in &self.args { - arg_string.push_str(" "); - arg_string.push_str(&arg.item); + //arg_string.push_str(" "); + arg_string.push_str(&arg); } let mut process; @@ -191,6 +207,7 @@ impl ExternalCommand { if arg_string.contains("$it") { let mut first = true; + for i in &inputs { if i.as_string().is_err() { let mut span = None; @@ -217,6 +234,10 @@ impl ExternalCommand { } for arg in &self.args { + if arg.chars().all(|c| c.is_whitespace()) { + continue; + } + process = process.arg(&arg.replace("$it", &i.as_string().unwrap())); } } @@ -254,6 +275,10 @@ impl ExternalCommand { } for arg in &self.args { + if arg.chars().all(|c| c.is_whitespace()) { + continue; + } + new_arg_string.push_str(" "); new_arg_string.push_str(&arg.replace("$it", &i.as_string().unwrap())); } diff --git a/src/commands/command.rs b/src/commands/command.rs index ff2046206e..d25cf52b67 100644 --- a/src/commands/command.rs +++ b/src/commands/command.rs @@ -1,25 +1,53 @@ use crate::errors::ShellError; use crate::object::Value; -use crate::parser::lexer::Span; -use crate::parser::lexer::Spanned; -use crate::parser::CommandConfig; +use crate::parser::{ + registry::{self, Args}, + Span, Spanned, +}; use crate::prelude::*; +use getset::Getters; use std::path::PathBuf; +#[derive(Getters)] +#[get = "crate"] pub struct CommandArgs { pub host: Arc>, pub env: Arc>>, pub name_span: Option, - pub positional: Vec>, - pub named: indexmap::IndexMap, + pub args: Args, pub input: InputStream, } +impl CommandArgs { + pub fn nth(&self, pos: usize) -> Option<&Spanned> { + self.args.nth(pos) + } + + pub fn positional_iter(&self) -> impl Iterator> { + self.args.positional_iter() + } + + pub fn expect_nth(&self, pos: usize) -> Result<&Spanned, ShellError> { + self.args.expect_nth(pos) + } + + pub fn len(&self) -> usize { + self.args.len() + } + + pub fn get(&self, name: &str) -> Option<&Spanned> { + self.args.get(name) + } + + pub fn has(&self, name: &str) -> bool { + self.args.has(name) + } +} + pub struct SinkCommandArgs { pub ctx: Context, pub name_span: Option, - pub positional: Vec>, - pub named: indexmap::IndexMap, + pub args: Args, pub input: Vec, } @@ -46,8 +74,8 @@ pub trait Command { fn run(&self, args: CommandArgs) -> Result; fn name(&self) -> &str; - fn config(&self) -> CommandConfig { - CommandConfig { + fn config(&self) -> registry::CommandConfig { + registry::CommandConfig { name: self.name().to_string(), mandatory_positional: vec![], optional_positional: vec![], @@ -61,8 +89,8 @@ pub trait Sink { fn run(&self, args: SinkCommandArgs) -> Result<(), ShellError>; fn name(&self) -> &str; - fn config(&self) -> CommandConfig { - CommandConfig { + fn config(&self) -> registry::CommandConfig { + registry::CommandConfig { name: self.name().to_string(), mandatory_positional: vec![], optional_positional: vec![], diff --git a/src/commands/config.rs b/src/commands/config.rs index 11b35a84e2..d18bc2f17f 100644 --- a/src/commands/config.rs +++ b/src/commands/config.rs @@ -1,8 +1,7 @@ use crate::errors::ShellError; use crate::object::config; use crate::object::Value; -use crate::parser::registry::{NamedType, NamedValue}; -use crate::parser::CommandConfig; +use crate::parser::registry::{CommandConfig, NamedType, NamedValue}; use crate::prelude::*; use indexmap::IndexMap; use log::trace; @@ -19,7 +18,7 @@ impl Command for Config { fn config(&self) -> CommandConfig { let mut named: IndexMap = IndexMap::new(); - named.insert("set".to_string(), NamedType::Optional(NamedValue::Tuple)); + named.insert("set".to_string(), NamedType::Optional(NamedValue::Single)); named.insert("get".to_string(), NamedType::Optional(NamedValue::Single)); named.insert("clear".to_string(), NamedType::Switch); @@ -41,10 +40,10 @@ impl Command for Config { pub fn config(args: CommandArgs) -> Result { let mut result = crate::object::config::config()?; - trace!("{:#?}", args.positional); - trace!("{:#?}", args.named); + trace!("{:#?}", args.args.positional); + trace!("{:#?}", args.args.named); - if let Some(v) = args.named.get("get") { + if let Some(v) = args.get("get") { let key = v.as_string()?; let value = result .get(&key) @@ -56,7 +55,7 @@ pub fn config(args: CommandArgs) -> Result { ); } - if let Some(v) = args.named.get("set") { + if let Some(v) = args.get("set") { if let Ok((key, value)) = v.as_pair() { result.insert(key.as_string()?, value.clone()); @@ -71,7 +70,7 @@ pub fn config(args: CommandArgs) -> Result { } } - if let Some(_) = args.named.get("clear") { + if let Some(_) = args.get("clear") { result.clear(); config::write_config(&result)?; @@ -84,7 +83,7 @@ pub fn config(args: CommandArgs) -> Result { ); } - if let Some(v) = args.named.get("remove") { + if let Some(v) = args.get("remove") { let key = v.as_string()?; if result.contains_key(&key) { @@ -104,7 +103,7 @@ pub fn config(args: CommandArgs) -> Result { ); } - if args.positional.len() == 0 { + if args.len() == 0 { return Ok( futures::stream::once(futures::future::ready(ReturnValue::Value(Value::Object( result.into(), diff --git a/src/commands/enter.rs b/src/commands/enter.rs index 2ca3c2ccaf..df0315a9ba 100644 --- a/src/commands/enter.rs +++ b/src/commands/enter.rs @@ -1,32 +1,34 @@ use crate::commands::command::CommandAction; use crate::errors::ShellError; use crate::object::{Primitive, Value}; -use crate::parser::lexer::Spanned; +use crate::parser::Spanned; use crate::prelude::*; use std::path::{Path, PathBuf}; pub fn enter(args: CommandArgs) -> Result { - if args.positional.len() == 0 { - return Err(ShellError::maybe_labeled_error( + let path = match args.nth(0) { + None => return Err(ShellError::maybe_labeled_error( "open requires a path or url", "missing path", args.name_span, - )); - } + )), + Some(p) => p, + }; let span = args.name_span; let cwd = args - .env + .env() .lock() .unwrap() .front() .unwrap() .path() .to_path_buf(); + let mut full_path = PathBuf::from(cwd); - let (file_extension, contents) = match &args.positional[0].item { + let (file_extension, contents) = match path.item() { Value::Primitive(Primitive::String(s)) => { if s.starts_with("http:") || s.starts_with("https:") { let response = reqwest::get(s); @@ -49,7 +51,7 @@ pub fn enter(args: CommandArgs) -> Result { return Err(ShellError::labeled_error( "Web page contents corrupt", "received garbled data", - args.positional[0].span, + args.expect_nth(0)?.span, )); } }, @@ -57,7 +59,7 @@ pub fn enter(args: CommandArgs) -> Result { return Err(ShellError::labeled_error( "URL could not be opened", "url not found", - args.positional[0].span, + args.expect_nth(0)?.span, )); } } @@ -74,7 +76,7 @@ pub fn enter(args: CommandArgs) -> Result { return Err(ShellError::labeled_error( "File cound not be opened", "file not found", - args.positional[0].span, + args.expect_nth(0)?.span, )); } } @@ -84,14 +86,14 @@ pub fn enter(args: CommandArgs) -> Result { return Err(ShellError::labeled_error( "Expected string value for filename", "expected filename", - args.positional[0].span, + args.expect_nth(0)?.span, )); } }; let mut stream = VecDeque::new(); - let file_extension = match args.positional.get(1) { + let file_extension = match args.nth(1) { Some(Spanned { item: Value::Primitive(Primitive::String(s)), span, diff --git a/src/commands/first.rs b/src/commands/first.rs index 89bb4ff9c9..68831eeaea 100644 --- a/src/commands/first.rs +++ b/src/commands/first.rs @@ -4,7 +4,7 @@ use crate::prelude::*; // TODO: "Amount remaining" wrapper pub fn first(args: CommandArgs) -> Result { - if args.positional.len() == 0 { + if args.len() == 0 { return Err(ShellError::maybe_labeled_error( "First requires an amount", "needs parameter", @@ -12,7 +12,7 @@ pub fn first(args: CommandArgs) -> Result { )); } - let amount = args.positional[0].as_i64(); + let amount = args.expect_nth(0)?.as_i64(); let amount = match amount { Ok(o) => o, @@ -20,7 +20,7 @@ pub fn first(args: CommandArgs) -> Result { return Err(ShellError::labeled_error( "Value is not a number", "expected integer", - args.positional[0].span, + args.expect_nth(0)?.span, )) } }; diff --git a/src/commands/get.rs b/src/commands/get.rs index 60b835d62f..81a000a010 100644 --- a/src/commands/get.rs +++ b/src/commands/get.rs @@ -1,6 +1,6 @@ use crate::errors::ShellError; use crate::object::Value; -use crate::parser::lexer::Span; +use crate::parser::Span; use crate::prelude::*; fn get_member(path: &str, span: Span, obj: &Value) -> Option { @@ -22,7 +22,7 @@ fn get_member(path: &str, span: Span, obj: &Value) -> Option { } pub fn get(args: CommandArgs) -> Result { - if args.positional.len() == 0 { + if args.len() == 0 { return Err(ShellError::maybe_labeled_error( "Get requires a field or field path", "needs parameter", @@ -30,7 +30,7 @@ pub fn get(args: CommandArgs) -> Result { )); } - let amount = args.positional[0].as_i64(); + let amount = args.expect_nth(0)?.as_i64(); // If it's a number, get the row instead of the column if let Ok(amount) = amount { @@ -43,8 +43,7 @@ pub fn get(args: CommandArgs) -> Result { } let fields: Result, _> = args - .positional - .iter() + .positional_iter() .map(|a| (a.as_string().map(|x| (x, a.span)))) .collect(); let fields = fields?; diff --git a/src/commands/lines.rs b/src/commands/lines.rs index b1db3feb2f..86ac1ac09b 100644 --- a/src/commands/lines.rs +++ b/src/commands/lines.rs @@ -1,6 +1,9 @@ use crate::errors::ShellError; use crate::object::{Primitive, Value}; use crate::prelude::*; +use log::trace; + +// TODO: "Amount remaining" wrapper pub fn lines(args: CommandArgs) -> Result { let input = args.input; @@ -9,7 +12,10 @@ pub fn lines(args: CommandArgs) -> Result { let stream = input .map(move |v| match v { Value::Primitive(Primitive::String(s)) => { - let split_result: Vec<_> = s.lines().filter(|s| s.trim() != "").collect(); + let splitter = "\n"; + let split_result: Vec<_> = s.split(&splitter).filter(|s| s.trim() != "").collect(); + + trace!("split result = {:?}", split_result); let mut result = VecDeque::new(); for s in split_result { diff --git a/src/commands/ls.rs b/src/commands/ls.rs index f8205e3a1a..2f0b09156c 100644 --- a/src/commands/ls.rs +++ b/src/commands/ls.rs @@ -1,6 +1,6 @@ use crate::errors::ShellError; use crate::object::{dir_entry_dict, Primitive, Value}; -use crate::parser::lexer::Spanned; +use crate::parser::Spanned; use crate::prelude::*; use std::ffi::OsStr; use std::path::{Path, PathBuf}; @@ -10,7 +10,7 @@ pub fn ls(args: CommandArgs) -> Result { let path = env.back().unwrap().path.to_path_buf(); let obj = &env.back().unwrap().obj; let mut full_path = PathBuf::from(path); - match &args.positional.get(0) { + match &args.nth(0) { Some(Spanned { item: Value::Primitive(Primitive::String(s)), .. @@ -24,7 +24,7 @@ pub fn ls(args: CommandArgs) -> Result { let entries = match entries { Err(e) => { - if let Some(s) = args.positional.get(0) { + if let Some(s) = args.nth(0) { return Err(ShellError::labeled_error( e.to_string(), e.to_string(), @@ -97,7 +97,7 @@ pub fn ls(args: CommandArgs) -> Result { return Err(ShellError::maybe_labeled_error( "Index not closed", format!("path missing closing ']'"), - if args.positional.len() > 0 { Some(args.positional[0].span) } else { args.name_span }, + if args.len() > 0 { Some(args.nth(0).unwrap().span) } else { args.name_span }, )) } } diff --git a/src/commands/open.rs b/src/commands/open.rs index 0edce69880..17be0b7063 100644 --- a/src/commands/open.rs +++ b/src/commands/open.rs @@ -1,11 +1,37 @@ use crate::errors::ShellError; use crate::object::{Primitive, Value}; -use crate::parser::lexer::Spanned; +use crate::parser::registry::{CommandConfig, NamedType}; use crate::prelude::*; +use indexmap::IndexMap; use std::path::{Path, PathBuf}; +use crate::parser::parse2::span::Spanned; -pub fn open(args: CommandArgs) -> Result { - if args.positional.len() == 0 { +pub struct Open; + +impl Command for Open { + fn run(&self, args: CommandArgs) -> Result { + open(args) + } + fn name(&self) -> &str { + "open" + } + + fn config(&self) -> CommandConfig { + let mut named: IndexMap = IndexMap::new(); + named.insert("raw".to_string(), NamedType::Switch); + + CommandConfig { + name: self.name().to_string(), + mandatory_positional: vec![], + optional_positional: vec![], + rest_positional: false, + named, + } + } +} + +fn open(args: CommandArgs) -> Result { + if args.len() == 0 { return Err(ShellError::maybe_labeled_error( "Open requires a path or url", "needs path or url", @@ -25,7 +51,7 @@ pub fn open(args: CommandArgs) -> Result { .to_path_buf(); let mut full_path = PathBuf::from(cwd); - let (file_extension, contents) = match &args.positional[0].item { + let (file_extension, contents) = match &args.expect_nth(0)?.item { Value::Primitive(Primitive::String(s)) => { if s.starts_with("http:") || s.starts_with("https:") { let response = reqwest::get(s); @@ -48,7 +74,7 @@ pub fn open(args: CommandArgs) -> Result { return Err(ShellError::labeled_error( "Web page contents corrupt", "received garbled data", - args.positional[0].span, + args.expect_nth(0)?.span, )); } }, @@ -56,7 +82,7 @@ pub fn open(args: CommandArgs) -> Result { return Err(ShellError::labeled_error( "URL could not be opened", "url not found", - args.positional[0].span, + args.expect_nth(0)?.span, )); } } @@ -71,9 +97,9 @@ pub fn open(args: CommandArgs) -> Result { ), Err(_) => { return Err(ShellError::labeled_error( - "File could not be opened", - "could not be opened", - args.positional[0].span, + "File cound not be opened", + "file not found", + args.expect_nth(0)?.span, )); } } @@ -83,14 +109,14 @@ pub fn open(args: CommandArgs) -> Result { return Err(ShellError::labeled_error( "Expected string value for filename", "expected filename", - args.positional[0].span, + args.expect_nth(0)?.span, )); } }; let mut stream = VecDeque::new(); - let file_extension = match args.positional.get(1) { + let file_extension = match args.nth(1) { Some(Spanned { item: Value::Primitive(Primitive::String(s)), span, diff --git a/src/commands/pick.rs b/src/commands/pick.rs index 9de5e80683..12d2a271a4 100644 --- a/src/commands/pick.rs +++ b/src/commands/pick.rs @@ -4,7 +4,7 @@ use crate::object::Value; use crate::prelude::*; pub fn pick(args: CommandArgs) -> Result { - if args.positional.len() == 0 { + if args.len() == 0 { return Err(ShellError::maybe_labeled_error( "Pick requires fields", "needs parameter", @@ -12,7 +12,7 @@ pub fn pick(args: CommandArgs) -> Result { )); } - let fields: Result, _> = args.positional.iter().map(|a| a.as_string()).collect(); + let fields: Result, _> = args.positional_iter().map(|a| a.as_string()).collect(); let fields = fields?; let objects = args diff --git a/src/commands/reject.rs b/src/commands/reject.rs index ec5703738b..50bce3d724 100644 --- a/src/commands/reject.rs +++ b/src/commands/reject.rs @@ -4,7 +4,7 @@ use crate::object::Value; use crate::prelude::*; pub fn reject(args: CommandArgs) -> Result { - if args.positional.len() == 0 { + if args.len() == 0 { return Err(ShellError::maybe_labeled_error( "Reject requires fields", "needs parameter", @@ -12,7 +12,7 @@ pub fn reject(args: CommandArgs) -> Result { )); } - let fields: Result, _> = args.positional.iter().map(|a| a.as_string()).collect(); + let fields: Result, _> = args.positional_iter().map(|a| a.as_string()).collect(); let fields = fields?; let stream = args diff --git a/src/commands/save.rs b/src/commands/save.rs index 3aeb751033..6c61df3f94 100644 --- a/src/commands/save.rs +++ b/src/commands/save.rs @@ -1,11 +1,11 @@ use crate::commands::command::SinkCommandArgs; use crate::errors::ShellError; use crate::object::{Primitive, Value}; -use crate::parser::lexer::Spanned; +use crate::parser::Spanned; use std::path::{Path, PathBuf}; pub fn save(args: SinkCommandArgs) -> Result<(), ShellError> { - if args.positional.len() == 0 { + if args.args.positional.is_none() { return Err(ShellError::maybe_labeled_error( "Save requires a filepath", "needs path", @@ -13,6 +13,11 @@ pub fn save(args: SinkCommandArgs) -> Result<(), ShellError> { )); } + let positional = match args.args.positional { + None => return Err(ShellError::string("save requires a filepath")), + Some(p) => p, + }; + let cwd = args .ctx .env @@ -23,12 +28,12 @@ pub fn save(args: SinkCommandArgs) -> Result<(), ShellError> { .path() .to_path_buf(); let mut full_path = PathBuf::from(cwd); - match &(args.positional[0].item) { + match &(positional[0].item) { Value::Primitive(Primitive::String(s)) => full_path.push(Path::new(s)), _ => {} } - let save_raw = match args.positional.get(1) { + let save_raw = match positional.get(1) { Some(Spanned { item: Value::Primitive(Primitive::String(s)), .. diff --git a/src/commands/size.rs b/src/commands/size.rs index 6fdf78cfae..5d99cb5e55 100644 --- a/src/commands/size.rs +++ b/src/commands/size.rs @@ -6,7 +6,7 @@ use std::fs::File; use std::io::prelude::*; pub fn size(args: CommandArgs) -> Result { - if args.positional.len() == 0 { + if args.len() == 0 { return Err(ShellError::maybe_labeled_error( "Size requires a filepath", "needs path", @@ -25,7 +25,7 @@ pub fn size(args: CommandArgs) -> Result { let mut contents = String::new(); let mut list = VecDeque::new(); - for name in args.positional { + for name in args.positional_iter() { let name = name.as_string()?; let path = cwd.join(&name); let mut file = File::open(path)?; diff --git a/src/commands/skip.rs b/src/commands/skip.rs index d556151053..19b53ae582 100644 --- a/src/commands/skip.rs +++ b/src/commands/skip.rs @@ -2,7 +2,7 @@ use crate::errors::ShellError; use crate::prelude::*; pub fn skip(args: CommandArgs) -> Result { - if args.positional.len() == 0 { + if args.len() == 0 { return Err(ShellError::maybe_labeled_error( "Skip requires an amount", "needs parameter", @@ -10,7 +10,7 @@ pub fn skip(args: CommandArgs) -> Result { )); } - let amount = args.positional[0].as_i64(); + let amount = args.expect_nth(0)?.as_i64(); let amount = match amount { Ok(o) => o, @@ -18,7 +18,7 @@ pub fn skip(args: CommandArgs) -> Result { return Err(ShellError::labeled_error( "Value is not a number", "expected integer", - args.positional[0].span, + args.expect_nth(0)?.span, )) } }; diff --git a/src/commands/skip_while.rs b/src/commands/skip_while.rs index 15cb439812..eb6a948823 100644 --- a/src/commands/skip_while.rs +++ b/src/commands/skip_while.rs @@ -1,6 +1,6 @@ use crate::errors::ShellError; +use crate::parser::registry::CommandConfig; use crate::parser::registry::PositionalType; -use crate::parser::CommandConfig; use crate::prelude::*; pub struct SkipWhile; @@ -25,7 +25,7 @@ impl Command for SkipWhile { } pub fn skip_while(args: CommandArgs) -> Result { - if args.positional.len() == 0 { + if args.len() == 0 { return Err(ShellError::maybe_labeled_error( "Where requires a condition", "needs condition", @@ -33,7 +33,7 @@ pub fn skip_while(args: CommandArgs) -> Result { )); } - let block = args.positional[0].as_block()?; + let block = args.nth(0).unwrap().as_block()?; let input = args.input; let objects = input.skip_while(move |item| { @@ -48,4 +48,4 @@ pub fn skip_while(args: CommandArgs) -> Result { }); Ok(objects.map(|x| ReturnValue::Value(x)).boxed()) -} \ No newline at end of file +} diff --git a/src/commands/sort_by.rs b/src/commands/sort_by.rs index d488d5cbd4..9793e9b1b9 100644 --- a/src/commands/sort_by.rs +++ b/src/commands/sort_by.rs @@ -2,7 +2,7 @@ use crate::errors::ShellError; use crate::prelude::*; pub fn sort_by(args: CommandArgs) -> Result { - let fields: Result, _> = args.positional.iter().map(|a| a.as_string()).collect(); + let fields: Result, _> = args.positional_iter().map(|a| a.as_string()).collect(); let fields = fields?; let output = args.input.collect::>(); diff --git a/src/commands/split_column.rs b/src/commands/split_column.rs index 653b9e6180..e8890a1b35 100644 --- a/src/commands/split_column.rs +++ b/src/commands/split_column.rs @@ -6,28 +6,30 @@ use log::trace; // TODO: "Amount remaining" wrapper pub fn split_column(args: CommandArgs) -> Result { - if args.positional.len() == 0 { + let positional: Vec<_> = args.positional_iter().cloned().collect(); + let span = args.name_span; + + if positional.len() == 0 { return Err(ShellError::maybe_labeled_error( "Split-column needs more information", "needs parameter (eg split-column \",\")", args.name_span, )); } + let input = args.input; - let span = args.name_span; - let args = args.positional; Ok(input .map(move |v| match v { Value::Primitive(Primitive::String(s)) => { - let splitter = args[0].as_string().unwrap().replace("\\n", "\n"); + let splitter = positional[0].as_string().unwrap().replace("\\n", "\n"); trace!("splitting with {:?}", splitter); let split_result: Vec<_> = s.split(&splitter).filter(|s| s.trim() != "").collect(); trace!("split result = {:?}", split_result); // If they didn't provide column names, make up our own - if (args.len() - 1) == 0 { + if (positional.len() - 1) == 0 { let mut gen_columns = vec![]; for i in 0..split_result.len() { gen_columns.push(format!("Column{}", i + 1)); @@ -41,9 +43,9 @@ pub fn split_column(args: CommandArgs) -> Result { ); } ReturnValue::Value(Value::Object(dict)) - } else if split_result.len() == (args.len() - 1) { + } else if split_result.len() == (positional.len() - 1) { let mut dict = crate::object::Dictionary::default(); - for (k, v) in split_result.iter().zip(args.iter().skip(1)) { + for (k, v) in split_result.iter().zip(positional.iter().skip(1)) { dict.add( v.as_string().unwrap(), Value::Primitive(Primitive::String(k.to_string())), @@ -52,7 +54,7 @@ pub fn split_column(args: CommandArgs) -> Result { ReturnValue::Value(Value::Object(dict)) } else { let mut dict = crate::object::Dictionary::default(); - for k in args.iter().skip(1) { + for k in positional.iter().skip(1) { dict.add( k.as_string().unwrap().trim(), Value::Primitive(Primitive::String("".to_string())), diff --git a/src/commands/split_row.rs b/src/commands/split_row.rs index ed382bb761..f29f4bc261 100644 --- a/src/commands/split_row.rs +++ b/src/commands/split_row.rs @@ -1,12 +1,16 @@ use crate::errors::ShellError; use crate::object::{Primitive, Value}; +use crate::parser::Spanned; use crate::prelude::*; use log::trace; // TODO: "Amount remaining" wrapper pub fn split_row(args: CommandArgs) -> Result { - if args.positional.len() == 0 { + let positional: Vec> = args.positional_iter().cloned().collect(); + let span = args.name_span; + + if positional.len() == 0 { return Err(ShellError::maybe_labeled_error( "Split-row needs more information", "needs parameter (eg split-row \"\\n\")", @@ -15,13 +19,11 @@ pub fn split_row(args: CommandArgs) -> Result { } let input = args.input; - let span = args.name_span; - let args = args.positional; let stream = input .map(move |v| match v { Value::Primitive(Primitive::String(s)) => { - let splitter = args[0].as_string().unwrap().replace("\\n", "\n"); + let splitter = positional[0].as_string().unwrap().replace("\\n", "\n"); trace!("splitting with {:?}", splitter); let split_result: Vec<_> = s.split(&splitter).filter(|s| s.trim() != "").collect(); diff --git a/src/commands/view.rs b/src/commands/view.rs index 51e29cdbaa..2aba83d0bb 100644 --- a/src/commands/view.rs +++ b/src/commands/view.rs @@ -3,7 +3,7 @@ use crate::prelude::*; use prettyprint::PrettyPrinter; pub fn view(args: CommandArgs) -> Result { - if args.positional.len() == 0 { + if args.len() == 0 { return Err(ShellError::maybe_labeled_error( "View requires a filename", "needs parameter", @@ -11,7 +11,7 @@ pub fn view(args: CommandArgs) -> Result { )); } - let target = match args.positional[0].as_string() { + let target = match args.expect_nth(0)?.as_string() { Ok(s) => s.clone(), Err(e) => { if let Some(span) = args.name_span { diff --git a/src/commands/where_.rs b/src/commands/where_.rs index 045c6f7df6..e5c2279ad3 100644 --- a/src/commands/where_.rs +++ b/src/commands/where_.rs @@ -1,6 +1,5 @@ use crate::errors::ShellError; -use crate::parser::registry::PositionalType; -use crate::parser::CommandConfig; +use crate::parser::registry::{CommandConfig, PositionalType}; use crate::prelude::*; pub struct Where; @@ -25,7 +24,7 @@ impl Command for Where { } pub fn r#where(args: CommandArgs) -> Result { - if args.positional.len() == 0 { + if args.len() == 0 { return Err(ShellError::maybe_labeled_error( "Where requires a condition", "needs condition", @@ -33,7 +32,7 @@ pub fn r#where(args: CommandArgs) -> Result { )); } - let block = args.positional[0].as_block()?; + let block = args.expect_nth(0)?.as_block()?; let input = args.input; let objects = input.filter_map(move |item| { diff --git a/src/context.rs b/src/context.rs index 931190acad..aee27d17e9 100644 --- a/src/context.rs +++ b/src/context.rs @@ -1,7 +1,8 @@ -use crate::commands::command::Sink; -use crate::commands::command::SinkCommandArgs; -use crate::parser::lexer::Span; -use crate::parser::Args; +use crate::commands::command::{Sink, SinkCommandArgs}; +use crate::parser::{ + registry::{Args, CommandConfig, CommandRegistry}, + Span, +}; use crate::prelude::*; use indexmap::IndexMap; @@ -58,8 +59,7 @@ impl Context { let command_args = SinkCommandArgs { ctx: self.clone(), name_span, - positional: args.positional, - named: args.named, + args, input, }; @@ -89,11 +89,16 @@ impl Context { host: self.host.clone(), env: self.env.clone(), name_span, - positional: args.positional, - named: args.named, + args, input, }; command.run(command_args) } } + +impl CommandRegistry for Context { + fn get(&self, name: &str) -> Option { + self.commands.get(name).map(|c| c.config()) + } +} diff --git a/src/errors.rs b/src/errors.rs index 520a2633d7..88d5e78fd3 100644 --- a/src/errors.rs +++ b/src/errors.rs @@ -1,6 +1,7 @@ -use crate::parser::lexer::{Span, SpannedToken}; #[allow(unused)] use crate::prelude::*; + +use crate::parser::Span; use derive_new::new; use language_reporting::{Diagnostic, Label, Severity}; use serde::{Deserialize, Deserializer, Serialize, Serializer}; @@ -15,26 +16,40 @@ pub enum ShellError { impl ShellError { crate fn parse_error( - error: lalrpop_util::ParseError, + error: nom::Err<(nom_locate::LocatedSpan<&str>, nom::error::ErrorKind)>, ) -> ShellError { - use lalrpop_util::ParseError; use language_reporting::*; match error { - ParseError::UnrecognizedToken { - token: (start, SpannedToken { token, .. }, end), - expected, - } => { - let diagnostic = Diagnostic::new( - Severity::Error, - format!("Unexpected {:?}, expected {:?}", token, expected), - ) - .with_label(Label::new_primary(Span::from((start, end)))); + nom::Err::Incomplete(_) => unreachable!(), + nom::Err::Failure(span) | nom::Err::Error(span) => { + let diagnostic = + Diagnostic::new(Severity::Error, format!("{:?}", span)) + .with_label(Label::new_primary(Span::from(span.0))); ShellError::diagnostic(diagnostic) + // nom::Context::Code(span, kind) => { + // let diagnostic = + // Diagnostic::new(Severity::Error, format!("{}", kind.description())) + // .with_label(Label::new_primary(Span::from(span))); + + // ShellError::diagnostic(diagnostic) + // } } - ParseError::User { error } => error, - other => ShellError::string(format!("{:?}", other)), + // ParseError::UnrecognizedToken { + // token: (start, SpannedToken { token, .. }, end), + // expected, + // } => { + // let diagnostic = Diagnostic::new( + // Severity::Error, + // format!("Unexpected {:?}, expected {:?}", token, expected), + // ) + // .with_label(Label::new_primary(Span::from((start, end)))); + + // ShellError::diagnostic(diagnostic) + // } + // ParseError::User { error } => error, + // other => ShellError::string(format!("{:?}", other)), } } @@ -75,6 +90,10 @@ impl ShellError { ShellError::string(&format!("Unimplemented: {}", title.into())) } + crate fn unexpected(title: impl Into) -> ShellError { + ShellError::string(&format!("Unexpected: {}", title.into())) + } + crate fn copy_error(&self) -> ShellError { self.clone() } @@ -191,14 +210,14 @@ impl std::convert::From for ShellError { } } -impl std::convert::From> for ShellError { - fn from(input: nom::Err<(&str, nom::ErrorKind)>) -> ShellError { - ShellError::String(StringError { - title: format!("{:?}", input), - error: Value::nothing(), - }) - } -} +// impl std::convert::From> for ShellError { +// fn from(input: nom::Err<(&str, nom::ErrorKind)>) -> ShellError { +// ShellError::String(StringError { +// title: format!("{:?}", input), +// error: Value::nothing(), +// }) +// } +// } impl std::convert::From for ShellError { fn from(input: toml::ser::Error) -> ShellError { diff --git a/src/evaluate/evaluator.rs b/src/evaluate/evaluator.rs index c60b7fe08d..70cd486e71 100644 --- a/src/evaluate/evaluator.rs +++ b/src/evaluate/evaluator.rs @@ -1,6 +1,8 @@ -use crate::object::Primitive; -use crate::parser::ast; -use crate::parser::lexer::Spanned; +use crate::object::base::Block; +use crate::parser::{ + hir::{self, Expression, RawExpression}, + CommandRegistry, Span, Spanned, Text, +}; use crate::prelude::*; use derive_new::new; use indexmap::IndexMap; @@ -21,96 +23,75 @@ impl Scope { } } -crate fn evaluate_expr( - expr: &ast::Expression, +crate fn evaluate_baseline_expr( + expr: &Expression, + registry: &dyn CommandRegistry, scope: &Scope, + source: &str, ) -> Result, ShellError> { - use ast::*; - match &expr.expr { - RawExpression::Call(_) => Err(ShellError::unimplemented("Evaluating call expression")), - RawExpression::Leaf(l) => Ok(Spanned::from_item(evaluate_leaf(l), expr.span.clone())), - RawExpression::Parenthesized(p) => evaluate_expr(&p.expr, scope), - RawExpression::Flag(f) => Ok(Spanned::from_item( - Value::Primitive(Primitive::String(f.print())), - expr.span.clone(), - )), - RawExpression::Block(b) => evaluate_block(&b, scope), - RawExpression::Path(p) => evaluate_path(&p, scope), - RawExpression::Binary(b) => evaluate_binary(b, scope), - RawExpression::VariableReference(r) => { - evaluate_reference(r, scope).map(|x| Spanned::from_item(x, expr.span.clone())) - } - } -} + match &expr.item { + RawExpression::Literal(literal) => Ok(evaluate_literal(expr.copy_span(*literal), source)), + RawExpression::Variable(var) => evaluate_reference(var, scope, source), + RawExpression::Binary(binary) => { + let left = evaluate_baseline_expr(binary.left(), registry, scope, source)?; + let right = evaluate_baseline_expr(binary.right(), registry, scope, source)?; -fn evaluate_leaf(leaf: &ast::Leaf) -> Value { - use ast::*; - - match leaf { - Leaf::String(s) => Value::string(s), - Leaf::Bare(path) => Value::string(path.to_string()), - Leaf::Boolean(b) => Value::boolean(*b), - Leaf::Int(i) => Value::int(*i), - Leaf::Unit(i, unit) => unit.compute(*i), - } -} - -fn evaluate_reference(r: &ast::Variable, scope: &Scope) -> Result { - use ast::Variable::*; - - match r { - It => Ok(scope.it.copy()), - Other(s) => Ok(scope - .vars - .get(s) - .map(|v| v.copy()) - .unwrap_or_else(|| Value::nothing())), - } -} - -fn evaluate_binary(binary: &ast::Binary, scope: &Scope) -> Result, ShellError> { - let left = evaluate_expr(&binary.left, scope)?; - let right = evaluate_expr(&binary.right, scope)?; - - match left.compare(&binary.operator, &right) { - Some(v) => Ok(Spanned::from_item( - Value::boolean(v), - binary.operator.span.clone(), - )), - None => Err(ShellError::TypeError(format!( - "Can't compare {} and {}", - left.type_name(), - right.type_name() - ))), - } -} - -fn evaluate_block(block: &ast::Block, _scope: &Scope) -> Result, ShellError> { - Ok(Spanned::from_item( - Value::block(block.expr.clone()), - block.expr.span.clone(), - )) -} - -fn evaluate_path(path: &ast::Path, scope: &Scope) -> Result, ShellError> { - let head = path.head(); - let mut value = evaluate_expr(head, scope)?; - let mut seen = vec![]; - - for name in path.tail() { - let next = value.get_data_by_key(&name.item); - seen.push(name.item.clone()); - - match next { - None => { - return Err(ShellError::MissingProperty { - expr: path.print(), - subpath: itertools::join(seen, "."), - }); + match left.compare(binary.op(), &*right) { + Some(result) => Ok(Spanned::from_item(Value::boolean(result), *expr.span())), + None => Err(ShellError::unimplemented(&format!( + "Comparison failure {:?}", + binary + ))), } - Some(v) => value = Spanned::from_item(v.copy(), name.span.clone()), } - } + RawExpression::Block(block) => Ok(Spanned::from_item( + Value::Block(Block::new(*block.clone(), Text::from(source))), // TODO: Pass Text around + block.span(), + )), + RawExpression::Path(path) => { + let value = evaluate_baseline_expr(path.head(), registry, scope, source)?; + let mut value = value.item(); - Ok(value) + for name in path.tail() { + let next = value.get_data_by_key(name); + + match next { + None => return Err(ShellError::unimplemented("Invalid property from path")), + Some(next) => value = next, + }; + } + + Ok(Spanned::from_item(value.clone(), expr.span())) + } + RawExpression::Boolean(_boolean) => unimplemented!(), + } +} + +fn evaluate_literal(literal: Spanned, source: &str) -> Spanned { + let result = match literal.item { + hir::Literal::Integer(int) => Value::int(int), + hir::Literal::Size(_int, _unit) => unimplemented!(), + hir::Literal::String(span) => Value::string(span.slice(source)), + hir::Literal::Bare => Value::string(literal.span().slice(source)), + }; + + literal.map(|_| result) +} + +fn evaluate_reference( + name: &hir::Variable, + scope: &Scope, + source: &str, +) -> Result, ShellError> { + match name { + hir::Variable::It(span) => Ok(Spanned::from_item(scope.it.copy(), span)), + hir::Variable::Other(span) => Ok(Spanned::from_item( + scope + .vars + .get(span.slice(source)) + .map(|v| v.copy()) + .unwrap_or_else(|| Value::nothing()), + span, + )), + } } diff --git a/src/evaluate/mod.rs b/src/evaluate/mod.rs index febfb1bd70..09451fbb49 100644 --- a/src/evaluate/mod.rs +++ b/src/evaluate/mod.rs @@ -1,3 +1,3 @@ crate mod evaluator; -crate use evaluator::{evaluate_expr, Scope}; +crate use evaluator::{evaluate_baseline_expr, Scope}; diff --git a/src/object/base.rs b/src/object/base.rs index d9a531387c..7b4e108ab8 100644 --- a/src/object/base.rs +++ b/src/object/base.rs @@ -1,16 +1,17 @@ use crate::errors::ShellError; -use crate::evaluate::{evaluate_expr, Scope}; +use crate::evaluate::{evaluate_baseline_expr, Scope}; use crate::object::DataDescriptor; -use crate::parser::ast::{self, Operator}; -use crate::parser::lexer::Spanned; +use crate::parser::{hir, Operator, Spanned}; use crate::prelude::*; use ansi_term::Color; use chrono::{DateTime, Utc}; use chrono_humanize::Humanize; use derive_new::new; use ordered_float::OrderedFloat; +use std::fmt; use std::time::SystemTime; +use crate::parser::Text; use serde::{Deserialize, Deserializer, Serialize, Serializer}; #[derive(Debug, Clone, Copy, Ord, PartialOrd, Eq, PartialEq, new)] @@ -75,6 +76,20 @@ impl Primitive { .to_string() } + crate fn debug(&self, f: &mut fmt::Formatter) -> fmt::Result { + use Primitive::*; + + match self { + Nothing => write!(f, "Nothing"), + Int(int) => write!(f, "{}", int), + Float(float) => write!(f, "{:?}", float), + Bytes(bytes) => write!(f, "{}", bytes), + String(string) => write!(f, "{:?}", string), + Boolean(boolean) => write!(f, "{}", boolean), + Date(date) => write!(f, "{}", date), + } + } + crate fn format(&self, field_name: Option<&DataDescriptor>) -> String { match self { Primitive::Nothing => format!("{}", Color::Black.bold().paint("-")), @@ -117,7 +132,8 @@ pub struct Operation { #[derive(Debug, Ord, PartialOrd, Eq, PartialEq, Clone, new)] pub struct Block { - crate expression: ast::Expression, + crate expression: hir::Expression, + crate source: Text, } impl Serialize for Block { @@ -125,7 +141,7 @@ impl Serialize for Block { where S: Serializer, { - serializer.serialize_str(&self.expression.print()) + serializer.serialize_str(&self.expression.source(self.source.as_ref())) } } @@ -134,17 +150,19 @@ impl Deserialize<'de> for Block { where D: Deserializer<'de>, { - let mut builder = ast::ExpressionBuilder::new(); - let expr: ast::Expression = builder.string("Unserializable block"); - - Ok(Block::new(expr)) + unimplemented!("deserialize block") + // let s = "\"unimplemented deserialize block\""; + // Ok(Block::new( + // TokenTreeBuilder::spanned_string((1, s.len() - 1), (0, s.len())), + // Text::from(s), + // )) } } impl Block { pub fn invoke(&self, value: &Value) -> Result, ShellError> { let scope = Scope::new(value.copy()); - evaluate_expr(&self.expression, &scope) + evaluate_baseline_expr(&self.expression, &(), &scope, self.source.as_ref()) } } @@ -153,6 +171,7 @@ pub enum Value { Primitive(Primitive), Object(crate::object::Dictionary), List(Vec), + #[allow(unused)] Block(Block), Filesystem, @@ -160,6 +179,39 @@ pub enum Value { Error(Box), } +pub fn debug_list(values: &'a Vec) -> ValuesDebug<'a> { + ValuesDebug { values } +} + +pub struct ValuesDebug<'a> { + values: &'a Vec, +} + +impl fmt::Debug for ValuesDebug<'a> { + fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result { + f.debug_list() + .entries(self.values.iter().map(|i| i.debug())) + .finish() + } +} + +pub struct ValueDebug<'a> { + value: &'a Value, +} + +impl fmt::Debug for ValueDebug<'a> { + fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result { + match self.value { + Value::Primitive(p) => p.debug(f), + Value::Object(o) => o.debug(f), + Value::List(l) => debug_list(l).fmt(f), + Value::Block(_) => write!(f, "[[block]]"), + Value::Error(err) => write!(f, "[[error :: {} ]]", err), + Value::Filesystem => write!(f, "[[filesystem]]"), + } + } +} + impl Value { crate fn type_name(&self) -> String { match self { @@ -172,6 +224,10 @@ impl Value { } } + crate fn debug(&'a self) -> ValueDebug<'a> { + ValueDebug { value: self } + } + crate fn data_descriptors(&self) -> Vec { match self { Value::Primitive(_) => vec![DataDescriptor::value_of()], @@ -237,7 +293,7 @@ impl Value { crate fn format_leaf(&self, desc: Option<&DataDescriptor>) -> String { match self { Value::Primitive(p) => p.format(desc), - Value::Block(b) => b.expression.print(), + Value::Block(b) => b.expression.source(b.source.as_ref()).to_string(), Value::Object(_) => format!("[object Object]"), Value::List(_) => format!("[list List]"), Value::Error(e) => format!("{}", e), @@ -245,7 +301,8 @@ impl Value { } } - crate fn compare(&self, operator: &ast::Operator, other: &Value) -> Option { + #[allow(unused)] + crate fn compare(&self, operator: &Operator, other: &Value) -> Option { match operator { _ => { let coerced = coerce_compare(self, other)?; @@ -347,8 +404,9 @@ impl Value { } } - crate fn block(e: ast::Expression) -> Value { - Value::Block(Block::new(e)) + #[allow(unused)] + crate fn block(e: hir::Expression, source: Text) -> Value { + Value::Block(Block::new(e, source)) } crate fn string(s: impl Into) -> Value { diff --git a/src/object/desc.rs b/src/object/desc.rs index 8693cba1cc..d69705b466 100644 --- a/src/object/desc.rs +++ b/src/object/desc.rs @@ -16,6 +16,13 @@ impl DescriptorName { } } + crate fn debug(&self) -> &str { + match self { + DescriptorName::String(s) => s, + DescriptorName::ValueOf => "[[value]]", + } + } + crate fn as_string(&self) -> Option<&str> { match self { DescriptorName::String(s) => Some(s), diff --git a/src/object/dict.rs b/src/object/dict.rs index c9ff168a0c..3cd13261b4 100644 --- a/src/object/dict.rs +++ b/src/object/dict.rs @@ -7,6 +7,7 @@ use indexmap::IndexMap; use serde::ser::{Serialize, SerializeMap, Serializer}; use serde_derive::Deserialize; use std::cmp::{Ordering, PartialOrd}; +use std::fmt; #[derive(Debug, Default, Eq, PartialEq, Deserialize, Clone, new)] pub struct Dictionary { @@ -113,4 +114,14 @@ impl Dictionary { None => None, } } + + crate fn debug(&self, f: &mut fmt::Formatter) -> fmt::Result { + let mut debug = f.debug_struct("Dictionary"); + + for (desc, value) in self.entries.iter() { + debug.field(desc.name.debug(), &value.debug()); + } + + debug.finish() + } } diff --git a/src/parser.rs b/src/parser.rs index b2eb9f8468..3af5481c76 100644 --- a/src/parser.rs +++ b/src/parser.rs @@ -1,279 +1,275 @@ -crate mod ast; -crate mod completer; -crate mod lexer; -crate mod parser; -crate mod registry; -crate mod span; +crate mod hir; crate mod parse2; - -crate use ast::Pipeline; -crate use registry::{Args, CommandConfig}; +crate mod parse_command; +crate mod registry; use crate::errors::ShellError; -use ast::Module; -use lexer::Lexer; -use log::trace; -use parser::{ModuleParser, ReplLineParser}; -pub fn parse(input: &str) -> Result { +crate use hir::baseline_parse_tokens::baseline_parse_tokens; +crate use parse2::call_node::CallNode; +crate use parse2::files::Files; +crate use parse2::flag::Flag; +crate use parse2::operator::Operator; +crate use parse2::parser::{nom_input, pipeline}; +crate use parse2::span::{Span, Spanned}; +crate use parse2::text::Text; +crate use parse2::token_tree::TokenNode; +crate use parse2::tokens::{RawToken, Token}; +crate use parse2::unit::Unit; +crate use parse_command::parse_command; +crate use registry::CommandRegistry; + +pub fn parse(input: &str) -> Result { let _ = pretty_env_logger::try_init(); - let parser = ReplLineParser::new(); - let tokens = Lexer::new(input, false); - - trace!( - "Tokens: {:?}", - tokens.clone().collect::, _>>() - ); - - match parser.parse(tokens) { - Ok(val) => Ok(val), + match pipeline(nom_input(input)) { + Ok((_rest, val)) => Ok(val), Err(err) => Err(ShellError::parse_error(err)), } } -#[allow(unused)] -pub fn parse_module(input: &str) -> Result { - let _ = pretty_env_logger::try_init(); +// #[allow(unused)] +// pub fn parse_module(input: &str) -> Result { +// let _ = pretty_env_logger::try_init(); - let parser = ModuleParser::new(); - let tokens = Lexer::new(input, false); +// let parser = ModuleParser::new(); +// let tokens = Lexer::new(input, false); - trace!( - "Tokens: {:?}", - tokens.clone().collect::, _>>() - ); +// trace!( +// "Tokens: {:?}", +// tokens.clone().collect::, _>>() +// ); - match parser.parse(tokens) { - Ok(val) => Ok(val), - Err(err) => Err(ShellError::parse_error(err)), - } -} +// match parser.parse(tokens) { +// Ok(val) => Ok(val), +// Err(err) => Err(ShellError::parse_error(err)), +// } +// } -#[cfg(test)] -mod tests { - use super::*; - use crate::parser::ast::Pipeline; - use pretty_assertions::assert_eq; +// #[cfg(test)] +// mod tests { +// use super::*; +// use crate::parser::ast::Pipeline; +// use pretty_assertions::assert_eq; - fn assert_parse(source: &str, expected: Pipeline) { - let parsed = match parse(source) { - Ok(p) => p, - Err(ShellError::Diagnostic(diag)) => { - use language_reporting::termcolor; +// fn assert_parse(source: &str, expected: Pipeline) { +// let parsed = match parse(source) { +// Ok(p) => p, +// Err(ShellError::Diagnostic(diag)) => { +// use language_reporting::termcolor; - let writer = termcolor::StandardStream::stdout(termcolor::ColorChoice::Auto); - let files = crate::parser::span::Files::new(source.to_string()); +// let writer = termcolor::StandardStream::stdout(termcolor::ColorChoice::Auto); +// let files = crate::parser::span::Files::new(source.to_string()); - language_reporting::emit( - &mut writer.lock(), - &files, - &diag.diagnostic, - &language_reporting::DefaultConfig, - ) - .unwrap(); +// language_reporting::emit( +// &mut writer.lock(), +// &files, +// &diag.diagnostic, +// &language_reporting::DefaultConfig, +// ) +// .unwrap(); - panic!("Test failed") - } - Err(err) => panic!("Something went wrong during parse: {:#?}", err), - }; +// panic!("Test failed") +// } +// Err(err) => panic!("Something went wrong during parse: {:#?}", err), +// }; - let printed = parsed.print(); +// let printed = parsed.print(); - assert_eq!(parsed, expected); - assert_eq!(printed, source); +// assert_eq!(parsed, expected); +// assert_eq!(printed, source); - let span = expected.span; +// let span = expected.span; - let expected_module = ModuleBuilder::spanned_items( - vec![Spanned::from_item(RawItem::Expression(expected), span)], - span.start, - span.end, - ); +// let expected_module = ModuleBuilder::spanned_items( +// vec![Spanned::from_item(RawItem::Expression(expected), span)], +// span.start, +// span.end, +// ); - assert_parse_module(source, expected_module); - } +// assert_parse_module(source, expected_module); +// } - fn assert_parse_module(source: &str, expected: Module) { - let parsed = match parse_module(source) { - Ok(p) => p, - Err(ShellError::Diagnostic(diag)) => { - use language_reporting::termcolor; +// fn assert_parse_module(source: &str, expected: Module) { +// let parsed = match parse_module(source) { +// Ok(p) => p, +// Err(ShellError::Diagnostic(diag)) => { +// use language_reporting::termcolor; - let writer = termcolor::StandardStream::stdout(termcolor::ColorChoice::Auto); - let files = crate::parser::span::Files::new(source.to_string()); +// let writer = termcolor::StandardStream::stdout(termcolor::ColorChoice::Auto); +// let files = crate::parser::span::Files::new(source.to_string()); - language_reporting::emit( - &mut writer.lock(), - &files, - &diag.diagnostic, - &language_reporting::DefaultConfig, - ) - .unwrap(); +// language_reporting::emit( +// &mut writer.lock(), +// &files, +// &diag.diagnostic, +// &language_reporting::DefaultConfig, +// ) +// .unwrap(); - panic!("Test failed") - } - Err(err) => panic!("Something went wrong during parse: {:#?}", err), - }; +// panic!("Test failed") +// } +// Err(err) => panic!("Something went wrong during parse: {:#?}", err), +// }; - let printed = parsed.print(); +// let printed = parsed.print(); - assert_eq!(parsed, expected); - assert_eq!(printed, source); - } +// assert_eq!(parsed, expected); +// assert_eq!(printed, source); +// } - macro_rules! commands { - ( $( ( $name:tt $( $command:ident ( $arg:expr ) )* ) )|* ) => {{ - use $crate::parser::ast::{Expression, ExpressionBuilder}; - let mut builder = crate::parser::ast::ExpressionBuilder::new(); +// macro_rules! commands { +// ( $( ( $name:tt $( $command:ident ( $arg:expr ) )* ) )|* ) => {{ +// use $crate::parser::ast::{Expression, ExpressionBuilder}; +// let mut builder = crate::parser::ast::ExpressionBuilder::new(); - builder.pipeline(vec![ - $( - (command!($name $($command($arg))*) as (&dyn Fn(&mut ExpressionBuilder) -> Expression)) - ),* - ]) - }} - } +// builder.pipeline(vec![ +// $( +// (command!($name $($command($arg))*) as (&dyn Fn(&mut ExpressionBuilder) -> Expression)) +// ),* +// ]) +// }} +// } - macro_rules! command { - ($name:ident) => { - &|b: &mut $crate::parser::ast::ExpressionBuilder| b.call(( - &|b: &mut $crate::parser::ast::ExpressionBuilder| b.bare(stringify!($name)), - vec![] - )) - }; +// macro_rules! command { +// ($name:ident) => { +// &|b: &mut $crate::parser::ast::ExpressionBuilder| b.call(( +// &|b: &mut $crate::parser::ast::ExpressionBuilder| b.bare(stringify!($name)), +// vec![] +// )) +// }; - ($name:ident $( $command:ident ( $body:expr ) )*) => {{ - use $crate::parser::ast::{Expression, ExpressionBuilder}; - &|b: &mut ExpressionBuilder| b.call(( - (&|b: &mut ExpressionBuilder| b.bare(stringify!($name))) as (&dyn Fn(&mut ExpressionBuilder) -> Expression), - vec![$( (&|b: &mut ExpressionBuilder| b.$command($body)) as &dyn Fn(&mut ExpressionBuilder) -> Expression ),* ])) +// ($name:ident $( $command:ident ( $body:expr ) )*) => {{ +// use $crate::parser::ast::{Expression, ExpressionBuilder}; +// &|b: &mut ExpressionBuilder| b.call(( +// (&|b: &mut ExpressionBuilder| b.bare(stringify!($name))) as (&dyn Fn(&mut ExpressionBuilder) -> Expression), +// vec![$( (&|b: &mut ExpressionBuilder| b.$command($body)) as &dyn Fn(&mut ExpressionBuilder) -> Expression ),* ])) - }}; +// }}; - ($name:ident $( $command:ident ( $body:expr ) )*) => { - &|b: &mut $crate::parser::ast::ExpressionBuilder| b.call(|b| b.bare(stringify!($name)), vec![ $( |b| b.$command($body) ),* ]) - }; +// ($name:ident $( $command:ident ( $body:expr ) )*) => { +// &|b: &mut $crate::parser::ast::ExpressionBuilder| b.call(|b| b.bare(stringify!($name)), vec![ $( |b| b.$command($body) ),* ]) +// }; - ($name:tt $( $command:ident ( $body:expr ) )*) => { - &|b: &mut $crate::parser::ast::ExpressionBuilder| b.call((&|b| b.bare($name), vec![ $( &|b| b.$command($body) ),* ])) - }; - } +// ($name:tt $( $command:ident ( $body:expr ) )*) => { +// &|b: &mut $crate::parser::ast::ExpressionBuilder| b.call((&|b| b.bare($name), vec![ $( &|b| b.$command($body) ),* ])) +// }; +// } - #[test] - fn parse_simple_command() { - assert_parse("ls", commands![(ls)]); - } +// #[test] +// fn parse_simple_command() { +// assert_parse("ls", commands![(ls)]); +// } - #[test] - fn parse_command_with_args() { - assert_parse( - r#"open Cargo.toml | select package.authors | split-row " ""#, - commands![ - (open bare("Cargo.toml")) - | (select bare("package.authors")) - | ("split-row" string(" ")) - ], - ); +// #[test] +// fn parse_command_with_args() { +// assert_parse( +// r#"open Cargo.toml | select package.authors | split-row " ""#, +// commands![ +// (open bare("Cargo.toml")) +// | (select bare("package.authors")) +// | ("split-row" string(" ")) +// ], +// ); - assert_parse(r#"git add ."#, commands![("git" bare("add") bare("."))]); +// assert_parse(r#"git add ."#, commands![("git" bare("add") bare("."))]); - assert_parse( - "open Cargo.toml | select package.version | echo $it", - commands![ - (open bare("Cargo.toml")) - | (select bare("package.version")) - | (echo var("it")) - ], - ); +// assert_parse( +// "open Cargo.toml | select package.version | echo $it", +// commands![ +// (open bare("Cargo.toml")) +// | (select bare("package.version")) +// | (echo var("it")) +// ], +// ); - assert_parse( - "open Cargo.toml --raw", - commands![(open bare("Cargo.toml") flag("raw"))], - ); +// assert_parse( +// "open Cargo.toml --raw", +// commands![(open bare("Cargo.toml") flag("raw"))], +// ); - assert_parse( - "open Cargo.toml -r", - commands![(open bare("Cargo.toml") shorthand("r"))], - ); +// assert_parse( +// "open Cargo.toml -r", +// commands![(open bare("Cargo.toml") shorthand("r"))], +// ); - assert_parse( - "open Cargo.toml | from-toml | to-toml", - commands![(open bare("Cargo.toml")) | ("from-toml") | ("to-toml")], - ); +// assert_parse( +// "open Cargo.toml | from-toml | to-toml", +// commands![(open bare("Cargo.toml")) | ("from-toml") | ("to-toml")], +// ); - assert_parse( - r#"config --get "ignore dups" | format-list"#, - commands![(config flag("get") string("ignore dups")) | ("format-list")], - ); +// assert_parse( +// r#"config --get "ignore dups" | format-list"#, +// commands![(config flag("get") string("ignore dups")) | ("format-list")], +// ); - assert_parse( - "open Cargo.toml | from-toml | select dependencies | column serde", - commands![ - (open bare("Cargo.toml")) - | ("from-toml") - | (select bare("dependencies")) - | (column bare("serde")) - ], - ); +// assert_parse( +// "open Cargo.toml | from-toml | select dependencies | column serde", +// commands![ +// (open bare("Cargo.toml")) +// | ("from-toml") +// | (select bare("dependencies")) +// | (column bare("serde")) +// ], +// ); - assert_parse( - "config --set tabs 2", - commands![(config flag("set") bare("tabs") int(2))], - ); +// assert_parse( +// "config --set tabs 2", +// commands![(config flag("set") bare("tabs") int(2))], +// ); - assert_parse( - r#"ls | skip 1 | first 2 | select "file name" | rm $it"#, - commands![ - (ls) - | (skip int(1)) - | (first int(2)) - | (select string("file name")) - | (rm var("it")) - ], - ); +// assert_parse( +// r#"ls | skip 1 | first 2 | select "file name" | rm $it"#, +// commands![ +// (ls) +// | (skip int(1)) +// | (first int(2)) +// | (select string("file name")) +// | (rm var("it")) +// ], +// ); - assert_parse( - r#"git branch --merged | split-row "`n" | where $it != "* master""#, - commands![ - // TODO: Handle escapes correctly. Should we do ` escape because of paths? - (git bare("branch") flag("merged")) | ("split-row" string("`n")) | (where binary((&|b| b.var("it"), &|b| b.op("!="), &|b| b.string("* master")))) - ], - ); +// assert_parse( +// r#"git branch --merged | split-row "`n" | where $it != "* master""#, +// commands![ +// // TODO: Handle escapes correctly. Should we do ` escape because of paths? +// (git bare("branch") flag("merged")) | ("split-row" string("`n")) | (where binary((&|b| b.var("it"), &|b| b.op("!="), &|b| b.string("* master")))) +// ], +// ); - assert_parse( - r#"open input2.json | from-json | select glossary.GlossDiv.GlossList.GlossEntry.GlossDef.GlossSeeAlso | where $it > "GML""#, - commands![ - (open bare("input2.json")) - | ("from-json") - | (select bare("glossary.GlossDiv.GlossList.GlossEntry.GlossDef.GlossSeeAlso")) - | (where binary((&|b| b.var("it"), &|b| b.op(">"), &|b| b.string("GML")))) - ] - ); +// assert_parse( +// r#"open input2.json | from-json | select glossary.GlossDiv.GlossList.GlossEntry.GlossDef.GlossSeeAlso | where $it > "GML""#, +// commands![ +// (open bare("input2.json")) +// | ("from-json") +// | (select bare("glossary.GlossDiv.GlossList.GlossEntry.GlossDef.GlossSeeAlso")) +// | (where binary((&|b| b.var("it"), &|b| b.op(">"), &|b| b.string("GML")))) +// ] +// ); - assert_parse( - r"cd ..\.cargo\", - commands![ - (cd bare(r"..\.cargo\")) - ], - ); +// assert_parse( +// r"cd ..\.cargo\", +// commands![ +// (cd bare(r"..\.cargo\")) +// ], +// ); - assert_parse( - "ls | where size < 1KB", - commands![ - (ls) | (where binary((&|b| b.bare("size"), &|b| b.op("<"), &|b| b.unit((1, "KB"))))) - ], - ); +// assert_parse( +// "ls | where size < 1KB", +// commands![ +// (ls) | (where binary((&|b| b.bare("size"), &|b| b.op("<"), &|b| b.unit((1, "KB"))))) +// ], +// ); - assert_parse( - "ls | where { $it.size > 100 }", - commands![ - (ls) | (where block(&|b| b.binary((&|b| b.path((&|b| b.var("it"), vec!["size"])), &|b| b.op(">"), &|b| b.int(100))))) - ], - ) - } +// assert_parse( +// "ls | where { $it.size > 100 }", +// commands![ +// (ls) | (where block(&|b| b.binary((&|b| b.path((&|b| b.var("it"), vec!["size"])), &|b| b.op(">"), &|b| b.int(100))))) +// ], +// ) +// } - use crate::parser::ast::{ModuleBuilder, RawItem}; - use crate::parser::lexer::Spanned; +// use crate::parser::ast::{ModuleBuilder, RawItem}; +// use crate::parser::lexer::Spanned; -} +// } diff --git a/src/parser/hir.rs b/src/parser/hir.rs new file mode 100644 index 0000000000..0b7e90cdc5 --- /dev/null +++ b/src/parser/hir.rs @@ -0,0 +1,93 @@ +crate mod baseline_parse; +crate mod baseline_parse_tokens; +crate mod binary; +crate mod named; +crate mod path; + +use crate::parser::{Span, Spanned, Unit}; +use derive_new::new; +use getset::Getters; + +crate use baseline_parse::baseline_parse_single_token; +crate use baseline_parse_tokens::{ + baseline_parse_next_expr, ExpressionKindHint, +}; +crate use binary::Binary; +crate use named::NamedArguments; +crate use path::Path; + +#[derive(Debug, Clone, Eq, PartialEq, Getters, new)] +pub struct Call { + #[get = "crate"] + head: Box, + #[get = "crate"] + positional: Option>, + #[get = "crate"] + named: Option, +} + +#[derive(Debug, Clone, Eq, PartialEq, Ord, PartialOrd, Hash)] +pub enum RawExpression { + Literal(Literal), + Variable(Variable), + Binary(Box), + Block(Box), + Path(Box), + + #[allow(unused)] + Boolean(bool), +} + +pub type Expression = Spanned; + +impl Expression { + fn int(i: impl Into, span: impl Into) -> Expression { + Spanned::from_item(RawExpression::Literal(Literal::Integer(i.into())), span) + } + + fn size(i: impl Into, unit: impl Into, span: impl Into) -> Expression { + Spanned::from_item( + RawExpression::Literal(Literal::Size(i.into(), unit.into())), + span, + ) + } + + fn string(inner: impl Into, outer: impl Into) -> Expression { + Spanned::from_item( + RawExpression::Literal(Literal::String(inner.into())), + outer.into(), + ) + } + + fn bare(span: impl Into) -> Expression { + Spanned::from_item(RawExpression::Literal(Literal::Bare), span.into()) + } + + fn variable(inner: impl Into, outer: impl Into) -> Expression { + Spanned::from_item( + RawExpression::Variable(Variable::Other(inner.into())), + outer.into(), + ) + } + + fn it_variable(inner: impl Into, outer: impl Into) -> Expression { + Spanned::from_item( + RawExpression::Variable(Variable::It(inner.into())), + outer.into(), + ) + } +} + +#[derive(Debug, Clone, Copy, Eq, PartialEq, Ord, PartialOrd, Hash)] +pub enum Literal { + Integer(i64), + Size(i64, Unit), + String(Span), + Bare, +} + +#[derive(Debug, Clone, Eq, PartialEq, Ord, PartialOrd, Hash)] +pub enum Variable { + It(Span), + Other(Span), +} diff --git a/src/parser/hir/baseline_parse.rs b/src/parser/hir/baseline_parse.rs new file mode 100644 index 0000000000..1150434fcb --- /dev/null +++ b/src/parser/hir/baseline_parse.rs @@ -0,0 +1,30 @@ +use crate::errors::ShellError; +use crate::parser::{hir, CommandRegistry, RawToken, Token, TokenNode}; + +// pub fn baseline_parse_token( +// token_node: TokenNode, +// _registry: &dyn CommandRegistry, +// ) -> Result { +// match token_node { +// TokenNode::Token(token) => Ok(baseline_parse_single_token(token)), +// TokenNode::Call(_call) => Err(ShellError::unimplemented("baseline_parse Call")), +// TokenNode::Delimited(_delimited) => { +// Err(ShellError::unimplemented("baseline_parse Delimited")) +// } +// TokenNode::Pipeline(_pipeline) => Err(ShellError::unimplemented("baseline_parse Pipeline")), +// TokenNode::Path(_path) => Err(ShellError::unimplemented("baseline_parse Path")), +// } +// } + +pub fn baseline_parse_single_token(token: &Token, source: &str) -> hir::Expression { + match *token.item() { + RawToken::Integer(int) => hir::Expression::int(int, token.span), + RawToken::Size(int, unit) => hir::Expression::size(int, unit, token.span), + RawToken::String(span) => hir::Expression::string(span, token.span), + RawToken::Variable(span) if span.slice(source) == "it" => { + hir::Expression::it_variable(span, token.span) + } + RawToken::Variable(span) => hir::Expression::variable(span, token.span), + RawToken::Bare => hir::Expression::bare(token.span), + } +} diff --git a/src/parser/hir/baseline_parse_tokens.rs b/src/parser/hir/baseline_parse_tokens.rs new file mode 100644 index 0000000000..4cf8ae86bb --- /dev/null +++ b/src/parser/hir/baseline_parse_tokens.rs @@ -0,0 +1,177 @@ +use crate::errors::ShellError; +use crate::parser::registry::CommandRegistry; +use crate::parser::{hir, hir::baseline_parse_single_token, Span, Spanned, TokenNode}; + +pub fn baseline_parse_tokens( + token_nodes: &[TokenNode], + registry: &dyn CommandRegistry, + source: &str, +) -> Result, ShellError> { + let mut exprs: Vec = vec![]; + let mut rest = token_nodes; + + loop { + if rest.len() == 0 { + break; + } + + let (expr, remainder) = baseline_parse_next_expr(rest, registry, source, None)?; + exprs.push(expr); + rest = remainder; + } + + Ok(exprs) +} + +#[derive(Debug)] +pub enum ExpressionKindHint { + Literal, + Variable, + Binary, + Block, + Boolean, +} + +pub fn baseline_parse_next_expr( + token_nodes: &'nodes [TokenNode], + _registry: &dyn CommandRegistry, + source: &str, + coerce_hint: Option, +) -> Result<(hir::Expression, &'nodes [TokenNode]), ShellError> { + println!( + "baseline_parse_next_expr {:?} - {:?}", + token_nodes, coerce_hint + ); + + let mut tokens = token_nodes.iter().peekable(); + + let first = next_token(&mut tokens); + + let first = match first { + None => return Err(ShellError::unimplemented("Expected token, found none")), + Some(token) => baseline_parse_semantic_token(token, source)?, + }; + + let possible_op = tokens.peek(); + + let op = match possible_op { + Some(TokenNode::Operator(op)) => op, + _ => return Ok((first, &token_nodes[1..])), + }; + + tokens.next(); + + let second = match tokens.next() { + None => { + return Err(ShellError::unimplemented( + "Expected op followed by another expr, found nothing", + )) + } + Some(token) => baseline_parse_semantic_token(token, source)?, + }; + + // We definitely have a binary expression here -- let's see if we should coerce it into a block + + match coerce_hint { + None => { + let span = (first.span.start, second.span.end); + let binary = hir::Binary::new(first, *op, second); + let binary = hir::RawExpression::Binary(Box::new(binary)); + let binary = Spanned::from_item(binary, span); + + Ok((binary, &token_nodes[3..])) + } + + Some(hint) => match hint { + ExpressionKindHint::Block => { + let span = (first.span.start, second.span.end); + + let string: Spanned = match first { + Spanned { + item: hir::RawExpression::Literal(hir::Literal::Bare), + span, + } => Spanned::from_item(span.slice(source).to_string(), span), + Spanned { + item: hir::RawExpression::Literal(hir::Literal::String(inner)), + span, + } => Spanned::from_item(inner.slice(source).to_string(), span), + _ => { + return Err(ShellError::unimplemented( + "The first part of a block must be a string", + )) + } + }; + + let path = hir::Path::new( + Spanned::from_item( + // TODO: Deal with synthetic nodes that have no representation at all in source + hir::RawExpression::Variable(hir::Variable::It(Span::from((0, 0)))), + (0, 0), + ), + vec![string], + ); + let path = hir::RawExpression::Path(Box::new(path)); + let path = Spanned::from_item(path, first.span); + + let binary = hir::Binary::new(path, *op, second); + let binary = hir::RawExpression::Binary(Box::new(binary)); + let binary = Spanned::from_item(binary, span); + + let block = hir::RawExpression::Block(Box::new(binary)); + let block = Spanned::from_item(block, span); + + Ok((block, &token_nodes[3..])) + } + + other => unimplemented!("coerce hint {:?}", other), + }, + } +} + +pub fn baseline_parse_semantic_token( + token: &TokenNode, + source: &str, +) -> Result { + match token { + TokenNode::Token(token) => Ok(baseline_parse_single_token(token, source)), + TokenNode::Call(call) => unimplemented!(), + TokenNode::Delimited(delimited) => unimplemented!(), + TokenNode::Pipeline(pipeline) => unimplemented!(), + TokenNode::Operator(_op) => unreachable!(), + TokenNode::Flag(flag) => unimplemented!(), + TokenNode::Identifier(_span) => unreachable!(), + TokenNode::Whitespace(_span) => unreachable!(), + TokenNode::Error(error) => Err(*error.item.clone()), + TokenNode::Path(path) => unimplemented!(), + } +} + +fn next_token(nodes: &mut impl Iterator) -> Option<&'a TokenNode> { + loop { + match nodes.next() { + Some(TokenNode::Whitespace(_)) => continue, + other => return other, + } + } +} + +fn baseline_parse_token( + token_node: &TokenNode, + _registry: &dyn CommandRegistry, + source: &str, +) -> Result { + match token_node { + TokenNode::Token(token) => Ok(hir::baseline_parse_single_token(token, source)), + TokenNode::Call(_call) => Err(ShellError::unimplemented("baseline_parse Call")), + TokenNode::Delimited(_delimited) => { + Err(ShellError::unimplemented("baseline_parse Delimited")) + } + TokenNode::Pipeline(_pipeline) => Err(ShellError::unimplemented("baseline_parse Pipeline")), + TokenNode::Path(_path) => Err(ShellError::unimplemented("baseline_parse Path")), + TokenNode::Operator(_op) => Err(ShellError::unimplemented("baseline_parse Operator")), + TokenNode::Flag(_op) => Err(ShellError::unimplemented("baseline_parse Flag")), + TokenNode::Identifier(_op) => Err(ShellError::unimplemented("baseline_parse Identifier")), + TokenNode::Whitespace(_op) => Err(ShellError::unimplemented("baseline_parse Whitespace")), + TokenNode::Error(err) => Err(*err.item.clone()), + } +} diff --git a/src/parser/hir/binary.rs b/src/parser/hir/binary.rs new file mode 100644 index 0000000000..315964ed5f --- /dev/null +++ b/src/parser/hir/binary.rs @@ -0,0 +1,11 @@ +use crate::parser::{hir::Expression, Operator, Spanned}; +use derive_new::new; +use getset::Getters; + +#[derive(Debug, Clone, Eq, PartialEq, Ord, PartialOrd, Hash, Getters, new)] +#[get = "crate"] +pub struct Binary { + left: Expression, + op: Spanned, + right: Expression, +} diff --git a/src/parser/hir/named.rs b/src/parser/hir/named.rs new file mode 100644 index 0000000000..07c6db655e --- /dev/null +++ b/src/parser/hir/named.rs @@ -0,0 +1,44 @@ +use crate::parser::hir::Expression; +use crate::parser::{Flag, Span}; +use derive_new::new; +use indexmap::IndexMap; +use log::trace; + +#[derive(Debug, Clone, Eq, PartialEq)] +pub enum NamedValue { + AbsentSwitch, + PresentSwitch(Span), + AbsentValue, + Value(Expression), +} + +#[derive(Debug, Clone, Eq, PartialEq, new)] +pub struct NamedArguments { + #[new(default)] + crate named: IndexMap, +} + +impl NamedArguments { + pub fn insert_switch(&mut self, name: impl Into, switch: Option) { + let name = name.into(); + trace!("Inserting switch -- {} = {:?}", name, switch); + + match switch { + None => self.named.insert(name.into(), NamedValue::AbsentSwitch), + Some(flag) => self + .named + .insert(name, NamedValue::PresentSwitch(*flag.name())), + }; + } + + pub fn insert_optional(&mut self, name: impl Into, expr: Option) { + match expr { + None => self.named.insert(name.into(), NamedValue::AbsentValue), + Some(expr) => self.named.insert(name.into(), NamedValue::Value(expr)), + }; + } + + pub fn insert_mandatory(&mut self, name: impl Into, expr: Expression) { + self.named.insert(name.into(), NamedValue::Value(expr)); + } +} diff --git a/src/parser/hir/path.rs b/src/parser/hir/path.rs new file mode 100644 index 0000000000..132f3112b8 --- /dev/null +++ b/src/parser/hir/path.rs @@ -0,0 +1,10 @@ +use crate::parser::{hir::Expression, Operator, Spanned}; +use derive_new::new; +use getset::Getters; + +#[derive(Debug, Clone, Eq, PartialEq, Ord, PartialOrd, Hash, Getters, new)] +#[get = "crate"] +pub struct Path { + head: Expression, + tail: Vec>, +} diff --git a/src/parser/parse2.rs b/src/parser/parse2.rs index 9d2e522c98..b841c4e5fa 100644 --- a/src/parser/parse2.rs +++ b/src/parser/parse2.rs @@ -1,9 +1,14 @@ +crate mod call_node; +crate mod files; crate mod flag; crate mod operator; crate mod parser; crate mod span; +crate mod text; crate mod token_tree; crate mod token_tree_builder; crate mod tokens; crate mod unit; crate mod util; + +crate use token_tree::{PipelineElement, TokenNode}; diff --git a/src/parser/parse2/call_node.rs b/src/parser/parse2/call_node.rs new file mode 100644 index 0000000000..eab5c8f328 --- /dev/null +++ b/src/parser/parse2/call_node.rs @@ -0,0 +1,26 @@ +use crate::parser::TokenNode; +use getset::Getters; + +#[derive(Debug, Clone, Eq, PartialEq, Ord, PartialOrd, Getters)] +pub struct CallNode { + #[get = "crate"] + head: Box, + #[get = "crate"] + children: Option>, +} + +impl CallNode { + pub fn new(head: Box, children: Vec) -> CallNode { + if children.len() == 0 { + CallNode { + head, + children: None, + } + } else { + CallNode { + head, + children: Some(children), + } + } + } +} diff --git a/src/parser/parse2/files.rs b/src/parser/parse2/files.rs new file mode 100644 index 0000000000..c606055f6c --- /dev/null +++ b/src/parser/parse2/files.rs @@ -0,0 +1,77 @@ +use crate::parser::parse2::span::Span; +use derive_new::new; +use language_reporting::{FileName, Location}; + +#[derive(new, Debug, Clone)] +pub struct Files { + snippet: String, +} + +impl language_reporting::ReportingFiles for Files { + type Span = Span; + type FileId = usize; + + fn byte_span( + &self, + _file: Self::FileId, + from_index: usize, + to_index: usize, + ) -> Option { + Some(Span::from((from_index, to_index))) + } + fn file_id(&self, _span: Self::Span) -> Self::FileId { + 0 + } + fn file_name(&self, _file: Self::FileId) -> FileName { + FileName::Verbatim(format!("")) + } + fn byte_index(&self, _file: Self::FileId, _line: usize, _column: usize) -> Option { + unimplemented!("byte_index") + } + fn location(&self, _file: Self::FileId, byte_index: usize) -> Option { + let source = &self.snippet; + let mut seen_lines = 0; + let mut seen_bytes = 0; + + for (pos, _) in source.match_indices('\n') { + if pos > byte_index { + return Some(language_reporting::Location::new( + seen_lines, + byte_index - seen_bytes, + )); + } else { + seen_lines += 1; + seen_bytes = pos; + } + } + + if seen_lines == 0 { + Some(language_reporting::Location::new(0, byte_index)) + } else { + None + } + } + fn line_span(&self, _file: Self::FileId, lineno: usize) -> Option { + let source = &self.snippet; + let mut seen_lines = 0; + let mut seen_bytes = 0; + + for (pos, _) in source.match_indices('\n') { + if seen_lines == lineno { + return Some(Span::from((seen_bytes, pos))); + } else { + seen_lines += 1; + seen_bytes = pos + 1; + } + } + + if seen_lines == 0 { + Some(Span::from((0, self.snippet.len() - 1))) + } else { + None + } + } + fn source(&self, span: Self::Span) -> Option { + Some(self.snippet[span.start..span.end].to_string()) + } +} diff --git a/src/parser/parse2/flag.rs b/src/parser/parse2/flag.rs index 0d255e4515..3b587c3354 100644 --- a/src/parser/parse2/flag.rs +++ b/src/parser/parse2/flag.rs @@ -1,7 +1,17 @@ +use crate::parser::Span; +use derive_new::new; +use getset::Getters; use serde_derive::{Deserialize, Serialize}; #[derive(Debug, Clone, Copy, PartialEq, Eq, PartialOrd, Ord, Hash, Deserialize, Serialize)] -pub enum Flag { +pub enum FlagKind { Shorthand, Longhand, } + +#[derive(Debug, Clone, Copy, PartialEq, Eq, PartialOrd, Ord, Hash, Getters, new)] +#[get = "crate"] +pub struct Flag { + kind: FlagKind, + name: Span, +} diff --git a/src/parser/parse2/operator.rs b/src/parser/parse2/operator.rs index 89275afd74..c5ce66bfd8 100644 --- a/src/parser/parse2/operator.rs +++ b/src/parser/parse2/operator.rs @@ -12,6 +12,7 @@ pub enum Operator { } impl Operator { + #[allow(unused)] pub fn print(&self) -> String { self.as_str().to_string() } diff --git a/src/parser/parse2/parser.rs b/src/parser/parse2/parser.rs index 5a2f6cc130..4a9a134338 100644 --- a/src/parser/parse2/parser.rs +++ b/src/parser/parse2/parser.rs @@ -1,28 +1,43 @@ #![allow(unused)] use crate::parser::parse2::{ - flag::*, operator::*, span::*, token_tree::*, token_tree_builder::*, tokens::*, unit::*, + call_node::*, flag::*, operator::*, span::*, token_tree::*, token_tree_builder::*, tokens::*, + unit::*, }; use nom; +use nom::branch::*; +use nom::bytes::complete::*; +use nom::character::complete::*; +use nom::combinator::*; +use nom::multi::*; +use nom::sequence::*; + +use log::trace; use nom::dbg; -use nom::types::CompleteStr; use nom::*; +use nom::{AsBytes, FindSubstring, IResult, InputLength, InputTake, Slice}; use nom_locate::{position, LocatedSpan}; +use std::fmt::Debug; use std::str::FromStr; -type NomSpan<'a> = LocatedSpan>; +pub type NomSpan<'a> = LocatedSpan<&'a str>; + +pub fn nom_input(s: &'a str) -> NomSpan<'a> { + LocatedSpan::new(s) +} macro_rules! operator { ($name:tt : $token:tt ) => { - named!($name( NomSpan ) -> TokenNode, - do_parse!( - l: position!() - >> t: tag!(stringify!($token)) - >> r: position!() - >> (TokenTreeBuilder::spanned_op(t.fragment.0, (l, r))) - // >> (Spanned::from_nom(RawToken::Operator(Operator::from_str(t.fragment.0).unwrap()), l, r)) - ) - ); + pub fn $name(input: NomSpan) -> IResult { + let start = input.offset; + let (input, tag) = tag(stringify!($token))(input)?; + let end = input.offset; + + Ok(( + input, + TokenTreeBuilder::spanned_op(tag.fragment, (start, end)), + )) + } }; } @@ -33,195 +48,423 @@ operator! { lte: <= } operator! { eq: == } operator! { neq: != } -named!(pub raw_integer( NomSpan ) -> Spanned, - do_parse!( - l: position!() - >> neg: opt!(tag!("-")) - >> num: digit1 - >> r: position!() - >> (Spanned::from_nom(int(num.fragment.0, neg), l, r)) +fn trace_step<'a, T: Debug>( + input: NomSpan<'a>, + name: &str, + block: impl FnOnce(NomSpan<'a>) -> IResult, T>, +) -> IResult, T> { + trace!("+ before {} @ {:?}", name, input); + match block(input) { + Ok((input, result)) => { + trace!("after {} @ {:?} -> {:?}", name, input, result); + Ok((input, result)) + } + + Err(e) => { + trace!("- failed {} :: {:?}", name, e); + Err(e) + } + } +} + +pub fn raw_integer(input: NomSpan) -> IResult> { + let start = input.offset; + trace_step(input, "raw_integer", move |input| { + let (input, neg) = opt(tag("-"))(input)?; + println!("(input,neg) = {:?} {:?}", input, neg); + let (input, num) = digit1(input)?; + println!("(input,num) = {:?} {:?}", input, num); + let end = input.offset; + + Ok(( + input, + Spanned::from_item(int(num.fragment, neg), (start, end)), + )) + }) +} + +pub fn integer(input: NomSpan) -> IResult { + trace_step(input, "integer", move |input| { + let (input, int) = raw_integer(input)?; + + Ok((input, TokenTreeBuilder::spanned_int(*int, int.span))) + }) +} + +pub fn operator(input: NomSpan) -> IResult { + trace_step(input, "operator", |input| { + let (input, operator) = alt((gte, lte, neq, gt, lt, eq))(input)?; + + Ok((input, operator)) + }) +} + +pub fn dq_string(input: NomSpan) -> IResult { + trace_step(input, "dq_string", |input| { + let start = input.offset; + let (input, _) = char('"')(input)?; + let start1 = input.offset; + let (input, _) = many0(none_of("\""))(input)?; + let end1 = input.offset; + let (input, _) = char('"')(input)?; + let end = input.offset; + Ok(( + input, + TokenTreeBuilder::spanned_string((start1, end1), (start, end)), + )) + }) +} + +pub fn sq_string(input: NomSpan) -> IResult { + trace_step(input, "sq_string", move |input| { + let start = input.offset; + let (input, _) = char('\'')(input)?; + let start1 = input.offset; + let (input, _) = many0(none_of("\'"))(input)?; + let end1 = input.offset; + let (input, _) = char('\'')(input)?; + let end = input.offset; + + Ok(( + input, + TokenTreeBuilder::spanned_string((start1, end1), (start, end)), + )) + }) +} + +pub fn string(input: NomSpan) -> IResult { + trace_step(input, "string", move |input| { + alt((sq_string, dq_string))(input) + }) +} + +pub fn bare(input: NomSpan) -> IResult { + trace_step(input, "bare", move |input| { + let start = input.offset; + let (input, _) = take_while1(is_start_bare_char)(input)?; + let (input, _) = take_while(is_bare_char)(input)?; + let end = input.offset; + + Ok((input, TokenTreeBuilder::spanned_bare((start, end)))) + }) +} + +pub fn var(input: NomSpan) -> IResult { + trace_step(input, "var", move |input| { + let start = input.offset; + let (input, _) = tag("$")(input)?; + let (input, bare) = identifier(input)?; + let end = input.offset; + + Ok(( + input, + TokenTreeBuilder::spanned_var(bare.span(), (start, end)), + )) + }) +} + +// let start = input.offset; +// let (input, _) = take_while1(is_start_bare_char)(input)?; +// let (input, _) = take_while(is_bare_char)(input)?; +// let end = input.offset; + +// Ok((input, TokenTreeBuilder::spanned_bare((start, end)))) + +pub fn identifier(input: NomSpan) -> IResult { + trace_step(input, "identifier", move |input| { + let start = input.offset; + let (input, _) = take_while1(is_id_start)(input)?; + let (input, _) = take_while(is_id_continue)(input)?; + + let end = input.offset; + + Ok((input, TokenTreeBuilder::spanned_ident((start, end)))) + }) +} + +pub fn flag(input: NomSpan) -> IResult { + trace_step(input, "flag", move |input| { + let start = input.offset; + let (input, _) = tag("--")(input)?; + let (input, bare) = bare(input)?; + let end = input.offset; + + Ok(( + input, + TokenTreeBuilder::spanned_flag(bare.span(), (start, end)), + )) + }) +} + +pub fn shorthand(input: NomSpan) -> IResult { + trace_step(input, "shorthand", move |input| { + let start = input.offset; + let (input, _) = tag("-")(input)?; + let (input, bare) = bare(input)?; + let end = input.offset; + + Ok(( + input, + TokenTreeBuilder::spanned_shorthand(bare.span(), (start, end)), + )) + }) +} + +pub fn raw_unit(input: NomSpan) -> IResult> { + trace_step(input, "raw_unit", move |input| { + let start = input.offset; + let (input, unit) = alt(( + tag("B"), + tag("KB"), + tag("MB"), + tag("GB"), + tag("TB"), + tag("PB"), + ))(input)?; + let end = input.offset; + + Ok(( + input, + Spanned::from_item(Unit::from(unit.fragment), (start, end)), + )) + }) +} + +pub fn size(input: NomSpan) -> IResult { + trace_step(input, "size", move |input| { + let start = input.offset; + let (input, int) = raw_integer(input)?; + let (input, unit) = raw_unit(input)?; + let end = input.offset; + + Ok(( + input, + TokenTreeBuilder::spanned_size((*int, *unit), (start, end)), + )) + }) +} + +pub fn leaf(input: NomSpan) -> IResult { + trace_step(input, "leaf", move |input| { + println!("alt: {:?}", input); + let (input, node) = + alt((size, integer, string, operator, flag, shorthand, var, bare))(input)?; + + Ok((input, node)) + }) +} + +pub fn token_list(input: NomSpan) -> IResult> { + trace_step(input, "token_list", move |input| { + let (input, first) = node(input)?; + let (input, list) = many0(pair(space1, node))(input)?; + + Ok((input, make_token_list(None, first, list, None))) + }) +} + +pub fn spaced_token_list(input: NomSpan) -> IResult> { + trace_step(input, "spaced_token_list", move |input| { + let (input, sp_left) = opt(space1)(input)?; + let (input, first) = node(input)?; + let (input, list) = many0(pair(space1, node))(input)?; + let (input, sp_right) = opt(space1)(input)?; + + Ok((input, make_token_list(sp_left, first, list, sp_right))) + }) +} + +fn make_token_list( + sp_left: Option, + first: TokenNode, + list: Vec<(NomSpan, TokenNode)>, + sp_right: Option, +) -> Vec { + let mut nodes = vec![]; + + if let Some(sp_left) = sp_left { + nodes.push(TokenNode::Whitespace(Span::from(sp_left))); + } + + nodes.push(first); + + for (ws, token) in list { + nodes.push(TokenNode::Whitespace(Span::from(ws))); + nodes.push(token); + } + + if let Some(sp_right) = sp_right { + nodes.push(TokenNode::Whitespace(Span::from(sp_right))); + } + + nodes +} + +pub fn whitespace(input: NomSpan) -> IResult { + trace_step(input, "whitespace", move |input| { + let left = input.offset; + let (input, ws1) = space1(input)?; + let right = input.offset; + + Ok((input, TokenTreeBuilder::spanned_ws((left, right)))) + }) +} + +pub fn delimited_paren(input: NomSpan) -> IResult { + trace_step(input, "delimited_paren", move |input| { + let left = input.offset; + let (input, _) = char('(')(input)?; + let (input, ws1) = opt(whitespace)(input)?; + let (input, inner_items) = opt(token_list)(input)?; + let (input, ws2) = opt(whitespace)(input)?; + let (input, _) = char(')')(input)?; + let right = input.offset; + + let mut items = vec![]; + + if let Some(space) = ws1 { + items.push(space); + } + + if let Some(inner_items) = inner_items { + items.extend(inner_items); + } + + if let Some(space) = ws2 { + items.push(space); + } + + Ok(( + input, + TokenTreeBuilder::spanned_parens(items, (left, right)), + )) + }) +} + +pub fn delimited_square(input: NomSpan) -> IResult { + trace_step(input, "delimited_paren", move |input| { + let left = input.offset; + let (input, _) = char('[')(input)?; + let (input, ws1) = opt(whitespace)(input)?; + let (input, inner_items) = opt(token_list)(input)?; + let (input, ws2) = opt(whitespace)(input)?; + let (input, _) = char(']')(input)?; + let right = input.offset; + + let mut items = vec![]; + + if let Some(space) = ws1 { + items.push(space); + } + + if let Some(inner_items) = inner_items { + items.extend(inner_items); + } + + if let Some(space) = ws2 { + items.push(space); + } + + Ok(( + input, + TokenTreeBuilder::spanned_square(items, (left, right)), + )) + }) +} + +pub fn delimited_brace(input: NomSpan) -> IResult { + trace_step(input, "delimited_brace", move |input| { + let left = input.offset; + let (input, _) = char('{')(input)?; + let (input, _) = opt(space1)(input)?; + let (input, items) = opt(token_list)(input)?; + let (input, _) = opt(space1)(input)?; + let (input, _) = char('}')(input)?; + let right = input.offset; + + Ok(( + input, + TokenTreeBuilder::spanned_brace(items.unwrap_or_else(|| vec![]), (left, right)), + )) + }) +} + +pub fn raw_call(input: NomSpan) -> IResult> { + trace_step(input, "raw_call", move |input| { + let left = input.offset; + let (input, items) = token_list(input)?; + let right = input.offset; + + Ok((input, TokenTreeBuilder::spanned_call(items, (left, right)))) + }) +} + +pub fn path(input: NomSpan) -> IResult { + trace_step(input, "path", move |input| { + let left = input.offset; + let (input, head) = node1(input)?; + let (input, _) = tag(".")(input)?; + let (input, tail) = separated_list(tag("."), alt((identifier, string)))(input)?; + let right = input.offset; + + Ok(( + input, + TokenTreeBuilder::spanned_path((head, tail), (left, right)), + )) + }) +} + +pub fn node1(input: NomSpan) -> IResult { + trace_step(input, "node1", alt((leaf, delimited_paren))) +} + +pub fn node(input: NomSpan) -> IResult { + trace_step( + input, + "node", + alt(( + path, + leaf, + delimited_paren, + delimited_brace, + delimited_square, + )), ) -); +} -named!(pub integer( NomSpan ) -> TokenNode, - do_parse!( - int: raw_integer - >> (TokenTreeBuilder::spanned_int(*int, int.span)) - ) -); +pub fn pipeline(input: NomSpan) -> IResult { + trace_step(input, "pipeline", |input| { + let start = input.offset; + let (input, head) = tuple((raw_call, opt(space1)))(input)?; + let (input, items) = trace_step( + input, + "many0", + many0(tuple((tag("|"), opt(space1), raw_call, opt(space1)))), + )?; + let end = input.offset; -named!(pub operator( NomSpan ) -> TokenNode, - alt!( - gte | lte | neq | gt | lt | eq - ) -); + Ok(( + input, + TokenTreeBuilder::spanned_pipeline(make_call_list(head, items), (start, end)), + )) + }) +} -named!(pub dq_string( NomSpan ) -> TokenNode, - do_parse!( - l: position!() - >> char!('"') - >> l1: position!() - >> many0!(none_of!("\"")) - >> r1: position!() - >> char!('"') - >> r: position!() - >> (TokenTreeBuilder::spanned_string((l1, r1), (l, r))) - ) -); +fn make_call_list( + head: (Spanned, Option), + tail: Vec<(NomSpan, Option, Spanned, Option)>, +) -> Vec { + let mut out = vec![]; + let el = PipelineElement::new(None, head.0, head.1.map(Span::from)); + out.push(el); -named!(pub sq_string( NomSpan ) -> TokenNode, - do_parse!( - l: position!() - >> char!('\'') - >> l1: position!() - >> many0!(none_of!("'")) - >> r1: position!() - >> char!('\'') - >> r: position!() - >> (TokenTreeBuilder::spanned_string((l1, r1), (l, r))) - ) -); + for (pipe, ws1, call, ws2) in tail { + let el = PipelineElement::new(ws1.map(Span::from), call, ws2.map(Span::from)); + out.push(el); + } -named!(pub string( NomSpan ) -> TokenNode, - alt!(sq_string | dq_string) -); - -named!(pub bare( NomSpan ) -> TokenNode, - do_parse!( - l: position!() - >> take_while1!(is_start_bare_char) - >> take_while!(is_bare_char) - >> r: position!() - >> (TokenTreeBuilder::spanned_bare((l, r))) - ) -); - -named!(pub var( NomSpan ) -> TokenNode, - do_parse!( - l: position!() - >> tag!("$") - >> bare: identifier - >> r: position!() - >> (TokenTreeBuilder::spanned_var(bare.span(), (l, r))) - ) -); - -named!(pub identifier( NomSpan ) -> TokenNode, - do_parse!( - l: position!() - >> take_while1!(is_id_start) - >> take_while!(is_id_continue) - >> r: position!() - >> (TokenTreeBuilder::spanned_ident((l, r))) - ) -); - -named!(pub flag( NomSpan ) -> TokenNode, - do_parse!( - l: position!() - >> tag!("--") - >> bare: bare - >> r: position!() - >> (TokenTreeBuilder::spanned_flag(bare.span(), (l, r))) - ) -); - -named!(pub shorthand( NomSpan ) -> TokenNode, - do_parse!( - l: position!() - >> tag!("-") - >> bare: bare - >> r: position!() - >> (TokenTreeBuilder::spanned_shorthand(bare.span(), (l, r))) - ) -); - -named!(pub raw_unit( NomSpan ) -> Spanned, - do_parse!( - l: position!() - >> unit: alt!(tag!("B") | tag!("KB") | tag!("MB") | tag!("GB") | tag!("TB") | tag!("PB")) - >> r: position!() - >> (Spanned::from_nom(Unit::from(unit.fragment.0), l, r)) - ) -); - -named!(pub size( NomSpan ) -> TokenNode, - do_parse!( - l: position!() - >> int: raw_integer - >> unit: raw_unit - >> r: position!() - >> (TokenTreeBuilder::spanned_size((*int, *unit), (l, r))) - ) -); - -named!(pub leaf( NomSpan ) -> TokenNode, - alt!(size | integer | string | operator | flag | shorthand | var | bare) -); - -named!(pub delimited_paren( NomSpan ) -> TokenNode, - do_parse!( - l: position!() - >> items: delimited!( - char!('('), - delimited!(space0, separated_list!(space1, node), space0), - char!(')') - ) - >> r: position!() - >> (TokenTreeBuilder::spanned_parens(items, (l, r))) - ) -); - -named!(pub delimited_brace( NomSpan ) -> TokenNode, - do_parse!( - l: position!() - >> items: delimited!( - char!('{'), - delimited!(space0, separated_list!(space1, node), space0), - char!('}') - ) - >> r: position!() - >> (TokenTreeBuilder::spanned_brace(items, (l, r))) - ) -); - -named!(pub raw_call( NomSpan ) -> TokenNode, - do_parse!( - l: position!() - >> head: node - >> items: opt!(preceded!(space0, separated_nonempty_list!(space1, node))) - >> r: position!() - >> (TokenTreeBuilder::spanned_call((head, items), (l, r))) - ) -); - -named!(pub path( NomSpan ) -> TokenNode, - do_parse!( - l: position!() - >> head: node1 - >> tag!(".") - >> tail: separated_list!(tag!("."), alt!(identifier | string)) - >> r: position!() - >> (TokenTreeBuilder::spanned_path((head, tail), (l, r))) - ) -); - -named!(pub node1( NomSpan ) -> TokenNode, - alt!(leaf | delimited_paren) -); - -named!(pub node( NomSpan ) -> TokenNode, - alt!(path | leaf | delimited_paren | delimited_brace) -); - -named!(pub pipeline( NomSpan ) -> TokenNode, - do_parse!( - l: position!() - >> list: separated_list!(delimited!(space0, tag!("|"), space0), raw_call) - >> r: position!() - >> (TokenTreeBuilder::spanned_pipeline(list, (l, r))) - ) -); + out +} fn int(frag: &str, neg: Option) -> i64 { let int = FromStr::from_str(frag).unwrap(); @@ -276,30 +519,29 @@ mod tests { use super::*; use crate::parser::parse2::token_tree_builder::TokenTreeBuilder as b; use crate::parser::parse2::token_tree_builder::{CurriedToken, TokenTreeBuilder}; - use nom_trace::{print_trace, reset_trace}; use pretty_assertions::assert_eq; macro_rules! assert_leaf { (parsers [ $($name:tt)* ] $input:tt -> $left:tt .. $right:tt { $kind:tt $parens:tt } ) => { $( assert_eq!( - apply($name, $input), + apply($name, stringify!($name), $input), token(RawToken::$kind $parens, $left, $right) ); )* assert_eq!( - apply(leaf, $input), + apply(leaf, "leaf", $input), token(RawToken::$kind $parens, $left, $right) ); assert_eq!( - apply(leaf, $input), + apply(leaf, "leaf", $input), token(RawToken::$kind $parens, $left, $right) ); assert_eq!( - apply(node, $input), + apply(node, "node", $input), token(RawToken::$kind $parens, $left, $right) ); }; @@ -307,7 +549,7 @@ mod tests { (parsers [ $($name:tt)* ] $input:tt -> $left:tt .. $right:tt { $kind:tt } ) => { $( assert_eq!( - apply($name, $input), + apply($name, stringify!($name), $input), token(RawToken::$kind, $left, $right) ); )* @@ -342,35 +584,32 @@ mod tests { #[test] fn test_operator() { - assert_leaf! { - parsers [ operator ] - ">" -> 0..1 { Operator(Operator::GreaterThan) } - } + assert_eq!(apply(node, "node", ">"), build_token(b::op(">"))); - assert_leaf! { - parsers [ operator ] - ">=" -> 0..2 { Operator(Operator::GreaterThanOrEqual) } - } + // assert_leaf! { + // parsers [ operator ] + // ">=" -> 0..2 { Operator(Operator::GreaterThanOrEqual) } + // } - assert_leaf! { - parsers [ operator ] - "<" -> 0..1 { Operator(Operator::LessThan) } - } + // assert_leaf! { + // parsers [ operator ] + // "<" -> 0..1 { Operator(Operator::LessThan) } + // } - assert_leaf! { - parsers [ operator ] - "<=" -> 0..2 { Operator(Operator::LessThanOrEqual) } - } + // assert_leaf! { + // parsers [ operator ] + // "<=" -> 0..2 { Operator(Operator::LessThanOrEqual) } + // } - assert_leaf! { - parsers [ operator ] - "==" -> 0..2 { Operator(Operator::Equal) } - } + // assert_leaf! { + // parsers [ operator ] + // "==" -> 0..2 { Operator(Operator::Equal) } + // } - assert_leaf! { - parsers [ operator ] - "!=" -> 0..2 { Operator(Operator::NotEqual) } - } + // assert_leaf! { + // parsers [ operator ] + // "!=" -> 0..2 { Operator(Operator::NotEqual) } + // } } #[test] @@ -411,23 +650,23 @@ mod tests { #[test] fn test_flag() { - assert_leaf! { - parsers [ flag ] - "--hello" -> 0..7 { Flag(Flag::Longhand, span(2, 7)) } - } + // assert_leaf! { + // parsers [ flag ] + // "--hello" -> 0..7 { Flag(Spanned::from_item(FlagKind::Longhand, span(2, 7))) } + // } - assert_leaf! { - parsers [ flag ] - "--hello-world" -> 0..13 { Flag(Flag::Longhand, span(2, 13)) } - } + // assert_leaf! { + // parsers [ flag ] + // "--hello-world" -> 0..13 { Flag(Spanned::from_item(FlagKind::Longhand, span(2, 13))) } + // } } #[test] fn test_shorthand() { - assert_leaf! { - parsers [ shorthand ] - "-alt" -> 0..4 { Flag(Flag::Shorthand, span(1, 4)) } - } + // assert_leaf! { + // parsers [ shorthand ] + // "-alt" -> 0..4 { Flag(Spanned::from_item(FlagKind::Shorthand, span(1, 4))) } + // } } #[test] @@ -444,17 +683,20 @@ mod tests { } #[test] - fn test_delimited() { - assert_eq!(apply(node, "(abc)"), build(b::parens(vec![b::bare("abc")]))); - + fn test_delimited_paren() { assert_eq!( - apply(node, "( abc )"), - build(b::parens(vec![b::ws(" "), b::bare("abc"), b::ws(" ")])) + apply(node, "node", "(abc)"), + build_token(b::parens(vec![b::bare("abc")])) ); assert_eq!( - apply(node, "( abc def )"), - build(b::parens(vec![ + apply(node, "node", "( abc )"), + build_token(b::parens(vec![b::ws(" "), b::bare("abc"), b::ws(" ")])) + ); + + assert_eq!( + apply(node, "node", "( abc def )"), + build_token(b::parens(vec![ b::ws(" "), b::bare("abc"), b::sp(), @@ -464,8 +706,47 @@ mod tests { ); assert_eq!( - apply(node, "( abc def 123 456GB )"), - build(b::parens(vec![ + apply(node, "node", "( abc def 123 456GB )"), + build_token(b::parens(vec![ + b::ws(" "), + b::bare("abc"), + b::sp(), + b::bare("def"), + b::sp(), + b::int(123), + b::sp(), + b::size(456, "GB"), + b::sp() + ])) + ); + } + + #[test] + fn test_delimited_square() { + assert_eq!( + apply(node, "node", "[abc]"), + build_token(b::square(vec![b::bare("abc")])) + ); + + assert_eq!( + apply(node, "node", "[ abc ]"), + build_token(b::square(vec![b::ws(" "), b::bare("abc"), b::ws(" ")])) + ); + + assert_eq!( + apply(node, "node", "[ abc def ]"), + build_token(b::square(vec![ + b::ws(" "), + b::bare("abc"), + b::sp(), + b::bare("def"), + b::sp() + ])) + ); + + assert_eq!( + apply(node, "node", "[ abc def 123 456GB ]"), + build_token(b::square(vec![ b::ws(" "), b::bare("abc"), b::sp(), @@ -481,30 +762,31 @@ mod tests { #[test] fn test_path() { + let _ = pretty_env_logger::try_init(); assert_eq!( - apply(node, "$it.print"), - build(b::path(b::var("it"), vec![b::ident("print")])) + apply(node, "node", "$it.print"), + build_token(b::path(b::var("it"), vec![b::ident("print")])) ); assert_eq!( - apply(node, "$head.part1.part2"), - build(b::path( + apply(node, "node", "$head.part1.part2"), + build_token(b::path( b::var("head"), vec![b::ident("part1"), b::ident("part2")] )) ); assert_eq!( - apply(node, "( hello ).world"), - build(b::path( + apply(node, "node", "( hello ).world"), + build_token(b::path( b::parens(vec![b::sp(), b::bare("hello"), b::sp()]), vec![b::ident("world")] )) ); assert_eq!( - apply(node, "( hello ).\"world\""), - build(b::path( + apply(node, "node", "( hello ).\"world\""), + build_token(b::path( b::parens(vec![b::sp(), b::bare("hello"), b::sp()],), vec![b::string("world")] )) @@ -514,8 +796,12 @@ mod tests { #[test] fn test_nested_path() { assert_eq!( - apply(node, "( $it.is.\"great news\".right yep $yep ).\"world\""), - build(b::path( + apply( + node, + "node", + "( $it.is.\"great news\".right yep $yep ).\"world\"" + ), + build_token(b::path( b::parens(vec![ b::sp(), b::path( @@ -536,7 +822,7 @@ mod tests { #[test] fn test_smoke_single_command() { assert_eq!( - apply(raw_call, "git add ."), + apply(raw_call, "raw_call", "git add ."), build(b::call( b::bare("git"), vec![b::sp(), b::bare("add"), b::sp(), b::bare(".")] @@ -544,7 +830,7 @@ mod tests { ); assert_eq!( - apply(raw_call, "open Cargo.toml"), + apply(raw_call, "raw_call", "open Cargo.toml"), build(b::call( b::bare("open"), vec![b::sp(), b::bare("Cargo.toml")] @@ -552,7 +838,7 @@ mod tests { ); assert_eq!( - apply(raw_call, "select package.version"), + apply(raw_call, "raw_call", "select package.version"), build(b::call( b::bare("select"), vec![b::sp(), b::bare("package.version")] @@ -560,12 +846,12 @@ mod tests { ); assert_eq!( - apply(raw_call, "echo $it"), + apply(raw_call, "raw_call", "echo $it"), build(b::call(b::bare("echo"), vec![b::sp(), b::var("it")])) ); assert_eq!( - apply(raw_call, "open Cargo.toml --raw"), + apply(raw_call, "raw_call", "open Cargo.toml --raw"), build(b::call( b::bare("open"), vec![b::sp(), b::bare("Cargo.toml"), b::sp(), b::flag("raw")] @@ -573,7 +859,7 @@ mod tests { ); assert_eq!( - apply(raw_call, "open Cargo.toml -r"), + apply(raw_call, "raw_call", "open Cargo.toml -r"), build(b::call( b::bare("open"), vec![b::sp(), b::bare("Cargo.toml"), b::sp(), b::shorthand("r")] @@ -581,7 +867,7 @@ mod tests { ); assert_eq!( - apply(raw_call, "config --set tabs 2"), + apply(raw_call, "raw_call", "config --set tabs 2"), build(b::call( b::bare("config"), vec![ @@ -598,57 +884,81 @@ mod tests { #[test] fn test_smoke_pipeline() { + let _ = pretty_env_logger::try_init(); + assert_eq!( apply( pipeline, + "pipeline", r#"git branch --merged | split-row "`n" | where $it != "* master""# ), - build(b::pipeline(vec![ - b::call( - b::bare("git"), - vec![b::sp(), b::bare("branch"), b::sp(), b::flag("merged")] + build_token(b::pipeline(vec![ + ( + None, + b::call( + b::bare("git"), + vec![b::sp(), b::bare("branch"), b::sp(), b::flag("merged")] + ), + Some(" ") ), - b::call(b::bare("split-row"), vec![b::sp(), b::string("`n")]), - b::call( - b::bare("where"), - vec![ - b::sp(), - b::var("it"), - b::sp(), - b::op("!="), - b::sp(), - b::string("* master") - ] + ( + Some(" "), + b::call(b::bare("split-row"), vec![b::sp(), b::string("`n")]), + Some(" ") + ), + ( + Some(" "), + b::call( + b::bare("where"), + vec![ + b::sp(), + b::var("it"), + b::sp(), + b::op("!="), + b::sp(), + b::string("* master") + ] + ), + None ) ])) ); assert_eq!( - apply(pipeline, "ls | where { $it.size > 100 }"), - build(b::pipeline(vec![ - b::call(b::bare("ls"), vec![]), - b::call( - b::bare("where"), - vec![ - b::sp(), - b::braced(vec![ - b::path(b::var("it"), vec![b::ident("size")]), + apply(pipeline, "pipeline", "ls | where { $it.size > 100 }"), + build_token(b::pipeline(vec![ + (None, b::call(b::bare("ls"), vec![]), Some(" ")), + ( + Some(" "), + b::call( + b::bare("where"), + vec![ b::sp(), - b::op(">"), - b::sp(), - b::int(100) - ]) - ] + b::braced(vec![ + b::path(b::var("it"), vec![b::ident("size")]), + b::sp(), + b::op(">"), + b::sp(), + b::int(100) + ]) + ] + ), + None ) ])) ) } - fn apply(f: impl Fn(NomSpan) -> Result<(NomSpan, T), nom::Err>, string: &str) -> T { - match f(NomSpan::new(CompleteStr(string))) { + fn apply( + f: impl Fn(NomSpan) -> Result<(NomSpan, T), nom::Err<(NomSpan, nom::error::ErrorKind)>>, + desc: &str, + string: &str, + ) -> T { + match f(NomSpan::new(string)) { Ok(v) => v.1, Err(other) => { println!("{:?}", other); + println!("for {} @ {}", string, desc); panic!("No dice"); } } @@ -686,8 +996,13 @@ mod tests { TokenNode::Token(Spanned::from_item(token, (left, right))) } - fn build(block: CurriedToken) -> TokenNode { + fn build(block: CurriedNode) -> T { let mut builder = TokenTreeBuilder::new(); - block(&mut builder).expect("Expected to build into a token") + block(&mut builder) + } + + fn build_token(block: CurriedToken) -> TokenNode { + let mut builder = TokenTreeBuilder::new(); + block(&mut builder) } } diff --git a/src/parser/parse2/span.rs b/src/parser/parse2/span.rs index 2d3cbe7b5e..4214d29aaa 100644 --- a/src/parser/parse2/span.rs +++ b/src/parser/parse2/span.rs @@ -1,7 +1,8 @@ use derive_new::new; -use std::ops::Range; +use getset::Getters; -#[derive(new, Debug, Clone, Copy, Eq, PartialEq, Ord, PartialOrd, Hash)] +#[derive(new, Debug, Clone, Copy, Eq, PartialEq, Ord, PartialOrd, Hash, Getters)] +#[get = "crate"] pub struct Spanned { crate span: Span, crate item: T, @@ -16,20 +17,6 @@ impl std::ops::Deref for Spanned { } impl Spanned { - crate fn from_nom( - item: T, - start: nom_locate::LocatedSpan, - end: nom_locate::LocatedSpan, - ) -> Spanned { - let start = start.offset; - let end = end.offset; - - Spanned { - span: Span::from((start, end)), - item, - } - } - crate fn from_item(item: T, span: impl Into) -> Spanned { Spanned { span: span.into(), @@ -43,6 +30,19 @@ impl Spanned { let mapped = input(item); Spanned { span, item: mapped } } + + crate fn copy_span(&self, output: U) -> Spanned { + let Spanned { span, item } = self; + + Spanned { + span: *span, + item: output, + } + } + + pub fn source(&self, source: &'source str) -> &'source str { + self.span().slice(source) + } } #[derive(Debug, Clone, Copy, PartialEq, Eq, Ord, PartialOrd, Hash)] @@ -52,6 +52,21 @@ pub struct Span { // source: &'source str, } +impl From<&Span> for Span { + fn from(input: &Span) -> Span { + *input + } +} + +impl From> for Span { + fn from(input: nom_locate::LocatedSpan<&str>) -> Span { + Span { + start: input.offset, + end: input.offset + input.fragment.len(), + } + } +} + impl From<(nom_locate::LocatedSpan, nom_locate::LocatedSpan)> for Span { fn from(input: (nom_locate::LocatedSpan, nom_locate::LocatedSpan)) -> Span { Span { @@ -80,12 +95,8 @@ impl From<&std::ops::Range> for Span { } impl Span { - fn new(range: &Range) -> Span { - Span { - start: range.start, - end: range.end, - // source, - } + pub fn slice(&self, source: &'source str) -> &'source str { + &source[self.start..self.end] } } diff --git a/src/parser/parse2/text.rs b/src/parser/parse2/text.rs new file mode 100644 index 0000000000..7246392283 --- /dev/null +++ b/src/parser/parse2/text.rs @@ -0,0 +1,204 @@ +use std::cmp::Ordering; +use std::hash::Hash; +use std::hash::Hasher; +use std::ops::Range; +use std::sync::Arc; + +/// A "Text" is like a string except that it can be cheaply cloned. +/// You can also "extract" subtexts quite cheaply. You can also deref +/// an `&Text` into a `&str` for interoperability. +/// +/// Used to represent the value of an input file. +#[derive(Clone)] +pub struct Text { + text: Arc, + start: usize, + end: usize, +} + +impl Text { + /// Modifies this restrict to a subset of its current range. + pub fn select(&mut self, range: Range) { + let len = range.end - range.start; + let new_start = self.start + range.start; + let new_end = new_start + len; + assert!(new_end <= self.end); + + self.start = new_start; + self.end = new_end; + } + + /// Extract a new `Text` that is a subset of an old `Text` + /// -- `text.extract(1..3)` is similar to `&foo[1..3]` except that + /// it gives back an owned value instead of a borrowed value. + pub fn extract(&self, range: Range) -> Self { + let mut result = self.clone(); + result.select(range); + result + } +} + +impl From> for Text { + fn from(text: Arc) -> Self { + let end = text.len(); + Self { + text, + start: 0, + end, + } + } +} + +impl AsRef for Text { + fn as_ref(&self) -> &str { + &*self + } +} + +impl From for Text { + fn from(text: String) -> Self { + Text::from(Arc::new(text)) + } +} + +impl From<&String> for Text { + fn from(text: &String) -> Self { + Text::from(text.to_string()) + } +} + +impl From<&str> for Text { + fn from(text: &str) -> Self { + Text::from(text.to_string()) + } +} + +impl std::borrow::Borrow for Text { + fn borrow(&self) -> &str { + &*self + } +} + +impl std::ops::Deref for Text { + type Target = str; + + fn deref(&self) -> &str { + &self.text[self.start..self.end] + } +} + +impl std::fmt::Display for Text { + fn fmt(&self, fmt: &mut std::fmt::Formatter<'_>) -> std::fmt::Result { + ::fmt(self, fmt) + } +} + +impl std::fmt::Debug for Text { + fn fmt(&self, fmt: &mut std::fmt::Formatter<'_>) -> std::fmt::Result { + ::fmt(self, fmt) + } +} + +impl PartialEq for Text { + fn eq(&self, other: &Text) -> bool { + let this: &str = self; + let other: &str = other; + this == other + } +} + +impl Eq for Text {} + +impl PartialEq for Text { + fn eq(&self, other: &str) -> bool { + let this: &str = self; + this == other + } +} + +impl PartialEq for Text { + fn eq(&self, other: &String) -> bool { + let this: &str = self; + let other: &str = other; + this == other + } +} + +impl PartialEq for str { + fn eq(&self, other: &Text) -> bool { + other == self + } +} + +impl PartialEq for String { + fn eq(&self, other: &Text) -> bool { + other == self + } +} + +impl PartialEq<&T> for Text +where + Text: PartialEq, +{ + fn eq(&self, other: &&T) -> bool { + self == *other + } +} + +impl Hash for Text { + fn hash(&self, state: &mut H) { + ::hash(self, state) + } +} + +impl PartialOrd for Text { + fn partial_cmp(&self, other: &Text) -> Option { + let this: &str = self; + let other: &str = other; + this.partial_cmp(other) + } +} + +impl Ord for Text { + fn cmp(&self, other: &Text) -> Ordering { + let this: &str = self; + let other: &str = other; + this.cmp(other) + } +} + +impl PartialOrd for Text { + fn partial_cmp(&self, other: &str) -> Option { + let this: &str = self; + this.partial_cmp(other) + } +} + +impl PartialOrd for Text { + fn partial_cmp(&self, other: &String) -> Option { + let this: &str = self; + let other: &str = other; + this.partial_cmp(other) + } +} + +impl PartialOrd for str { + fn partial_cmp(&self, other: &Text) -> Option { + other.partial_cmp(self) + } +} + +impl PartialOrd for String { + fn partial_cmp(&self, other: &Text) -> Option { + other.partial_cmp(self) + } +} + +impl PartialOrd<&T> for Text +where + Text: PartialOrd, +{ + fn partial_cmp(&self, other: &&T) -> Option { + self.partial_cmp(*other) + } +} diff --git a/src/parser/parse2/token_tree.rs b/src/parser/parse2/token_tree.rs index b3cd722016..9718e9def5 100644 --- a/src/parser/parse2/token_tree.rs +++ b/src/parser/parse2/token_tree.rs @@ -1,14 +1,22 @@ -use crate::parser::parse2::{operator::*, span::*, tokens::*}; +use crate::errors::ShellError; +use crate::parser::parse2::{call_node::*, flag::*, operator::*, span::*, tokens::*}; use derive_new::new; use enum_utils::FromStr; +use getset::Getters; #[derive(Debug, Clone, Eq, PartialEq, Ord, PartialOrd)] pub enum TokenNode { Token(Token), + #[allow(unused)] Call(Spanned), Delimited(Spanned), - Pipeline(Spanned>), - Binary(Spanned), + Pipeline(Spanned>), + Operator(Spanned), + Flag(Spanned), + Identifier(Span), + Whitespace(Span), + #[allow(unused)] + Error(Spanned>), Path(Spanned), } @@ -19,10 +27,71 @@ impl TokenNode { TokenNode::Call(s) => s.span, TokenNode::Delimited(s) => s.span, TokenNode::Pipeline(s) => s.span, - TokenNode::Binary(s) => s.span, + TokenNode::Operator(s) => s.span, + TokenNode::Flag(s) => s.span, + TokenNode::Identifier(s) => *s, + TokenNode::Whitespace(s) => *s, + TokenNode::Error(s) => s.span, TokenNode::Path(s) => s.span, } } + + pub fn as_external_arg(&self, source: &str) -> String { + self.span().slice(source).to_string() + } + + pub fn source(&self, source: &'source str) -> &'source str { + self.span().slice(source) + } + + pub fn is_ws(&self) -> bool { + match self { + TokenNode::Whitespace(_) => true, + _ => false, + } + } + + pub fn is_bare(&self) -> bool { + match self { + TokenNode::Token(Spanned { + item: RawToken::Bare, + .. + }) => true, + _ => false, + } + } + + crate fn as_string(&self, source: &str) -> Option> { + match self { + TokenNode::Token(Spanned { + item: RawToken::Bare, + span, + }) => Some(Spanned::from_item(span.slice(source).to_string(), span)), + TokenNode::Token(Spanned { + item: RawToken::String(inner), + span, + }) => Some(Spanned::from_item(inner.slice(source).to_string(), span)), + _ => None, + } + } + + crate fn as_flag(&self, value: &str, source: &str) -> Option> { + match self { + TokenNode::Flag( + flag @ Spanned { + item: Flag { .. }, .. + }, + ) if value == flag.name().slice(source) => Some(*flag), + _ => None, + } + } + + pub fn as_pipeline(&self) -> Result, ShellError> { + match self { + TokenNode::Pipeline(Spanned { item, .. }) => Ok(item.clone()), + _ => Err(ShellError::string("unimplemented")), + } + } } #[derive(Debug, Clone, Eq, PartialEq, Ord, PartialOrd, new)] @@ -31,12 +100,6 @@ pub struct DelimitedNode { children: Vec, } -#[derive(Debug, Clone, Eq, PartialEq, Ord, PartialOrd, new)] -pub struct CallNode { - head: Box, - children: Vec, -} - #[derive(Debug, Copy, Clone, Eq, PartialEq, Ord, PartialOrd, FromStr)] pub enum Delimiter { Paren, @@ -50,9 +113,26 @@ pub struct PathNode { tail: Vec, } -#[derive(Debug, Clone, Eq, PartialEq, Ord, PartialOrd, new)] -pub struct BinaryNode { - left: Box, - op: Operator, - right: Box, +#[derive(Debug, Clone, Eq, PartialEq, Ord, PartialOrd, Getters, new)] +pub struct PipelineElement { + pre_ws: Option, + #[get = "crate"] + call: Spanned, + post_ws: Option, +} + +impl PipelineElement { + crate fn span(&self) -> Span { + let start = match self.pre_ws { + None => self.call.span.start, + Some(span) => span.start, + }; + + let end = match self.post_ws { + None => self.call.span.end, + Some(span) => span.end, + }; + + Span::from((start, end)) + } } diff --git a/src/parser/parse2/token_tree_builder.rs b/src/parser/parse2/token_tree_builder.rs index a3fffaa8d7..08740d7b32 100644 --- a/src/parser/parse2/token_tree_builder.rs +++ b/src/parser/parse2/token_tree_builder.rs @@ -1,11 +1,15 @@ -use crate::parser::parse2::flag::Flag; +#[allow(unused)] +use crate::prelude::*; + +use crate::parser::parse2::flag::{Flag, FlagKind}; use crate::parser::parse2::operator::Operator; use crate::parser::parse2::span::{Span, Spanned}; use crate::parser::parse2::token_tree::{ - BinaryNode, CallNode, DelimitedNode, Delimiter, PathNode, TokenNode, + DelimitedNode, Delimiter, PathNode, PipelineElement, TokenNode, }; use crate::parser::parse2::tokens::{RawToken, Token}; use crate::parser::parse2::unit::Unit; +use crate::parser::CallNode; use derive_new::new; #[derive(new)] @@ -14,7 +18,10 @@ pub struct TokenTreeBuilder { pos: usize, } -pub type CurriedToken = Box Option + 'static>; +#[allow(unused)] +pub type CurriedNode = Box T + 'static>; +pub type CurriedToken = Box TokenNode + 'static>; +pub type CurriedCall = Box Spanned + 'static>; #[allow(unused)] impl TokenTreeBuilder { @@ -23,35 +30,57 @@ impl TokenTreeBuilder { block(&mut builder) } - pub fn pipeline(input: Vec) -> CurriedToken { + pub fn pipeline(input: Vec<(Option<&str>, CurriedCall, Option<&str>)>) -> CurriedToken { + let input: Vec<(Option, CurriedCall, Option)> = input + .into_iter() + .map(|(pre, call, post)| { + ( + pre.map(|s| s.to_string()), + call, + post.map(|s| s.to_string()), + ) + }) + .collect(); + Box::new(move |b| { let start = b.pos; - let mut out = vec![]; + let mut out: Vec = vec![]; let mut input = input.into_iter(); - let first = input + let (pre, call, post) = input .next() .expect("A pipeline must contain at least one element"); - out.push(first(b).expect("The first element of a pipeline must not be whitespace")); + let pre_span = pre.map(|pre| b.consume(&pre)); + let call = call(b); + let post_span = post.map(|post| b.consume(&post)); + out.push(PipelineElement::new( + pre_span.map(Span::from), + call, + post_span.map(Span::from), + )); - for item in input { - b.consume(" | "); + for (pre, call, post) in input { + b.consume("|"); + let pre_span = pre.map(|pre| b.consume(&pre)); + let call = call(b); + let post_span = post.map(|post| b.consume(&post)); - match item(b) { - None => {} - Some(v) => out.push(v), - } + out.push(PipelineElement::new( + pre_span.map(Span::from), + call, + post_span.map(Span::from), + )); } let end = b.pos; - Some(TokenTreeBuilder::spanned_pipeline(out, (start, end))) + TokenTreeBuilder::spanned_pipeline(out, (start, end)) }) } - pub fn spanned_pipeline(input: Vec, span: impl Into) -> TokenNode { + pub fn spanned_pipeline(input: Vec, span: impl Into) -> TokenNode { TokenNode::Pipeline(Spanned::from_item(input, span)) } @@ -63,15 +92,12 @@ impl TokenTreeBuilder { b.pos = end; - Some(TokenTreeBuilder::spanned_op(input, (start, end))) + TokenTreeBuilder::spanned_op(input, (start, end)) }) } pub fn spanned_op(input: impl Into, span: impl Into) -> TokenNode { - TokenNode::Token(Spanned::from_item( - RawToken::Operator(input.into()), - span.into(), - )) + TokenNode::Operator(Spanned::from_item(input.into(), span.into())) } pub fn string(input: impl Into) -> CurriedToken { @@ -83,10 +109,7 @@ impl TokenTreeBuilder { let (_, end) = b.consume("\""); b.pos = end; - Some(TokenTreeBuilder::spanned_string( - (inner_start, inner_end), - (start, end), - )) + TokenTreeBuilder::spanned_string((inner_start, inner_end), (start, end)) }) } @@ -104,7 +127,7 @@ impl TokenTreeBuilder { let (start, end) = b.consume(&input); b.pos = end; - Some(TokenTreeBuilder::spanned_bare((start, end))) + TokenTreeBuilder::spanned_bare((start, end)) }) } @@ -119,7 +142,7 @@ impl TokenTreeBuilder { let (start, end) = b.consume(&int.to_string()); b.pos = end; - Some(TokenTreeBuilder::spanned_int(int, (start, end))) + TokenTreeBuilder::spanned_int(int, (start, end)) }) } @@ -136,7 +159,7 @@ impl TokenTreeBuilder { let (_, end) = b.consume(unit.as_str()); b.pos = end; - Some(TokenTreeBuilder::spanned_size((int, unit), (start, end))) + TokenTreeBuilder::spanned_size((int, unit), (start, end)) }) } @@ -152,22 +175,19 @@ impl TokenTreeBuilder { pub fn path(head: CurriedToken, tail: Vec) -> CurriedToken { Box::new(move |b| { let start = b.pos; - let head = head(b).expect("The head of a path must not be whitespace"); + let head = head(b); let mut output = vec![]; for item in tail { b.consume("."); - match item(b) { - None => {} - Some(v) => output.push(v), - }; + output.push(item(b)); } let end = b.pos; - Some(TokenTreeBuilder::spanned_path((head, output), (start, end))) + TokenTreeBuilder::spanned_path((head, output), (start, end)) }) } @@ -185,10 +205,7 @@ impl TokenTreeBuilder { let (start, _) = b.consume("$"); let (inner_start, end) = b.consume(&input); - Some(TokenTreeBuilder::spanned_var( - (inner_start, end), - (start, end), - )) + TokenTreeBuilder::spanned_var((inner_start, end), (start, end)) }) } @@ -206,16 +223,13 @@ impl TokenTreeBuilder { let (start, _) = b.consume("--"); let (inner_start, end) = b.consume(&input); - Some(TokenTreeBuilder::spanned_flag( - (inner_start, end), - (start, end), - )) + TokenTreeBuilder::spanned_flag((inner_start, end), (start, end)) }) } pub fn spanned_flag(input: impl Into, span: impl Into) -> TokenNode { - TokenNode::Token(Spanned::from_item( - RawToken::Flag(Flag::Longhand, input.into()), + TokenNode::Flag(Spanned::from_item( + Flag::new(FlagKind::Longhand, input.into()), span.into(), )) } @@ -227,16 +241,13 @@ impl TokenTreeBuilder { let (start, _) = b.consume("-"); let (inner_start, end) = b.consume(&input); - Some(TokenTreeBuilder::spanned_shorthand( - (inner_start, end), - (start, end), - )) + TokenTreeBuilder::spanned_shorthand((inner_start, end), (start, end)) }) } pub fn spanned_shorthand(input: impl Into, span: impl Into) -> TokenNode { - TokenNode::Token(Spanned::from_item( - RawToken::Flag(Flag::Shorthand, input.into()), + TokenNode::Flag(Spanned::from_item( + Flag::new(FlagKind::Shorthand, input.into()), span.into(), )) } @@ -246,45 +257,42 @@ impl TokenTreeBuilder { Box::new(move |b| { let (start, end) = b.consume(&input); - Some(TokenTreeBuilder::spanned_ident((start, end))) + TokenTreeBuilder::spanned_ident((start, end)) }) } pub fn spanned_ident(span: impl Into) -> TokenNode { - TokenNode::Token(Spanned::from_item(RawToken::Identifier, span.into())) + TokenNode::Identifier(span.into()) } - pub fn call(head: CurriedToken, input: Vec) -> CurriedToken { + pub fn call(head: CurriedToken, input: Vec) -> CurriedCall { Box::new(move |b| { let start = b.pos; - let head_node = head(b).expect("The head of a command must not be whitespace"); + let head_node = head(b); - let mut tail_nodes = vec![]; + let mut nodes = vec![head_node]; for item in input { - match item(b) { - None => {} - Some(v) => tail_nodes.push(v), - }; + nodes.push(item(b)); } let end = b.pos; - Some(TokenTreeBuilder::spanned_call( - (head_node, Some(tail_nodes)), - (start, end), - )) + TokenTreeBuilder::spanned_call(nodes, (start, end)) }) } - pub fn spanned_call( - input: (TokenNode, Option>), - span: impl Into, - ) -> TokenNode { - TokenNode::Call(Spanned::from_item( - CallNode::new(Box::new(input.0), input.1.unwrap_or_else(|| vec![])), - span, - )) + pub fn spanned_call(input: Vec, span: impl Into) -> Spanned { + if input.len() == 0 { + panic!("BUG: spanned call (TODO)") + } + + let mut input = input.into_iter(); + + let head = input.next().unwrap(); + let tail = input.collect(); + + Spanned::from_item(CallNode::new(Box::new(head), tail), span) } pub fn parens(input: Vec) -> CurriedToken { @@ -292,15 +300,12 @@ impl TokenTreeBuilder { let (start, _) = b.consume("("); let mut output = vec![]; for item in input { - match item(b) { - None => {} - Some(v) => output.push(v), - }; + output.push(item(b)); } let (_, end) = b.consume(")"); - Some(TokenTreeBuilder::spanned_parens(output, (start, end))) + TokenTreeBuilder::spanned_parens(output, (start, end)) }) } @@ -311,20 +316,38 @@ impl TokenTreeBuilder { )) } + pub fn square(input: Vec) -> CurriedToken { + Box::new(move |b| { + let (start, _) = b.consume("["); + let mut output = vec![]; + for item in input { + output.push(item(b)); + } + + let (_, end) = b.consume("]"); + + TokenTreeBuilder::spanned_square(output, (start, end)) + }) + } + + pub fn spanned_square(input: impl Into>, span: impl Into) -> TokenNode { + TokenNode::Delimited(Spanned::from_item( + DelimitedNode::new(Delimiter::Square, input.into()), + span, + )) + } + pub fn braced(input: Vec) -> CurriedToken { Box::new(move |b| { let (start, _) = b.consume("{ "); let mut output = vec![]; for item in input { - match item(b) { - None => {} - Some(v) => output.push(v), - }; + output.push(item(b)); } let (_, end) = b.consume(" }"); - Some(TokenTreeBuilder::spanned_brace(output, (start, end))) + TokenTreeBuilder::spanned_brace(output, (start, end)) }) } @@ -335,50 +358,10 @@ impl TokenTreeBuilder { )) } - pub fn binary( - left: CurriedToken, - op: impl Into, - right: CurriedToken, - ) -> CurriedToken { - let op = op.into(); - - Box::new(move |b| { - let start = b.pos; - - let left = left(b).expect("The left side of a binary operation must not be whitespace"); - - b.consume(" "); - - b.consume(op.as_str()); - - b.consume(" "); - - let right = - right(b).expect("The right side of a binary operation must not be whitespace"); - - let end = b.pos; - - Some(TokenTreeBuilder::spanned_binary( - (left, op, right), - (start, end), - )) - }) - } - - pub fn spanned_binary( - input: (impl Into, Operator, impl Into), - span: impl Into, - ) -> TokenNode { - TokenNode::Binary(Spanned::from_item( - BinaryNode::new(Box::new(input.0.into()), input.1, Box::new(input.2.into())), - span, - )) - } - pub fn sp() -> CurriedToken { Box::new(|b| { - b.consume(" "); - None + let (start, end) = b.consume(" "); + TokenNode::Whitespace(Span::from((start, end))) }) } @@ -386,11 +369,17 @@ impl TokenTreeBuilder { let input = input.into(); Box::new(move |b| { - b.consume(&input); - None + let (start, end) = b.consume(&input); + TokenTreeBuilder::spanned_ws((start, end)) }) } + pub fn spanned_ws(span: impl Into) -> TokenNode { + let span = span.into(); + + TokenNode::Whitespace(span.into()) + } + fn consume(&mut self, input: &str) -> (usize, usize) { let start = self.pos; self.pos += input.len(); diff --git a/src/parser/parse2/tokens.rs b/src/parser/parse2/tokens.rs index d1977498ce..4e8fdcf5b1 100644 --- a/src/parser/parse2/tokens.rs +++ b/src/parser/parse2/tokens.rs @@ -1,5 +1,3 @@ -use crate::parser::parse2::flag::*; -use crate::parser::parse2::operator::*; use crate::parser::parse2::span::*; use crate::parser::parse2::unit::*; @@ -7,12 +5,34 @@ use crate::parser::parse2::unit::*; pub enum RawToken { Integer(i64), Size(i64, Unit), - Operator(Operator), String(Span), Variable(Span), - Identifier, Bare, - Flag(Flag, Span), } pub type Token = Spanned; + +impl Token { + pub fn to_semantic_token(&self) -> Option { + let semantic_token = match self.item { + RawToken::Integer(int) => RawSemanticToken::Integer(int), + RawToken::Size(int, unit) => RawSemanticToken::Size(int, unit), + RawToken::String(span) => RawSemanticToken::String(span), + RawToken::Variable(span) => RawSemanticToken::Variable(span), + RawToken::Bare => RawSemanticToken::Bare, + }; + + Some(Spanned::from_item(semantic_token, self.span)) + } +} + +#[derive(Debug, Clone, Copy, Eq, PartialEq, Ord, PartialOrd, Hash)] +pub enum RawSemanticToken { + Integer(i64), + Size(i64, Unit), + String(Span), + Variable(Span), + Bare, +} + +pub type SemanticToken = Spanned; diff --git a/src/parser/parse2/unit.rs b/src/parser/parse2/unit.rs index 883f4c5071..7e51103cfc 100644 --- a/src/parser/parse2/unit.rs +++ b/src/parser/parse2/unit.rs @@ -12,10 +12,6 @@ pub enum Unit { } impl Unit { - pub fn print(&self) -> String { - self.as_str().to_string() - } - pub fn as_str(&self) -> &str { match *self { Unit::B => "B", diff --git a/src/parser/parse_command.rs b/src/parser/parse_command.rs new file mode 100644 index 0000000000..d3064cbae0 --- /dev/null +++ b/src/parser/parse_command.rs @@ -0,0 +1,250 @@ +use crate::errors::ShellError; +use crate::parser::registry::{CommandConfig, CommandRegistry, NamedType}; +use crate::parser::{baseline_parse_tokens, CallNode, Spanned}; +use crate::parser::{ + hir::{self, NamedArguments}, + Flag, RawToken, TokenNode, +}; +use log::trace; + +pub fn parse_command( + config: &CommandConfig, + registry: &dyn CommandRegistry, + call: &Spanned, + source: &str, +) -> Result { + let Spanned { item: call, .. } = call; + + trace!("Processing {:?}", config); + + let head = parse_command_head(call.head())?; + + let children: Option> = call.children().as_ref().map(|nodes| { + nodes + .iter() + .cloned() + .filter(|node| match node { + TokenNode::Whitespace(_) => false, + _ => true, + }) + .collect() + }); + + match parse_command_tail(&config, registry, children, source)? { + None => Ok(hir::Call::new(Box::new(head), None, None)), + Some((positional, named)) => Ok(hir::Call::new(Box::new(head), positional, named)), + } +} + +fn parse_command_head(head: &TokenNode) -> Result { + match head { + TokenNode::Token( + spanned @ Spanned { + item: RawToken::Bare, + .. + }, + ) => Ok(spanned.map(|_| hir::RawExpression::Literal(hir::Literal::Bare))), + + TokenNode::Token(Spanned { + item: RawToken::String(inner_span), + span, + }) => Ok(Spanned::from_item( + hir::RawExpression::Literal(hir::Literal::String(*inner_span)), + *span, + )), + + other => Err(ShellError::unexpected(&format!( + "command head -> {:?}", + other + ))), + } +} + +fn parse_command_tail( + config: &CommandConfig, + registry: &dyn CommandRegistry, + tail: Option>, + source: &str, +) -> Result>, Option)>, ShellError> { + let mut tail = match tail { + None => return Ok(None), + Some(tail) => tail, + }; + + let mut named = NamedArguments::new(); + + for (name, kind) in config.named() { + trace!("looking for {} : {:?}", name, kind); + + match kind { + NamedType::Switch => { + let (rest, flag) = extract_switch(name, tail, source); + + tail = rest; + + named.insert_switch(name, flag); + } + NamedType::Mandatory(kind) => match extract_mandatory(name, tail, source) { + Err(err) => return Err(err), // produce a correct diagnostic + Ok((rest, pos, _flag)) => { + let (expr, rest) = hir::baseline_parse_next_expr( + &rest[pos..], + registry, + source, + kind.to_coerce_hint(), + )?; + tail = rest.to_vec(); + + named.insert_mandatory(name, expr); + } + }, + NamedType::Optional(kind) => match extract_optional(name, tail, source) { + Err(err) => return Err(err), // produce a correct diagnostic + Ok((rest, Some((pos, _flag)))) => { + let (expr, rest) = hir::baseline_parse_next_expr( + &rest[pos..], + registry, + source, + kind.to_coerce_hint(), + )?; + tail = rest.to_vec(); + + named.insert_optional(name, Some(expr)); + } + + Ok((rest, None)) => { + tail = rest; + + named.insert_optional(name, None); + } + }, + }; + } + + let mut positional = vec![]; + let mandatory = config.mandatory_positional(); + + for arg in mandatory { + if tail.len() == 0 { + return Err(ShellError::unimplemented("Missing mandatory argument")); + } + + let (result, rest) = + hir::baseline_parse_next_expr(&tail, registry, source, arg.to_coerce_hint())?; + + positional.push(result); + + tail = rest.to_vec(); + } + + let optional = config.optional_positional(); + + for arg in optional { + if tail.len() == 0 { + break; + } + + let (result, rest) = + hir::baseline_parse_next_expr(&tail, registry, source, arg.to_coerce_hint())?; + + positional.push(result); + + tail = rest.to_vec(); + } + + // TODO: Only do this if rest params are specified + let remainder = baseline_parse_tokens(&tail, registry, source)?; + positional.extend(remainder); + + trace!("Constructed positional={:?} named={:?}", positional, named); + + let positional = match positional { + positional if positional.len() == 0 => None, + positional => Some(positional), + }; + + let named = match named { + named if named.named.is_empty() => None, + named => Some(named), + }; + + trace!("Normalized positional={:?} named={:?}", positional, named); + + Ok(Some((positional, named))) +} + +fn extract_switch( + name: &str, + mut tokens: Vec, + source: &str, +) -> (Vec, Option) { + let pos = tokens + .iter() + .enumerate() + .filter_map(|(i, t)| t.as_flag(name, source).map(|f| (i, f))) + .nth(0); + + match pos { + None => (tokens, None), + Some((pos, flag)) => { + tokens.remove(pos); + (tokens, Some(*flag)) + } + } +} + +fn extract_mandatory( + name: &str, + mut tokens: Vec, + source: &str, +) -> Result<(Vec, usize, Flag), ShellError> { + let pos = tokens + .iter() + .enumerate() + .filter_map(|(i, t)| t.as_flag(name, source).map(|f| (i, f))) + .nth(0); + + match pos { + None => Err(ShellError::unimplemented( + "Better error: mandatory flags must be present", + )), + Some((pos, flag)) => { + if tokens.len() <= pos { + return Err(ShellError::unimplemented( + "Better errors: mandatory flags must be followed by values", + )); + } + + tokens.remove(pos); + + Ok((tokens, pos, *flag)) + } + } +} + +fn extract_optional( + name: &str, + mut tokens: Vec, + source: &str, +) -> Result<(Vec, Option<(usize, Flag)>), ShellError> { + let pos = tokens + .iter() + .enumerate() + .filter_map(|(i, t)| t.as_flag(name, source).map(|f| (i, f))) + .nth(0); + + match pos { + None => Ok((tokens, None)), + Some((pos, flag)) => { + if tokens.len() <= pos { + return Err(ShellError::unimplemented( + "Better errors: optional flags must be followed by values", + )); + } + + tokens.remove(pos); + + Ok((tokens, Some((pos, *flag)))) + } + } +} diff --git a/src/parser/registry.rs b/src/parser/registry.rs index a1adc63b9c..d50c67aa43 100644 --- a/src/parser/registry.rs +++ b/src/parser/registry.rs @@ -1,7 +1,11 @@ -use crate::evaluate::{evaluate_expr, Scope}; -use crate::parser::lexer::Spanned; +use crate::evaluate::{evaluate_baseline_expr, Scope}; +use crate::parser::{hir, hir::ExpressionKindHint, parse_command, CallNode, Spanned}; use crate::prelude::*; +use derive_new::new; +use getset::Getters; use indexmap::IndexMap; +use log::trace; +use std::fmt; #[allow(unused)] #[derive(Debug)] @@ -14,13 +18,18 @@ pub enum NamedType { #[derive(Debug)] pub enum NamedValue { Single, - Tuple, #[allow(unused)] Block, +} - #[allow(unused)] - Array, +impl NamedValue { + crate fn to_coerce_hint(&self) -> Option { + match self { + NamedValue::Single => None, + NamedValue::Block => Some(ExpressionKindHint::Block), + } + } } #[allow(unused)] @@ -31,61 +40,16 @@ pub enum PositionalType { } impl PositionalType { - crate fn name(&self) -> String { + crate fn to_coerce_hint(&self) -> Option { match self { - PositionalType::Value(s) => s.clone(), - PositionalType::Block(s) => s.clone(), - } - } - - crate fn evaluate( - &self, - arg: ast::Expression, - scope: &Scope, - ) -> Result, ShellError> { - match self { - PositionalType::Value(_) => evaluate_expr(&arg, scope), - PositionalType::Block(_) => match arg { - ast::Expression { - expr: ast::RawExpression::Block(b), - .. - } => Ok(Spanned::from_item(Value::block(b.expr), arg.span.clone())), - ast::Expression { - expr: ast::RawExpression::Binary(binary), - .. - } => { - // TODO: Use original spans - let mut b = ast::ExpressionBuilder::new(); - if let Some(s) = binary.left.as_string() { - Ok(Spanned::from_item( - Value::block(b.binary(( - &|b| b.path((&|b| b.var("it"), vec![s.clone()])), - &|_| binary.operator.clone(), - &|_| binary.right.clone(), - ))), - arg.span.clone(), - )) - } else { - let mut b = ast::ExpressionBuilder::new(); - let expr = b.binary(( - &|_| binary.left.clone(), - &|_| binary.operator.clone(), - &|_| binary.right.clone(), - )); - - Ok(Spanned::from_item(Value::block(expr), arg.span.clone())) - } - } - other => { - let span = other.span.clone(); - Ok(Spanned::from_item(Value::block(other), span)) - } - }, + PositionalType::Value(_) => None, + PositionalType::Block(_) => Some(ExpressionKindHint::Block), } } } -#[derive(Debug)] +#[derive(Debug, Getters)] +#[get = "crate"] pub struct CommandConfig { crate name: String, crate mandatory_positional: Vec, @@ -94,90 +58,218 @@ pub struct CommandConfig { crate named: IndexMap, } -#[derive(Debug, Default)] +#[derive(Debug, Default, new)] pub struct Args { - pub positional: Vec>, - pub named: IndexMap, + pub positional: Option>>, + pub named: Option>>, +} + +#[derive(new)] +pub struct DebugPositional<'a> { + positional: &'a Option>>, +} + +impl fmt::Debug for DebugPositional<'a> { + fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result { + match &self.positional { + None => write!(f, "None"), + Some(positional) => f + .debug_list() + .entries(positional.iter().map(|p| p.item().debug())) + .finish(), + } + } +} + +#[derive(new)] +pub struct DebugNamed<'a> { + named: &'a Option>>, +} + +impl fmt::Debug for DebugNamed<'a> { + fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result { + match &self.named { + None => write!(f, "None"), + Some(named) => f + .debug_map() + .entries(named.iter().map(|(k, v)| (k, v.item().debug()))) + .finish(), + } + } +} + +pub struct DebugArgs<'a> { + args: &'a Args, +} + +impl fmt::Debug for DebugArgs<'a> { + fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result { + let mut s = f.debug_struct("Args"); + + s.field("positional", &DebugPositional::new(&self.args.positional)); + s.field("named", &DebugNamed::new(&self.args.named)); + + s.finish() + } +} + +impl Args { + pub fn debug(&'a self) -> DebugArgs<'a> { + DebugArgs { args: self } + } + + pub fn nth(&self, pos: usize) -> Option<&Spanned> { + match &self.positional { + None => None, + Some(array) => array.iter().nth(pos), + } + } + + pub fn expect_nth(&self, pos: usize) -> Result<&Spanned, ShellError> { + match &self.positional { + None => Err(ShellError::unimplemented("Better error: expect_nth")), + Some(array) => match array.iter().nth(pos) { + None => Err(ShellError::unimplemented("Better error: expect_nth")), + Some(item) => Ok(item), + }, + } + } + + pub fn len(&self) -> usize { + match &self.positional { + None => 0, + Some(array) => array.len(), + } + } + + pub fn has(&self, name: &str) -> bool { + match &self.named { + None => false, + Some(named) => named.contains_key(name), + } + } + + pub fn get(&self, name: &str) -> Option<&Spanned> { + match &self.named { + None => None, + Some(named) => named.get(name), + } + } + + pub fn positional_iter(&'a self) -> PositionalIter<'a> { + match &self.positional { + None => PositionalIter::Empty, + Some(v) => { + let iter = v.iter(); + PositionalIter::Array(iter) + } + } + } +} + +pub enum PositionalIter<'a> { + Empty, + Array(std::slice::Iter<'a, Spanned>), +} + +impl Iterator for PositionalIter<'a> { + type Item = &'a Spanned; + + fn next(&mut self) -> Option { + match self { + PositionalIter::Empty => None, + PositionalIter::Array(iter) => iter.next(), + } + } } impl CommandConfig { crate fn evaluate_args( &self, - args: impl Iterator, + call: &Spanned, + registry: &dyn CommandRegistry, scope: &Scope, + source: &str, ) -> Result { - let mut positional: Vec> = vec![]; - let mut named: IndexMap = IndexMap::default(); + let args = parse_command(self, registry, call, source)?; - let mut args: Vec = args.cloned().collect(); + trace!("parsed args: {:?}", args); - for (key, ty) in self.named.iter() { - let index = args.iter().position(|a| a.is_flag(&key)); + evaluate_args(args, registry, scope, source) - match (index, ty) { - (Some(i), NamedType::Switch) => { - args.remove(i); - named.insert(key.clone(), Value::boolean(true)); - } + // let mut positional: Vec> = vec![]; + // let mut named: IndexMap = IndexMap::default(); - (None, NamedType::Switch) => {} + // let mut args: Vec = args.cloned().collect(); - (Some(i), NamedType::Optional(v)) => { - args.remove(i); - named.insert(key.clone(), extract_named(&mut args, i, v)?); - } + // for (key, ty) in self.named.iter() { + // let index = args.iter().position(|a| a.is_flag(&key, source)); - (None, NamedType::Optional(_)) => {} + // match (index, ty) { + // (Some(i), NamedType::Switch) => { + // args.remove(i); + // named.insert(key.clone(), Value::boolean(true)); + // } - (Some(i), NamedType::Mandatory(v)) => { - args.remove(i); - named.insert(key.clone(), extract_named(&mut args, i, v)?); - } + // (None, NamedType::Switch) => {} - (None, NamedType::Mandatory(_)) => { - return Err(ShellError::string(&format!( - "Expected mandatory argument {}, but it was missing", - key - ))) - } - } - } + // (Some(i), NamedType::Optional(v)) => { + // args.remove(i); + // named.insert(key.clone(), extract_named(&mut args, i, v)?); + // } - let mut args = args.into_iter(); + // (None, NamedType::Optional(_)) => {} - for param in &self.mandatory_positional { - let arg = args.next(); + // (Some(i), NamedType::Mandatory(v)) => { + // args.remove(i); + // named.insert(key.clone(), extract_named(&mut args, i, v)?); + // } - let value = match arg { - None => { - return Err(ShellError::string(format!( - "expected mandatory positional argument {}", - param.name() - ))) - } + // (None, NamedType::Mandatory(_)) => { + // return Err(ShellError::string(&format!( + // "Expected mandatory argument {}, but it was missing", + // key + // ))) + // } + // } + // } - Some(arg) => param.evaluate(arg.clone(), scope)?, - }; + // let mut args = args.into_iter(); - positional.push(value); - } + // for param in &self.mandatory_positional { + // let arg = args.next(); - if self.rest_positional { - let rest: Result>, _> = - args.map(|i| evaluate_expr(&i, &Scope::empty())).collect(); - positional.extend(rest?); - } else { - let rest: Vec = args.collect(); + // let value = match arg { + // None => { + // return Err(ShellError::string(format!( + // "expected mandatory positional argument {}", + // param.name() + // ))) + // } - if rest.len() > 0 { - return Err(ShellError::string(&format!( - "Too many arguments, extras: {:?}", - rest - ))); - } - } + // Some(arg) => param.evaluate(arg.clone(), scope, source)?, + // }; - Ok(Args { positional, named }) + // positional.push(value); + // } + + // if self.rest_positional { + // let rest: Result>, _> = args + // .map(|i| evaluate_baseline_expr(&i, &Scope::empty(), source)) + // .collect(); + // positional.extend(rest?); + // } else { + // let rest: Vec = args.collect(); + + // if rest.len() > 0 { + // return Err(ShellError::string(&format!( + // "Too many arguments, extras: {:?}", + // rest + // ))); + // } + // } + + // Ok(Args { positional, named }) } #[allow(unused)] @@ -186,50 +278,64 @@ impl CommandConfig { } } -fn extract_named( - v: &mut Vec, - position: usize, - ty: &NamedValue, -) -> Result { - match ty { - NamedValue::Single => { - let expr = v.remove(position); - expect_simple_expr(expr) - } +fn evaluate_args( + args: hir::Call, + registry: &dyn CommandRegistry, + scope: &Scope, + source: &str, +) -> Result { + let positional: Result>, _> = args + .positional() + .as_ref() + .map(|p| { + p.iter() + .map(|e| evaluate_baseline_expr(e, &(), scope, source)) + .collect() + }) + .transpose(); - NamedValue::Tuple => { - let expr = v.remove(position); - let next = v.remove(position); + let positional = positional?; - let list = vec![expect_simple_expr(expr)?, expect_simple_expr(next)?]; - Ok(Value::List(list)) - } + let named: Result>>, ShellError> = args + .named() + .as_ref() + .map(|n| { + let mut results = IndexMap::new(); - other => Err(ShellError::string(&format!( - "Unimplemented named argument {:?}", - other - ))), - } -} + for (name, value) in n.named.iter() { + match value { + hir::named::NamedValue::PresentSwitch(span) => { + results.insert( + name.clone(), + Spanned::from_item(Value::boolean(true), *span), + ); + } + hir::named::NamedValue::Value(expr) => { + results.insert( + name.clone(), + evaluate_baseline_expr(expr, registry, scope, source)?, + ); + } -fn expect_simple_expr(expr: ast::Expression) -> Result { - match &*expr { - ast::RawExpression::Leaf(l) => Ok(match l { - ast::Leaf::Bare(s) => Value::string(s.to_string()), - ast::Leaf::String(s) => Value::string(s), - ast::Leaf::Boolean(b) => Value::boolean(*b), - ast::Leaf::Int(i) => Value::int(*i), - ast::Leaf::Unit(i, unit) => unit.compute(*i), - }), + _ => {} + }; + } - // TODO: Diagnostic - other => Err(ShellError::string(&format!( - "Expected a value, found {}", - other.print() - ))), - } + Ok(results) + }) + .transpose(); + + let named = named?; + + Ok(Args::new(positional, named)) } pub trait CommandRegistry { - fn get(&self, name: &str) -> CommandConfig; + fn get(&self, name: &str) -> Option; +} + +impl CommandRegistry for () { + fn get(&self, _name: &str) -> Option { + None + } } diff --git a/src/prelude.rs b/src/prelude.rs index d943d90827..b9fec2540c 100644 --- a/src/prelude.rs +++ b/src/prelude.rs @@ -5,7 +5,6 @@ crate use crate::env::host::handle_unexpected; crate use crate::env::{Environment, Host}; crate use crate::errors::ShellError; crate use crate::object::Value; -crate use crate::parser::ast; crate use crate::stream::{single_output, InputStream, OutputStream}; crate use futures::{FutureExt, StreamExt}; crate use std::collections::VecDeque; diff --git a/src/shell/helper.rs b/src/shell/helper.rs index 039a0b719e..e234aca42c 100644 --- a/src/shell/helper.rs +++ b/src/shell/helper.rs @@ -1,9 +1,8 @@ use crate::shell::completer::NuCompleter; -use crate::parser::lexer::SpannedToken; +use crate::parser::nom_input; use crate::prelude::*; use ansi_term::Color; -use log::trace; use rustyline::completion::{self, Completer, FilenameCompleter}; use rustyline::error::ReadlineError; use rustyline::highlight::Highlighter; @@ -47,7 +46,7 @@ impl Hinter for Helper { } impl Highlighter for Helper { - fn highlight_prompt<'b, 's: 'b, 'p:'b>(&'s self, prompt: &'p str, _: bool) -> Cow<'b, str> { + fn highlight_prompt<'b, 's: 'b, 'p: 'b>(&'s self, prompt: &'p str, _: bool) -> Cow<'b, str> { Owned("\x1b[32m".to_owned() + &prompt[0..prompt.len() - 2] + "\x1b[m> ") } @@ -56,30 +55,42 @@ impl Highlighter for Helper { } fn highlight<'l>(&self, line: &'l str, _pos: usize) -> Cow<'l, str> { - let tokens = crate::parser::lexer::Lexer::new(line, true); - let tokens: Result, _> = tokens.collect(); + + return Cow::Borrowed(line); + + let tokens = crate::parser::pipeline(nom_input(line)); match tokens { Err(_) => Cow::Borrowed(line), - Ok(v) => { + Ok((_rest, v)) => { let mut out = String::new(); - let mut iter = v.iter(); + let tokens = match v.as_pipeline() { + Err(_) => return Cow::Borrowed(line), + Ok(v) => v, + }; - let mut state = State::Command; + let mut iter = tokens.into_iter(); + + match iter.next() { + None => return Cow::Owned(out), + Some(v) => out.push_str(v.span().slice(line)), + }; loop { match iter.next() { None => return Cow::Owned(out), - Some((start, token, end)) => { - let (style, new_state) = token_style(&token, state); + Some(token) => { + // let styled = token_style(&token, state); - trace!("token={:?}", token); - trace!("style={:?}", style); - trace!("new_state={:?}", new_state); + // trace!("token={:?}", token); + // trace!("style={:?}", style); + // trace!("new_state={:?}", new_state); - state = new_state; - let slice = &line[*start..*end]; - let styled = style.paint(slice); + // state = new_state; + // let slice = &line[*start..*end]; + // let styled = style.paint(slice); + out.push_str("|"); + let styled = Color::Black.bold().paint(token.span().slice(line)); out.push_str(&styled.to_string()); } } @@ -93,41 +104,4 @@ impl Highlighter for Helper { } } -#[derive(Debug)] -enum State { - Command, - Flag, - Var, - Bare, - None, -} - -fn token_style( - token: &crate::parser::lexer::SpannedToken, - state: State, -) -> (ansi_term::Style, State) { - use crate::parser::lexer::Token::*; - - match (state, &token.token) { - (State::Command, Bare) => (Color::Cyan.bold(), State::None), - (State::Command, Whitespace) => (Color::White.normal(), State::Command), - - (State::Flag, Bare) => (Color::Black.bold(), State::None), - - (State::Var, Variable) => (Color::Yellow.bold(), State::None), - - (State::Bare, PathDot) => (Color::Green.normal(), State::Bare), - (State::Bare, Member) => (Color::Green.normal(), State::Bare), - - (_, Dash) | (_, DashDash) => (Color::Black.bold(), State::Flag), - (_, Dollar) => (Color::Yellow.bold(), State::Var), - (_, Bare) => (Color::Green.normal(), State::Bare), - (_, Member) => (Color::Cyan.normal(), State::None), - (_, Num) => (Color::Purple.bold(), State::None), - (_, DQString) | (_, SQString) => (Color::Green.normal(), State::None), - (_, Pipe) => (Color::White.normal(), State::Command), - _ => (Color::White.normal(), State::None), - } -} - impl rustyline::Helper for Helper {} diff --git a/tests/sort_by.txt b/tests/sort_by.txt index b84c5e7ea2..aa933f8a2d 100644 --- a/tests/sort_by.txt +++ b/tests/sort_by.txt @@ -1,3 +1,3 @@ cd tests -open test.toml --raw | split-row "\n" | skip 1 | first 4 | split-column "=" | sort-by Column1 | skip 1 | first 1 | get Column1 | trim | echo $it +open test.toml --raw | lines | skip 1 | first 4 | split-column "=" | sort-by Column1 | skip 1 | first 1 | get Column1 | trim | echo $it exit diff --git a/tests/split.txt b/tests/split.txt index 5bc3d841f6..68713c675f 100644 --- a/tests/split.txt +++ b/tests/split.txt @@ -1,3 +1,3 @@ cd tests -open test.toml --raw | split-row "\n" | skip 1 | first 1 | split-column "=" | get Column1 | trim | echo $it +open test.toml --raw | lines | skip 1 | first 1 | split-column "=" | get Column1 | trim | echo $it exit