diff --git a/core/src/cache.rs b/core/src/cache.rs index e5f962f3ea..e120f1106f 100644 --- a/core/src/cache.rs +++ b/core/src/cache.rs @@ -32,7 +32,7 @@ use std::time::SystemTime; use void::Void; /// Supported input formats. -#[derive(Default, Clone, Copy, Eq, Debug, PartialEq)] +#[derive(Default, Clone, Copy, Eq, Debug, PartialEq, Hash)] pub enum InputFormat { #[default] Nickel, @@ -58,10 +58,36 @@ impl InputFormat { _ => None, } } - /// Renturns an [InputFormat] based on the extension of a source path. + + pub fn from_tag(tag: &str) -> Option { + Some(match tag { + "Json" => InputFormat::Json, + "Nickel" => InputFormat::Nickel, + "Raw" => InputFormat::Raw, + "Yaml" => InputFormat::Yaml, + "Toml" => InputFormat::Toml, + #[cfg(feature = "nix-experimental")] + "Nix" => InputFormat::Nix, + _ => return None, + }) + } + + pub fn to_tag(&self) -> &'static str { + match self { + InputFormat::Nickel => "Nickel", + InputFormat::Json => "Json", + InputFormat::Yaml => "Yaml", + InputFormat::Toml => "Toml", + InputFormat::Raw => "Raw", + #[cfg(feature = "nix-experimental")] + InputFormat::Nix => "Nix", + } + } + + /// Extracts format embedded in SourcePath pub fn from_source_path(source_path: &SourcePath) -> Option { - if let SourcePath::Path(p) = source_path { - Self::from_path(p) + if let SourcePath::Path(_p, fmt) = source_path { + Some(*fmt) } else { None } @@ -269,7 +295,7 @@ pub enum SourcePath { /// /// This is the only `SourcePath` variant that can be resolved as the target /// of an import statement. - Path(PathBuf), + Path(PathBuf, InputFormat), /// A subrange of a file at the given path. /// /// This is used by nls to analyze small parts of files that don't fully parse. The @@ -290,7 +316,7 @@ impl<'a> TryFrom<&'a SourcePath> for &'a OsStr { fn try_from(value: &'a SourcePath) -> Result { match value { - SourcePath::Path(p) | SourcePath::Snippet(p) => Ok(p.as_os_str()), + SourcePath::Path(p, _) | SourcePath::Snippet(p) => Ok(p.as_os_str()), _ => Err(()), } } @@ -302,7 +328,7 @@ impl<'a> TryFrom<&'a SourcePath> for &'a OsStr { impl From for OsString { fn from(source_path: SourcePath) -> Self { match source_path { - SourcePath::Path(p) | SourcePath::Snippet(p) => p.into(), + SourcePath::Path(p, _) | SourcePath::Snippet(p) => p.into(), SourcePath::Std(StdlibModule::Std) => "".into(), SourcePath::Std(StdlibModule::Internals) => "".into(), SourcePath::Query => "".into(), @@ -364,13 +390,18 @@ impl Cache { /// Same as [Self::add_file], but assume that the path is already normalized, and take the /// timestamp as a parameter. - fn add_file_(&mut self, path: PathBuf, timestamp: SystemTime) -> io::Result { + fn add_file_( + &mut self, + path: PathBuf, + format: InputFormat, + timestamp: SystemTime, + ) -> io::Result { let contents = std::fs::read_to_string(&path)?; let file_id = self.files.add(&path, contents); self.file_paths - .insert(file_id, SourcePath::Path(path.clone())); + .insert(file_id, SourcePath::Path(path.clone(), format)); self.file_ids.insert( - SourcePath::Path(path), + SourcePath::Path(path, format), NameIdEntry { id: file_id, source: SourceKind::Filesystem(timestamp), @@ -383,24 +414,32 @@ impl Cache { /// /// Uses the normalized path and the *modified at* timestamp as the name-id table entry. /// Overrides any existing entry with the same name. - pub fn add_file(&mut self, path: impl Into) -> io::Result { + pub fn add_file( + &mut self, + path: impl Into, + format: InputFormat, + ) -> io::Result { let path = path.into(); let timestamp = timestamp(&path)?; let normalized = normalize_path(&path)?; - self.add_file_(normalized, timestamp) + self.add_file_(normalized, format, timestamp) } /// Try to retrieve the id of a file from the cache. /// /// If it was not in cache, try to read it from the filesystem and add it as a new entry. - pub fn get_or_add_file(&mut self, path: impl Into) -> io::Result> { + pub fn get_or_add_file( + &mut self, + path: impl Into, + format: InputFormat, + ) -> io::Result> { let path = path.into(); let normalized = normalize_path(&path)?; - match self.id_or_new_timestamp_of(path.as_ref())? { + match self.id_or_new_timestamp_of(path.as_ref(), format)? { SourceState::UpToDate(id) => Ok(CacheOp::Cached(id)), - SourceState::Stale(timestamp) => { - self.add_file_(normalized, timestamp).map(CacheOp::Done) - } + SourceState::Stale(timestamp) => self + .add_file_(normalized, format, timestamp) + .map(CacheOp::Done), } } @@ -954,7 +993,7 @@ impl Cache { /// [normalize_path]). pub fn id_of(&self, name: &SourcePath) -> Option { match name { - SourcePath::Path(p) => match self.id_or_new_timestamp_of(p).ok()? { + SourcePath::Path(p, fmt) => match self.id_or_new_timestamp_of(p, *fmt).ok()? { SourceState::UpToDate(id) => Some(id), SourceState::Stale(_) => None, }, @@ -970,8 +1009,11 @@ impl Cache { /// /// The main point of this awkward signature is to minimize I/O operations: if we accessed /// the timestamp, keep it around. - fn id_or_new_timestamp_of(&self, name: &Path) -> io::Result { - match self.file_ids.get(&SourcePath::Path(name.to_owned())) { + fn id_or_new_timestamp_of(&self, name: &Path, format: InputFormat) -> io::Result { + match self + .file_ids + .get(&SourcePath::Path(name.to_owned(), format)) + { None => Ok(SourceState::Stale(timestamp(name)?)), Some(NameIdEntry { id, @@ -1319,6 +1361,7 @@ pub trait ImportResolver { fn resolve( &mut self, path: &OsStr, + format: InputFormat, parent: Option, pos: &TermPos, ) -> Result<(ResolvedTerm, FileId), ImportError>; @@ -1333,6 +1376,7 @@ impl ImportResolver for Cache { fn resolve( &mut self, path: &OsStr, + format: InputFormat, parent: Option, pos: &TermPos, ) -> Result<(ResolvedTerm, FileId), ImportError> { @@ -1353,7 +1397,9 @@ impl ImportResolver for Cache { .find_map(|parent| { let mut path_buf = parent.clone(); path_buf.push(path); - self.get_or_add_file(&path_buf).ok().map(|x| (x, path_buf)) + self.get_or_add_file(&path_buf, format) + .ok() + .map(|x| (x, path_buf)) }) .ok_or_else(|| { let parents = possible_parents @@ -1367,7 +1413,6 @@ impl ImportResolver for Cache { ) })?; - let format = InputFormat::from_path(&path_buf).unwrap_or_default(); let (result, file_id) = match id_op { CacheOp::Cached(id) => (ResolvedTerm::FromCache, id), CacheOp::Done(id) => (ResolvedTerm::FromFile { path: path_buf }, id), @@ -1467,6 +1512,7 @@ pub mod resolvers { fn resolve( &mut self, _path: &OsStr, + _format: InputFormat, _parent: Option, _pos: &TermPos, ) -> Result<(ResolvedTerm, FileId), ImportError> { @@ -1508,6 +1554,7 @@ pub mod resolvers { fn resolve( &mut self, path: &OsStr, + _format: InputFormat, _parent: Option, pos: &TermPos, ) -> Result<(ResolvedTerm, FileId), ImportError> { diff --git a/core/src/error/mod.rs b/core/src/error/mod.rs index 27a26740dc..faef695eb7 100644 --- a/core/src/error/mod.rs +++ b/core/src/error/mod.rs @@ -583,6 +583,8 @@ pub enum ParseError { /// time, there are a set of expressions that can be excluded syntactically. Currently, it's /// mostly constants. InvalidContract(RawSpan), + /// Unrecognized explicit import format tag + InvalidImportFormat { span: RawSpan }, } /// An error occurring during the resolution of an import. @@ -815,6 +817,9 @@ impl ParseError { } } InternalParseError::InvalidContract(span) => ParseError::InvalidContract(span), + InternalParseError::InvalidImportFormat { span } => { + ParseError::InvalidImportFormat { span } + } }, } } @@ -2113,6 +2118,13 @@ impl IntoDiagnostics for ParseError { .to_owned(), "Only functions and records might be valid contracts".to_owned(), ]), + ParseError::InvalidImportFormat{span} => Diagnostic::error() + .with_message("unknown import format tag") + .with_labels(vec![primary(&span)]) + .with_notes(vec![ + "Examples of valid format tags: 'Nickel 'Json 'Yaml 'Toml 'Raw" + .to_owned() + ]), }; vec![diagnostic] diff --git a/core/src/eval/mod.rs b/core/src/eval/mod.rs index 0f315b3464..e5a52e9121 100644 --- a/core/src/eval/mod.rs +++ b/core/src/eval/mod.rs @@ -796,7 +796,7 @@ impl VirtualMachine { )); } } - Term::Import(path) => { + Term::Import { path, .. } => { return Err(EvalError::InternalError( format!("Unresolved import ({})", path.to_string_lossy()), pos, @@ -1169,7 +1169,7 @@ pub fn subst( | v @ Term::ForeignId(_) | v @ Term::SealingKey(_) | v @ Term::Enum(_) - | v @ Term::Import(_) + | v @ Term::Import{..} | v @ Term::ResolvedImport(_) // We could recurse here, because types can contain terms which would then be subject to // substitution. Not recursing should be fine, though, because a type in term position diff --git a/core/src/eval/tests.rs b/core/src/eval/tests.rs index 7ff97f59fa..ea3c9f0de5 100644 --- a/core/src/eval/tests.rs +++ b/core/src/eval/tests.rs @@ -131,15 +131,15 @@ fn imports() { .add_source(String::from("bad"), String::from("^$*/.23ab 0°@")); vm.import_resolver_mut().add_source( String::from("nested"), - String::from("let x = import \"two\" in x + 1"), + String::from("let x = import 'Nickel \"two\" in x + 1"), ); vm.import_resolver_mut().add_source( String::from("cycle"), - String::from("let x = import \"cycle_b\" in {a = 1, b = x.a}"), + String::from("let x = import 'Nickel \"cycle_b\" in {a = 1, b = x.a}"), ); vm.import_resolver_mut().add_source( String::from("cycle_b"), - String::from("let x = import \"cycle\" in {a = x.a}"), + String::from("let x = import 'Nickel \"cycle\" in {a = x.a}"), ); fn mk_import( @@ -152,7 +152,11 @@ fn imports() { R: ImportResolver, { resolve_imports( - mk_term::let_one_in(var, mk_term::import(import), body), + mk_term::let_one_in( + var, + mk_term::import(import, crate::cache::InputFormat::Nickel), + body, + ), vm.import_resolver_mut(), ) .map(|resolve_result| resolve_result.transformed_term) diff --git a/core/src/parser/error.rs b/core/src/parser/error.rs index 99206e9f9d..817460d83a 100644 --- a/core/src/parser/error.rs +++ b/core/src/parser/error.rs @@ -153,4 +153,6 @@ pub enum ParseError { /// time, there are a set of expressions that can be excluded syntactically. Currently, it's /// mostly constants. InvalidContract(RawSpan), + /// Unrecognized explicit import format tag + InvalidImportFormat { span: RawSpan }, } diff --git a/core/src/parser/grammar.lalrpop b/core/src/parser/grammar.lalrpop index 991673ec80..1f504d9006 100644 --- a/core/src/parser/grammar.lalrpop +++ b/core/src/parser/grammar.lalrpop @@ -252,7 +252,12 @@ UniTerm: UniTerm = { => { UniTerm::from(err) }, - "import" => UniTerm::from(Term::Import(OsString::from(s))), + "import" =>? { + Ok(UniTerm::from(mk_import_based_on_filename(s, mk_span(src_id, l, r))?)) + }, + "import" =>? { + Ok(UniTerm::from(mk_import_explicit(s, t, mk_span(src_id, l, r))?)) + }, }; AnnotatedInfixExpr: UniTerm = { diff --git a/core/src/parser/tests.rs b/core/src/parser/tests.rs index 5d0783aec5..ef1e827013 100644 --- a/core/src/parser/tests.rs +++ b/core/src/parser/tests.rs @@ -555,7 +555,7 @@ fn ty_var_kind_mismatch() { fn import() { assert_eq!( parse_without_pos("import \"file.ncl\""), - mk_term::import("file.ncl") + mk_term::import("file.ncl", crate::cache::InputFormat::Nickel) ); assert_matches!( parse("import \"file.ncl\" some args"), @@ -564,7 +564,7 @@ fn import() { assert_eq!( parse_without_pos("(import \"file.ncl\") some args"), mk_app!( - mk_term::import("file.ncl"), + mk_term::import("file.ncl", crate::cache::InputFormat::Nickel), mk_term::var("some"), mk_term::var("args") ) diff --git a/core/src/parser/utils.rs b/core/src/parser/utils.rs index 4ac5b0ca17..1db0114ff7 100644 --- a/core/src/parser/utils.rs +++ b/core/src/parser/utils.rs @@ -1,6 +1,7 @@ //! Various helpers and companion code for the parser are put here to keep the grammar definition //! uncluttered. use indexmap::map::Entry; +use std::ffi::OsString; use std::rc::Rc; use std::{collections::HashSet, fmt::Debug}; @@ -10,6 +11,7 @@ use self::pattern::bindings::Bindings as _; use super::error::ParseError; +use crate::cache::InputFormat; use crate::{ combine::Combine, eval::{ @@ -699,6 +701,29 @@ pub fn mk_fun(pat: Pattern, body: RichTerm) -> Term { } } +pub fn mk_import_based_on_filename(path: String, _span: RawSpan) -> Result { + let path = OsString::from(path); + let format: Option = + InputFormat::from_path(std::path::Path::new(path.as_os_str())); + + // Fall back to InputFormat::Nickel in case of unknown filename extension for backwards compatiblilty. + let format = format.unwrap_or_default(); + + Ok(Term::Import { path, format }) +} + +pub fn mk_import_explicit( + path: String, + format: LocIdent, + span: RawSpan, +) -> Result { + let path = OsString::from(path); + let Some(format) = InputFormat::from_tag(format.label()) else { + return Err(ParseError::InvalidImportFormat { span }); + }; + Ok(Term::Import { path, format }) +} + /// Determine the minimal level of indentation of a multi-line string. /// /// The result is determined by computing the minimum indentation level among all lines, where the diff --git a/core/src/pretty.rs b/core/src/pretty.rs index 97f2101bd6..c1795740c2 100644 --- a/core/src/pretty.rs +++ b/core/src/pretty.rs @@ -1,5 +1,6 @@ use std::fmt; +use crate::cache::InputFormat; use crate::identifier::LocIdent; use crate::parser::lexer::KEYWORDS; use crate::term::{ @@ -143,7 +144,7 @@ fn needs_parens_in_type_pos(typ: &Type) -> bool { | Term::Let(..) | Term::LetPattern(..) | Term::Op1(UnaryOp::IfThenElse, _) - | Term::Import(..) + | Term::Import { .. } | Term::ResolvedImport(..) ) } else { @@ -1056,9 +1057,20 @@ where SealingKey(sym) => allocator.text(format!("%")), Sealed(_i, _rt, _lbl) => allocator.text("%"), Annotated(annot, rt) => allocator.atom(rt).append(annot.pretty(allocator)), - Import(f) => allocator - .text("import ") - .append(allocator.as_string(f.to_string_lossy()).double_quotes()), + Import { path, format } => { + docs![ + allocator, + "import", + if Some(*format) + != InputFormat::from_path(std::path::Path::new(path.as_os_str())) + { + docs![allocator, "'", format.to_tag(), allocator.space()] + } else { + allocator.space() + }, + allocator.as_string(path.to_string_lossy()).double_quotes() + ] + } ResolvedImport(id) => allocator.text(format!("import ")), // This type is in term position, so we don't need to add parentheses. Type { typ, contract: _ } => typ.pretty(allocator), diff --git a/core/src/program.rs b/core/src/program.rs index 34005b7df9..63e93ad407 100644 --- a/core/src/program.rs +++ b/core/src/program.rs @@ -220,10 +220,10 @@ impl Program { let mut cache = Cache::new(ErrorTolerance::Strict); let main_id = match input { - Input::Path(path) => cache.add_file(path)?, + Input::Path(path) => cache.add_file(path, InputFormat::Nickel)?, Input::Source(source, name) => { let path = PathBuf::from(name.into()); - cache.add_source(SourcePath::Path(path), source)? + cache.add_source(SourcePath::Path(path, InputFormat::Nickel), source)? } }; @@ -252,13 +252,19 @@ impl Program { let merge_term = inputs .into_iter() .map(|input| match input { - Input::Path(path) => RichTerm::from(Term::Import(path.into())), + Input::Path(path) => RichTerm::from(Term::Import { + path: path.into(), + format: InputFormat::Nickel, + }), Input::Source(source, name) => { let path = PathBuf::from(name.into()); cache - .add_source(SourcePath::Path(path.clone()), source) + .add_source(SourcePath::Path(path.clone(), InputFormat::Nickel), source) .unwrap(); - RichTerm::from(Term::Import(path.into())) + RichTerm::from(Term::Import { + path: path.into(), + format: InputFormat::Nickel, + }) } }) .reduce(|acc, f| mk_term::op2(BinaryOp::Merge(Label::default().into()), acc, f)) diff --git a/core/src/repl/mod.rs b/core/src/repl/mod.rs index 1e376a10f0..28ef952fa3 100644 --- a/core/src/repl/mod.rs +++ b/core/src/repl/mod.rs @@ -230,7 +230,7 @@ impl Repl for ReplImpl { let file_id = self .vm .import_resolver_mut() - .add_file(OsString::from(path.as_ref())) + .add_file(OsString::from(path.as_ref()), InputFormat::Nickel) .map_err(IOError::from)?; self.vm .import_resolver_mut() diff --git a/core/src/term/mod.rs b/core/src/term/mod.rs index 12b72dd7b6..28206a94c2 100644 --- a/core/src/term/mod.rs +++ b/core/src/term/mod.rs @@ -21,6 +21,7 @@ use smallvec::SmallVec; use string::NickelString; use crate::{ + cache::InputFormat, error::{EvalError, ParseError}, eval::{cache::CacheIndex, Environment}, identifier::LocIdent, @@ -207,7 +208,7 @@ pub enum Term { /// An unresolved import. #[serde(skip)] - Import(OsString), + Import { path: OsString, format: InputFormat }, /// A resolved import (which has already been loaded and parsed). #[serde(skip)] @@ -365,7 +366,16 @@ impl PartialEq for Term { l0 == r0 && l1 == r1 && l2 == r2 } (Self::Annotated(l0, l1), Self::Annotated(r0, r1)) => l0 == r0 && l1 == r1, - (Self::Import(l0), Self::Import(r0)) => l0 == r0, + ( + Self::Import { + path: l0, + format: l1, + }, + Self::Import { + path: r0, + format: r1, + }, + ) => l0 == r0 && l1 == r1, (Self::ResolvedImport(l0), Self::ResolvedImport(r0)) => l0 == r0, ( Self::Type { @@ -973,7 +983,7 @@ impl Term { | Term::Op1(_, _) | Term::Op2(_, _, _) | Term::OpN(..) - | Term::Import(_) + | Term::Import { .. } | Term::ResolvedImport(_) | Term::StrChunks(_) | Term::ParseError(_) @@ -1026,7 +1036,7 @@ impl Term { | Term::OpN(..) | Term::Sealed(..) | Term::Annotated(..) - | Term::Import(_) + | Term::Import{..} | Term::ResolvedImport(_) | Term::StrChunks(_) | Term::RecRecord(..) @@ -1088,7 +1098,7 @@ impl Term { | Term::OpN(..) | Term::Sealed(..) | Term::Annotated(..) - | Term::Import(_) + | Term::Import { .. } | Term::ResolvedImport(_) | Term::StrChunks(_) | Term::RecRecord(..) @@ -1144,7 +1154,7 @@ impl Term { | Term::OpN(..) | Term::Sealed(..) | Term::Annotated(..) - | Term::Import(..) + | Term::Import{..} | Term::ResolvedImport(..) | Term::Closure(_) | Term::ParseError(_) @@ -2383,7 +2393,7 @@ impl Traverse for RichTerm { | Term::Var(_) | Term::Closure(_) | Term::Enum(_) - | Term::Import(_) + | Term::Import { .. } | Term::ResolvedImport(_) | Term::SealingKey(_) | Term::ForeignId(_) @@ -2852,11 +2862,15 @@ pub mod make { mk_fun!("x", var("x")) } - pub fn import(path: S) -> RichTerm + pub fn import(path: S, format: InputFormat) -> RichTerm where S: Into, { - Term::Import(path.into()).into() + Term::Import { + path: path.into(), + format, + } + .into() } pub fn integer(n: impl Into) -> RichTerm { diff --git a/core/src/transform/free_vars.rs b/core/src/transform/free_vars.rs index a01643eb1c..b91395a957 100644 --- a/core/src/transform/free_vars.rs +++ b/core/src/transform/free_vars.rs @@ -42,7 +42,7 @@ impl CollectFreeVars for RichTerm { | Term::ForeignId(_) | Term::SealingKey(_) | Term::Enum(_) - | Term::Import(_) + | Term::Import { .. } | Term::ResolvedImport(_) => (), Term::Fun(id, t) => { let mut fresh = HashSet::new(); diff --git a/core/src/transform/import_resolution.rs b/core/src/transform/import_resolution.rs index f549750452..6bf9d24c91 100644 --- a/core/src/transform/import_resolution.rs +++ b/core/src/transform/import_resolution.rs @@ -144,7 +144,8 @@ pub mod tolerant { { let term = rt.as_ref(); match term { - Term::Import(path) => match resolver.resolve(path, parent, &rt.pos) { + Term::Import { path, format } => match resolver.resolve(path, *format, parent, &rt.pos) + { Ok((_, file_id)) => (RichTerm::new(Term::ResolvedImport(file_id), rt.pos), None), Err(err) => (rt, Some(err)), }, diff --git a/core/src/typecheck/mod.rs b/core/src/typecheck/mod.rs index a2c335dedc..f8f1d06f46 100644 --- a/core/src/typecheck/mod.rs +++ b/core/src/typecheck/mod.rs @@ -1449,7 +1449,7 @@ fn walk( | Term::SealingKey(_) // This function doesn't recursively typecheck imports: this is the responsibility of the // caller. - | Term::Import(_) + | Term::Import{..} | Term::ResolvedImport(_) => Ok(()), Term::Var(x) => ctxt.type_env .get(&x.ident()) @@ -2407,7 +2407,7 @@ fn check( .unify(mk_uniftype::sym(), state, &ctxt) .map_err(|err| err.into_typecheck_err(state, rt.pos)), Term::Sealed(_, t, _) => check(state, ctxt, visitor, t, ty), - Term::Import(_) => ty + Term::Import { .. } => ty .unify(mk_uniftype::dynamic(), state, &ctxt) .map_err(|err| err.into_typecheck_err(state, rt.pos)), // We use the apparent type of the import for checking. This function doesn't recursively diff --git a/core/tests/integration/inputs/imports/explicit.ncl b/core/tests/integration/inputs/imports/explicit.ncl new file mode 100644 index 0000000000..dfa8be93f0 --- /dev/null +++ b/core/tests/integration/inputs/imports/explicit.ncl @@ -0,0 +1,11 @@ +# test.type = 'pass' + +[ + (import 'Nickel "imported/file_without_extension") == 1234, + (import 'Raw "imported/file_without_extension") |> std.string.is_match "^1200\\+34\\s*$", + (import 'Nickel "imported/file_with_unknown_extension.tst") == 1234, + (import 'Raw "imported/file_with_unknown_extension.tst") |> std.string.is_match "^34\\+1200\\s*$", + (import 'Raw "imported/empty.yaml") == "", + (import 'Raw "imported/two.ncl") |> std.string.is_match "^\\s*\\#", +] +|> std.test.assert_all diff --git a/core/tests/integration/inputs/imports/explicit_unknowntag.ncl b/core/tests/integration/inputs/imports/explicit_unknowntag.ncl new file mode 100644 index 0000000000..23102f5ca1 --- /dev/null +++ b/core/tests/integration/inputs/imports/explicit_unknowntag.ncl @@ -0,0 +1,6 @@ +# test.type = 'error' +# +# [test.metadata] +# error = 'ParseError' + +import 'Qqq "imported/empty.yaml" diff --git a/core/tests/integration/inputs/imports/fallback.ncl b/core/tests/integration/inputs/imports/fallback.ncl new file mode 100644 index 0000000000..674b62c07f --- /dev/null +++ b/core/tests/integration/inputs/imports/fallback.ncl @@ -0,0 +1,8 @@ +# test.type = 'pass' + +# Testing that importing files with unknown extension interprets them as Nickel source code +[ + (import "imported/file_without_extension") == 1234, + (import "imported/file_with_unknown_extension.tst") == 1234, +] +|> std.test.assert_all diff --git a/core/tests/integration/inputs/imports/imported/file_with_unknown_extension.tst b/core/tests/integration/inputs/imports/imported/file_with_unknown_extension.tst new file mode 100644 index 0000000000..a4a447b72a --- /dev/null +++ b/core/tests/integration/inputs/imports/imported/file_with_unknown_extension.tst @@ -0,0 +1 @@ +34+1200 diff --git a/core/tests/integration/inputs/imports/imported/file_without_extension b/core/tests/integration/inputs/imports/imported/file_without_extension new file mode 100644 index 0000000000..8ea46cc466 --- /dev/null +++ b/core/tests/integration/inputs/imports/imported/file_without_extension @@ -0,0 +1 @@ +1200+34 diff --git a/doc/manual/syntax.md b/doc/manual/syntax.md index 2774bb9d5f..d8d7d6d52f 100644 --- a/doc/manual/syntax.md +++ b/doc/manual/syntax.md @@ -1305,4 +1305,26 @@ record is serialized. This includes the output of the `nickel export` command: "{\n \"foo\": 1\n}" ``` +## Imports + +There is special keyword `import`, which can be followed by either a +string literal or an enum tag and a string literal. + +This causes Nickel to read, evaluate and return the specified file. + +The file is searched in directories specified by `NICKEL_IMPORT_PATH` +environment variable or similar command line option, with default being +the current directory. + +One-argument import, like `import "myfile.ncl"`, uses filename extension +to determine the file format. Nickel embeds a short list of known filename +extensions: `ncl`, `json`, `yml`, `yaml`, `toml`, `txt` and +`nix` with a fallback to a Nickel file if there is no extetnsion +or the extension is unknown. + +Two-argument import, like `import 'Raw "test.html"` uses a special enum +tag to determine the format. Currently the tags are `'Nickel`, `'Json`, +`'Yaml`, `'Toml`, `'Raw` and `'Nix`. Some of the formats may be unavailable +depending on compilation options of the Nickel interpreter. + [nix-string-context]: https://shealevy.com/blog/2018/08/05/understanding-nixs-string-context/ diff --git a/lsp/nls/src/background.rs b/lsp/nls/src/background.rs index 1a7b10a351..e58b6419a5 100644 --- a/lsp/nls/src/background.rs +++ b/lsp/nls/src/background.rs @@ -10,7 +10,7 @@ use crossbeam::channel::{bounded, Receiver, RecvTimeoutError, Sender}; use log::warn; use lsp_types::Url; use nickel_lang_core::{ - cache::SourcePath, + cache::{InputFormat, SourcePath}, eval::{cache::CacheImpl, VirtualMachine}, }; use serde::{Deserialize, Serialize}; @@ -93,7 +93,10 @@ pub fn worker_main() -> anyhow::Result<()> { anyhow::bail!("skipping invalid uri {}", eval.eval); }; - if let Some(file_id) = world.cache.id_of(&SourcePath::Path(path.clone())) { + if let Some(file_id) = world + .cache + .id_of(&SourcePath::Path(path.clone(), InputFormat::Nickel)) + { let mut diagnostics = world.parse_and_typecheck(file_id); // Evaluation diagnostics (but only if there were no parse/type errors). diff --git a/lsp/nls/src/cache.rs b/lsp/nls/src/cache.rs index 1f7a1d71f3..5b3c788f0a 100644 --- a/lsp/nls/src/cache.rs +++ b/lsp/nls/src/cache.rs @@ -1,5 +1,6 @@ use codespan::{ByteIndex, FileId}; use lsp_types::{TextDocumentPositionParams, Url}; +use nickel_lang_core::cache::InputFormat; use nickel_lang_core::term::{RichTerm, Term, Traverse}; use nickel_lang_core::{ cache::{Cache, CacheError, CacheOp, EntryState, SourcePath, TermEntry}, @@ -112,7 +113,7 @@ impl CacheExt for Cache { let path = uri .to_file_path() .map_err(|_| crate::error::Error::FileNotFound(uri.clone()))?; - Ok(self.id_of(&SourcePath::Path(path))) + Ok(self.id_of(&SourcePath::Path(path, InputFormat::Nickel))) } fn position( diff --git a/lsp/nls/src/requests/completion.rs b/lsp/nls/src/requests/completion.rs index 4c26ed5722..e1a748a586 100644 --- a/lsp/nls/src/requests/completion.rs +++ b/lsp/nls/src/requests/completion.rs @@ -229,7 +229,7 @@ pub fn handle_completion( let term = server.world.lookup_term_by_position(pos)?.cloned(); let ident = server.world.lookup_ident_by_position(pos)?; - if let Some(Term::Import(import)) = term.as_ref().map(|t| t.term.as_ref()) { + if let Some(Term::Import { path: import, .. }) = term.as_ref().map(|t| t.term.as_ref()) { // Don't respond with anything if trigger is a `.`, as that may be the // start of a relative file path `./`, or the start of a file extension if !matches!(trigger, Some(".")) { diff --git a/lsp/nls/src/requests/formatting.rs b/lsp/nls/src/requests/formatting.rs index b5f0058fca..4c8d172667 100644 --- a/lsp/nls/src/requests/formatting.rs +++ b/lsp/nls/src/requests/formatting.rs @@ -1,6 +1,6 @@ use lsp_server::{RequestId, Response, ResponseError}; use lsp_types::{DocumentFormattingParams, Position, Range, TextEdit}; -use nickel_lang_core::cache::SourcePath; +use nickel_lang_core::cache::{InputFormat, SourcePath}; use crate::{error::Error, files::uri_to_path, server::Server}; @@ -13,7 +13,11 @@ pub fn handle_format_document( server: &mut Server, ) -> Result<(), ResponseError> { let path = uri_to_path(¶ms.text_document.uri)?; - let file_id = server.world.cache.id_of(&SourcePath::Path(path)).unwrap(); + let file_id = server + .world + .cache + .id_of(&SourcePath::Path(path, InputFormat::Nickel)) + .unwrap(); let text = server.world.cache.files().source(file_id).clone(); let document_length = text.lines().count() as u32; diff --git a/lsp/nls/src/world.rs b/lsp/nls/src/world.rs index 7c8cb0eaaa..5847e5224b 100644 --- a/lsp/nls/src/world.rs +++ b/lsp/nls/src/world.rs @@ -91,7 +91,9 @@ impl World { // Replace the path (as opposed to adding it): we may already have this file in the // cache if it was imported by an already-open file. - let file_id = self.cache.replace_string(SourcePath::Path(path), contents); + let file_id = self + .cache + .replace_string(SourcePath::Path(path, InputFormat::Nickel), contents); // The cache automatically invalidates reverse-dependencies; we also need // to track them, so that we can clear our own analysis. @@ -120,7 +122,9 @@ impl World { contents: String, ) -> anyhow::Result<(FileId, Vec)> { let path = uri_to_path(&uri)?; - let file_id = self.cache.replace_string(SourcePath::Path(path), contents); + let file_id = self + .cache + .replace_string(SourcePath::Path(path, InputFormat::Nickel), contents); let invalid = self.cache.invalidate_cache(file_id); for f in &invalid { diff --git a/utils/src/bench.rs b/utils/src/bench.rs index 6179e07266..da40fd9a22 100644 --- a/utils/src/bench.rs +++ b/utils/src/bench.rs @@ -1,6 +1,6 @@ use criterion::Criterion; use nickel_lang_core::{ - cache::{Cache, Envs, ErrorTolerance}, + cache::{Cache, Envs, ErrorTolerance, InputFormat}, eval::{ cache::{Cache as EvalCache, CacheImpl}, VirtualMachine, @@ -112,7 +112,7 @@ pub fn bench_terms<'r>(rts: Vec>) -> Box b.iter_batched( || { let mut cache = cache.clone(); - let id = cache.add_file(bench.path()).unwrap(); + let id = cache.add_file(bench.path(), InputFormat::Nickel).unwrap(); let t = import_resolution::strict::resolve_imports(t.clone(), &mut cache) .unwrap() .transformed_term; @@ -202,7 +202,7 @@ macro_rules! ncl_bench_group { b.iter_batched( || { let mut cache = cache.clone(); - let id = cache.add_file(bench.path()).unwrap(); + let id = cache.add_file(bench.path(), InputFormat::Nickel).unwrap(); let t = resolve_imports(t.clone(), &mut cache) .unwrap() .transformed_term;