diff --git a/assets/default.themedump b/assets/default.themedump index a5ed231a..0470392a 100644 Binary files a/assets/default.themedump and b/assets/default.themedump differ diff --git a/assets/default_metadata.packdump b/assets/default_metadata.packdump index f321dc61..12c5962c 100644 Binary files a/assets/default_metadata.packdump and b/assets/default_metadata.packdump differ diff --git a/assets/default_newlines.packdump b/assets/default_newlines.packdump index 9be1a3a8..5ec85dde 100644 Binary files a/assets/default_newlines.packdump and b/assets/default_newlines.packdump differ diff --git a/assets/default_nonewlines.packdump b/assets/default_nonewlines.packdump index 90f89468..0ddfbd35 100644 Binary files a/assets/default_nonewlines.packdump and b/assets/default_nonewlines.packdump differ diff --git a/src/parsing/metadata.rs b/src/parsing/metadata.rs index 36466f3d..98cfc15b 100644 --- a/src/parsing/metadata.rs +++ b/src/parsing/metadata.rs @@ -493,13 +493,13 @@ mod tests { #[test] fn load_raw() { - let comments_file: &str = "testdata/Packages/Go/Comments.tmPreferences"; + let comments_file: &str = "testdata/Packages/Go/GoCommentRules.tmPreferences"; assert!(Path::new(comments_file).exists()); let r = RawMetadataEntry::load(comments_file); assert!(r.is_ok()); - let indent_file: &str = "testdata/Packages/Go/Indentation Rules.tmPreferences"; + let indent_file: &str = "testdata/Packages/Go/Indents/GoIndent.tmPreferences"; assert!(Path::new(indent_file).exists()); let r = RawMetadataEntry::load(indent_file).unwrap(); diff --git a/src/parsing/parser.rs b/src/parsing/parser.rs index 4b319e73..46254921 100644 --- a/src/parsing/parser.rs +++ b/src/parsing/parser.rs @@ -757,24 +757,35 @@ mod tests { let ops1 = ops(&mut state, "module Bob::Wow::Troll::Five; 5; end", &ss); let test_ops1 = vec![ (0, Push(Scope::new("source.ruby.rails").unwrap())), - (0, Push(Scope::new("meta.module.ruby").unwrap())), - (0, Push(Scope::new("keyword.control.module.ruby").unwrap())), + (0, Push(Scope::new("meta.namespace.ruby").unwrap())), + (0, Push(Scope::new("storage.type.namespace.ruby").unwrap())), + ( + 0, + Push(Scope::new("keyword.declaration.namespace.ruby").unwrap()), + ), (6, Pop(2)), - (6, Push(Scope::new("meta.module.ruby").unwrap())), (7, Pop(1)), - (7, Push(Scope::new("meta.module.ruby").unwrap())), - (7, Push(Scope::new("entity.name.module.ruby").unwrap())), + (7, Push(Scope::new("meta.namespace.ruby").unwrap())), + (7, Push(Scope::new("entity.name.namespace.ruby").unwrap())), (7, Push(Scope::new("support.other.namespace.ruby").unwrap())), (10, Pop(1)), - (10, Push(Scope::new("punctuation.accessor.ruby").unwrap())), + ( + 10, + Push(Scope::new("punctuation.accessor.double-colon.ruby").unwrap()), + ), + (12, Pop(1)), ]; assert_eq!(&ops1[0..test_ops1.len()], &test_ops1[..]); let ops2 = ops(&mut state, "def lol(wow = 5)", &ss); - let test_ops2 = vec![ + let test_ops2 = [ (0, Push(Scope::new("meta.function.ruby").unwrap())), - (0, Push(Scope::new("keyword.control.def.ruby").unwrap())), - (3, Pop(2)), + (0, Push(Scope::new("storage.type.function.ruby").unwrap())), + ( + 0, + Push(Scope::new("keyword.declaration.function.ruby").unwrap()), + ), + (3, Pop(3)), (3, Push(Scope::new("meta.function.ruby").unwrap())), (4, Push(Scope::new("entity.name.function.ruby").unwrap())), (7, Pop(1)), @@ -829,6 +840,7 @@ mod tests { test_stack.push(Scope::new("text.html.basic").unwrap()); test_stack.push(Scope::new("source.js.embedded.html").unwrap()); test_stack.push(Scope::new("source.js").unwrap()); + test_stack.push(Scope::new("meta.string.js").unwrap()); test_stack.push(Scope::new("string.quoted.single.js").unwrap()); test_stack.push(Scope::new("source.ruby.rails.embedded.html").unwrap()); test_stack.push(Scope::new("meta.function.parameters.ruby").unwrap()); @@ -860,40 +872,39 @@ mod tests { Push(Scope::new("keyword.operator.assignment.ruby").unwrap()) ), (5, Pop(1)), - ( - 6, - Push(Scope::new("string.unquoted.embedded.sql.ruby").unwrap()) - ), + (6, Push(Scope::new("meta.string.heredoc.ruby").unwrap())), + (6, Push(Scope::new("string.unquoted.heredoc.ruby").unwrap())), ( 6, Push(Scope::new("punctuation.definition.string.begin.ruby").unwrap()) ), + (12, Pop(2)), (12, Pop(1)), - (12, Pop(1)), + (12, Push(Scope::new("meta.string.heredoc.ruby").unwrap())), + (12, Push(Scope::new("source.sql.embedded.ruby").unwrap())), + (12, Clear(ClearAmount::TopN(2))), ( 12, - Push(Scope::new("string.unquoted.embedded.sql.ruby").unwrap()) + Push(Scope::new("punctuation.accessor.dot.ruby").unwrap()) ), - (12, Push(Scope::new("text.sql.embedded.ruby").unwrap())), - (12, Clear(ClearAmount::TopN(2))), - (12, Push(Scope::new("punctuation.accessor.ruby").unwrap())), (13, Pop(1)), - (18, Restore), ] ); - assert_eq!(ops(&mut state, "wow", &ss), vec![]); + assert_eq!(ops(&mut state, "wow", &ss), vec![(0, Restore)]); assert_eq!( ops(&mut state, "SQL", &ss), vec![ (0, Pop(1)), + (0, Push(Scope::new("string.unquoted.heredoc.ruby").unwrap())), ( 0, Push(Scope::new("punctuation.definition.string.end.ruby").unwrap()) ), (3, Pop(1)), (3, Pop(1)), + (3, Pop(1)), ] ); } @@ -998,8 +1009,8 @@ mod tests { let mut state1 = ParseState::new(syntax); let mut state2 = ParseState::new(syntax); - assert_eq!(ops(&mut state1, "class Foo {", &ss).len(), 11); - assert_eq!(ops(&mut state2, "class Fooo {", &ss).len(), 11); + assert_eq!(ops(&mut state1, "class Foo {", &ss).len(), 12); + assert_eq!(ops(&mut state2, "class Fooo {", &ss).len(), 12); assert_eq!(state1, state2); ops(&mut state1, "}", &ss); diff --git a/src/parsing/syntax_definition.rs b/src/parsing/syntax_definition.rs index d73c3e7c..856c42e5 100644 --- a/src/parsing/syntax_definition.rs +++ b/src/parsing/syntax_definition.rs @@ -51,7 +51,7 @@ pub struct Context { pub meta_scope: Vec, pub meta_content_scope: Vec, /// This being set false in the syntax file implies this field being set false, - /// but it can also be set falso for contexts that don't include the prototype for other reasons + /// but it can also be set false for contexts that don't include the prototype for other reasons pub meta_include_prototype: bool, pub clear_scopes: Option, /// This is filled in by the linker at link time @@ -75,6 +75,27 @@ impl Context { prototype: None, } } + + pub(crate) fn extend(&mut self, other: Context) { + let Context { + meta_scope, + meta_content_scope, + meta_include_prototype, + clear_scopes, + prototype, + uses_backrefs, + patterns, + } = other; + self.meta_scope.extend(meta_scope); + self.meta_content_scope.extend(meta_content_scope); + self.meta_include_prototype = meta_include_prototype; + self.clear_scopes = clear_scopes; + if self.prototype.is_none() || prototype.is_some() { + self.prototype = prototype; + } + self.uses_backrefs |= uses_backrefs; + self.patterns.extend(patterns); + } } #[derive(Clone, Debug, Eq, PartialEq, Serialize, Deserialize)] diff --git a/src/parsing/syntax_set.rs b/src/parsing/syntax_set.rs index 3833fed4..a1dccbb5 100644 --- a/src/parsing/syntax_set.rs +++ b/src/parsing/syntax_set.rs @@ -13,6 +13,7 @@ use std::fs::File; use std::io::{self, BufRead, BufReader}; use std::mem; use std::path::Path; +use std::path::PathBuf; use super::regex::Regex; use crate::parsing::syntax_definition::ContextId; @@ -83,6 +84,7 @@ pub(crate) struct LazyContexts { pub struct SyntaxSetBuilder { syntaxes: Vec, path_syntaxes: Vec<(String, usize)>, + extends_syntaxes: Vec<(PathBuf, String)>, #[cfg(feature = "metadata")] raw_metadata: LoadMetadata, @@ -108,6 +110,23 @@ fn load_syntax_file( .map_err(|e| LoadingError::ParseSyntax(e, format!("{}", p.display()))) } +#[cfg(feature = "yaml-load")] +fn load_syntax_file_with_extends( + p: &Path, + base_syntax: &SyntaxDefinition, + lines_include_newline: bool, +) -> Result { + let s = std::fs::read_to_string(p)?; + + SyntaxDefinition::load_from_str_extended( + &s, + Some(base_syntax), + lines_include_newline, + p.file_stem().and_then(|x| x.to_str()), + ) + .map_err(|e| LoadingError::ParseSyntax(e, format!("{}", p.display()))) +} + impl Clone for SyntaxSet { fn clone(&self) -> SyntaxSet { SyntaxSet { @@ -375,6 +394,7 @@ impl SyntaxSet { SyntaxSetBuilder { syntaxes: builder_syntaxes, path_syntaxes, + extends_syntaxes: Vec::new(), #[cfg(feature = "metadata")] existing_metadata: Some(metadata), #[cfg(feature = "metadata")] @@ -516,6 +536,8 @@ impl SyntaxSetBuilder { folder: P, lines_include_newline: bool, ) -> Result<(), LoadingError> { + use super::ParseSyntaxError; + for entry in crate::utils::walk_dir(folder).sort_by(|a, b| a.file_name().cmp(b.file_name())) { let entry = entry.map_err(LoadingError::WalkDir)?; @@ -524,7 +546,27 @@ impl SyntaxSetBuilder { .extension() .map_or(false, |e| e == "sublime-syntax") { - let syntax = load_syntax_file(entry.path(), lines_include_newline)?; + let syntax = match load_syntax_file(entry.path(), lines_include_newline) { + Ok(syntax) => syntax, + // We are extending another syntax, look it up in the set first + Err(LoadingError::ParseSyntax( + ParseSyntaxError::ExtendsNotFound { name, extends }, + _, + )) => { + if let Some(ix) = self + .path_syntaxes + .iter() + .find(|(s, _)| s.ends_with(extends.as_str())) + .map(|(_, ix)| *ix) + { + todo!("lookup {ix} and pass to {name}"); + } + self.extends_syntaxes + .push((entry.path().to_path_buf(), extends)); + continue; + } + Err(err) => return Err(err), + }; if let Some(path_str) = entry.path().to_str() { // Split the path up and rejoin with slashes so that syntaxes loaded on Windows // can still be loaded the same way. @@ -550,6 +592,45 @@ impl SyntaxSetBuilder { Ok(()) } + fn resolve_extends(&mut self) { + let mut prev_len = usize::MAX; + // Loop while syntaxes are being resolved + while !self.extends_syntaxes.is_empty() && prev_len > self.extends_syntaxes.len() { + prev_len = self.extends_syntaxes.len(); + // Split borrows to make the borrow cheker happy + let syntaxes = &mut self.syntaxes; + let paths = &mut self.path_syntaxes; + // Resolve syntaxes + self.extends_syntaxes.retain(|(path, extends)| { + let Some(ix) = paths + .iter() + .find(|(s, _)| s.ends_with(extends.as_str())) + .map(|(_, ix)| *ix) + else { + return true; + }; + let base_syntax = &syntaxes[ix]; + // FIXME: don't unwrap + let syntax = load_syntax_file_with_extends(path, base_syntax, false).unwrap(); + if let Some(path_str) = path.to_str() { + // Split the path up and rejoin with slashes so that syntaxes loaded on Windows + // can still be loaded the same way. + let path = Path::new(path_str); + let path_parts: Vec<_> = path.iter().map(|c| c.to_str().unwrap()).collect(); + paths.push((path_parts.join("/").to_string(), syntaxes.len())); + } + syntaxes.push(syntax); + false + }); + } + + if !self.extends_syntaxes.is_empty() { + dbg!(&self.path_syntaxes); + dbg!(&self.extends_syntaxes); + todo!("warn, unresolved syntaxes"); + } + } + /// Build a [`SyntaxSet`] from the syntaxes that have been added to this /// builder. /// @@ -571,16 +652,20 @@ impl SyntaxSetBuilder { /// directly load the [`SyntaxSet`]. /// /// [`SyntaxSet`]: struct.SyntaxSet.html - pub fn build(self) -> SyntaxSet { + pub fn build(mut self) -> SyntaxSet { + self.resolve_extends(); + #[cfg(not(feature = "metadata"))] let SyntaxSetBuilder { syntaxes: syntax_definitions, path_syntaxes, + extends_syntaxes: _, } = self; #[cfg(feature = "metadata")] let SyntaxSetBuilder { syntaxes: syntax_definitions, path_syntaxes, + extends_syntaxes: _, raw_metadata, existing_metadata, } = self; @@ -1032,7 +1117,7 @@ mod tests { .get_context(&syntax.context_ids()["main"]) .expect("#[cfg(test)]"); let count = syntax_definition::context_iter(&ps, main_context).count(); - assert_eq!(count, 109); + assert_eq!(count, 168); } #[test] diff --git a/src/parsing/yaml_load.rs b/src/parsing/yaml_load.rs index 24f32a23..6a4733f4 100644 --- a/src/parsing/yaml_load.rs +++ b/src/parsing/yaml_load.rs @@ -32,6 +32,9 @@ pub enum ParseSyntaxError { /// Syntaxes must have a context named "main" #[error("Context 'main' is missing")] MainMissing, + /// This syntax extends another syntax which is not available + #[error("Syntax for {name} extends {extends}, but {extends} could not be found")] + ExtendsNotFound { name: String, extends: String }, /// Some part of the YAML file is the wrong type (e.g a string but should be a list) /// Sorry this doesn't give you any way to narrow down where this is. /// Maybe use Sublime Text to figure it out. @@ -86,6 +89,15 @@ impl SyntaxDefinition { s: &str, lines_include_newline: bool, fallback_name: Option<&str>, + ) -> Result { + SyntaxDefinition::load_from_str_extended(s, None, lines_include_newline, fallback_name) + } + + pub(crate) fn load_from_str_extended( + s: &str, + extends: Option<&SyntaxDefinition>, + lines_include_newline: bool, + fallback_name: Option<&str>, ) -> Result { let docs = match YamlLoader::load_from_str(s) { Ok(x) => x, @@ -98,6 +110,7 @@ impl SyntaxDefinition { let mut scope_repo = SCOPE_REPO.lock().unwrap(); SyntaxDefinition::parse_top_level( doc, + extends, scope_repo.deref_mut(), lines_include_newline, fallback_name, @@ -106,13 +119,18 @@ impl SyntaxDefinition { fn parse_top_level( doc: &Yaml, + extends: Option<&SyntaxDefinition>, scope_repo: &mut ScopeRepository, lines_include_newline: bool, fallback_name: Option<&str>, ) -> Result { let h = doc.as_hash().ok_or(ParseSyntaxError::TypeMismatch)?; - let mut variables = HashMap::new(); + // Get variables from cloned syntax, will be overritten if the same is present as detailed + // in the spec + let mut variables = extends + .map(|syntax| syntax.variables.clone()) + .unwrap_or_default(); if let Ok(map) = get_key(h, "variables", |x| x.as_hash()) { for (key, value) in map.iter() { if let (Some(key_str), Some(val_str)) = (key.as_str(), value.as_str()) { @@ -120,6 +138,21 @@ impl SyntaxDefinition { } } } + + let name = get_key(h, "name", |x| x.as_str()) + .unwrap_or_else(|_| fallback_name.unwrap_or("Unnamed")) + .to_owned(); + // FIXME: extends is allowed to be a list also + let extends = match (get_key(h, "extends", |x| x.as_str()), extends) { + (Ok(base_syntax), None) => { + return Err(ParseSyntaxError::ExtendsNotFound { + name, + extends: base_syntax.to_string(), + }) + } + (Ok(_), Some(base_syntax)) => Some(base_syntax), + (Err(_), _) => None, + }; let contexts_hash = get_key(h, "contexts", |x| x.as_hash())?; let top_level_scope = scope_repo .build(get_key(h, "scope", |x| x.as_str())?) @@ -132,7 +165,11 @@ impl SyntaxDefinition { lines_include_newline, }; - let mut contexts = SyntaxDefinition::parse_contexts(contexts_hash, &mut state)?; + let mut contexts = SyntaxDefinition::parse_contexts( + contexts_hash, + extends.map(|syntax| &syntax.contexts), + &mut state, + )?; if !contexts.contains_key("main") { return Err(ParseSyntaxError::MainMissing); } @@ -147,9 +184,7 @@ impl SyntaxDefinition { } let defn = SyntaxDefinition { - name: get_key(h, "name", |x| x.as_str()) - .unwrap_or_else(|_| fallback_name.unwrap_or("Unnamed")) - .to_owned(), + name, scope: top_level_scope, file_extensions, // TODO maybe cache a compiled version of this Regex @@ -166,9 +201,11 @@ impl SyntaxDefinition { fn parse_contexts( map: &Hash, + extends: Option<&HashMap>, state: &mut ParserState<'_>, ) -> Result, ParseSyntaxError> { - let mut contexts = HashMap::new(); + // FIXME: contexts need to be re-evaluated with the new values of the variables + let mut contexts = extends.cloned().unwrap_or_default(); for (key, value) in map.iter() { if let (Some(name), Some(val_vec)) = (key.as_str(), value.as_vec()) { let is_prototype = name == "prototype"; @@ -194,13 +231,31 @@ impl SyntaxDefinition { is_prototype: bool, namer: &mut ContextNamer, ) -> Result { + enum InsertMode { + Replace, + Prepend, + Append, + } let mut context = Context::new(!is_prototype); let name = namer.next(); + let mut insert = InsertMode::Replace; for y in vec.iter() { let map = y.as_hash().ok_or(ParseSyntaxError::TypeMismatch)?; let mut is_special = false; + if let Ok(x) = get_key(map, "meta_prepend", |x| x.as_bool()) { + if x { + insert = InsertMode::Prepend; + } + is_special = true; + } + if let Ok(x) = get_key(map, "meta_append", |x| x.as_bool()) { + if x { + insert = InsertMode::Append; + } + is_special = true; + } if let Ok(x) = get_key(map, "meta_scope", |x| x.as_str()) { context.meta_scope = str_to_scopes(x, state.scope_repo)?; is_special = true; @@ -237,7 +292,26 @@ impl SyntaxDefinition { } } - contexts.insert(name.clone(), context); + match insert { + InsertMode::Replace => { + contexts.insert(name.clone(), context); + } + InsertMode::Append => { + contexts + .entry(name.clone()) + .and_modify(|ctx| ctx.extend(context.clone())) + .or_insert(context); + } + InsertMode::Prepend => { + contexts + .entry(name.clone()) + .and_modify(|ctx| { + context.extend(ctx.clone()); + *ctx = context.clone(); + }) + .or_insert(context); + } + } Ok(name) } @@ -887,7 +961,6 @@ impl<'a> Parser<'a> { #[cfg(test)] mod tests { use super::*; - use crate::parsing::syntax_definition::*; use crate::parsing::Scope; #[test] diff --git a/testdata/Packages b/testdata/Packages index fa6b8629..40ec1f2f 160000 --- a/testdata/Packages +++ b/testdata/Packages @@ -1 +1 @@ -Subproject commit fa6b8629c95041bf262d4c1dab95c456a0530122 +Subproject commit 40ec1f2f9b56fb55d739e17ecd003cc9e8c9b096 diff --git a/testdata/known_syntest_failures.txt b/testdata/known_syntest_failures.txt index f55cff60..81b8f558 100644 --- a/testdata/known_syntest_failures.txt +++ b/testdata/known_syntest_failures.txt @@ -1,5 +1,15 @@ loading syntax definitions from testdata/Packages -FAILED testdata/Packages/C#/tests/syntax_test_Strings.cs: 38 +FAILED testdata/Packages/Clojure/tests/syntax_test_clojure.clj: 1 +FAILED testdata/Packages/Erlang/syntax_test_erlang.erl: 783 +FAILED testdata/Packages/Git Formats/syntax_test_git_config: 17 +FAILED testdata/Packages/Git Formats/syntax_test_git_rebase: 3 +FAILED testdata/Packages/JSON/syntax_test_json.json: 4 +FAILED testdata/Packages/Java/syntax_test_java.java: 817 +FAILED testdata/Packages/JavaScript/tests/syntax_test_js.js: 47 FAILED testdata/Packages/LaTeX/syntax_test_latex.tex: 1 FAILED testdata/Packages/Makefile/syntax_test_makefile.mak: 6 +FAILED testdata/Packages/Markdown/syntax_test_markdown.md: 3920 +FAILED testdata/Packages/PHP/syntax_test_php.php: 22 +FAILED testdata/Packages/Ruby/syntax_test_ruby.rb: 1 +FAILED testdata/Packages/ShellScript/test/syntax_test_bash.sh: 14 exiting with code 1 diff --git a/testdata/known_syntest_failures_fancy.txt b/testdata/known_syntest_failures_fancy.txt index c052e1e9..e8b5484e 100644 --- a/testdata/known_syntest_failures_fancy.txt +++ b/testdata/known_syntest_failures_fancy.txt @@ -1,5 +1,14 @@ loading syntax definitions from testdata/Packages -FAILED testdata/Packages/C#/tests/syntax_test_Strings.cs: 38 +FAILED testdata/Packages/Clojure/tests/syntax_test_clojure.clj: 1 +FAILED testdata/Packages/Erlang/syntax_test_erlang.erl: 783 +FAILED testdata/Packages/Git Formats/syntax_test_git_config: 17 +FAILED testdata/Packages/Git Formats/syntax_test_git_rebase: 3 +FAILED testdata/Packages/JSON/syntax_test_json.json: 4 +FAILED testdata/Packages/Java/syntax_test_java.java: 817 +FAILED testdata/Packages/JavaScript/tests/syntax_test_js.js: 47 FAILED testdata/Packages/LaTeX/syntax_test_latex.tex: 1 -FAILED testdata/Packages/Markdown/syntax_test_markdown.md: 11 +FAILED testdata/Packages/Markdown/syntax_test_markdown.md: 3920 +FAILED testdata/Packages/PHP/syntax_test_php.php: 22 +FAILED testdata/Packages/Ruby/syntax_test_ruby.rb: 1 +FAILED testdata/Packages/ShellScript/test/syntax_test_bash.sh: 14 exiting with code 1