mirror of
https://github.com/helix-editor/helix.git
synced 2025-04-04 19:37:54 +03:00
syntax: Prefer RopeSlice
for non-id language injection markers
The `Name` variant's inner type can be switched to `RopeSlice` since the parent commit removed the usage of `&str`. In doing this we need to switch from a regular `Regex` to a `rope::Regex`, which is mostly a matter of renaming the type. The `Filename` and `Shebang` variants can also switch to `RopeSlice` which avoids allocations in cases where the text doesn't reside on different chunks of the rope. Previously `Filename`'s `Cow` was always the owned variant because of the conversion to a `PathBuf`.
This commit is contained in:
parent
060255344c
commit
76a8682c4d
1 changed files with 26 additions and 20 deletions
|
@ -36,12 +36,12 @@ use helix_loader::grammar::{get_language, load_runtime_file};
|
||||||
|
|
||||||
pub use tree_cursor::TreeCursor;
|
pub use tree_cursor::TreeCursor;
|
||||||
|
|
||||||
fn deserialize_regex<'de, D>(deserializer: D) -> Result<Option<Regex>, D::Error>
|
fn deserialize_regex<'de, D>(deserializer: D) -> Result<Option<rope::Regex>, D::Error>
|
||||||
where
|
where
|
||||||
D: serde::Deserializer<'de>,
|
D: serde::Deserializer<'de>,
|
||||||
{
|
{
|
||||||
Option::<String>::deserialize(deserializer)?
|
Option::<String>::deserialize(deserializer)?
|
||||||
.map(|buf| Regex::new(&buf).map_err(serde::de::Error::custom))
|
.map(|buf| rope::Regex::new(&buf).map_err(serde::de::Error::custom))
|
||||||
.transpose()
|
.transpose()
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@ -135,7 +135,7 @@ pub struct LanguageConfiguration {
|
||||||
|
|
||||||
// content_regex
|
// content_regex
|
||||||
#[serde(default, skip_serializing, deserialize_with = "deserialize_regex")]
|
#[serde(default, skip_serializing, deserialize_with = "deserialize_regex")]
|
||||||
pub injection_regex: Option<Regex>,
|
pub injection_regex: Option<rope::Regex>,
|
||||||
// first_line_regex
|
// first_line_regex
|
||||||
//
|
//
|
||||||
#[serde(skip)]
|
#[serde(skip)]
|
||||||
|
@ -1003,12 +1003,12 @@ impl Loader {
|
||||||
|
|
||||||
/// Unlike language_config_for_language_id, which only returns Some for an exact id, this
|
/// Unlike language_config_for_language_id, which only returns Some for an exact id, this
|
||||||
/// function will perform a regex match on the given string to find the closest language match.
|
/// function will perform a regex match on the given string to find the closest language match.
|
||||||
pub fn language_config_for_name(&self, name: &str) -> Option<Arc<LanguageConfiguration>> {
|
pub fn language_config_for_name(&self, slice: RopeSlice) -> Option<Arc<LanguageConfiguration>> {
|
||||||
let mut best_match_length = 0;
|
let mut best_match_length = 0;
|
||||||
let mut best_match_position = None;
|
let mut best_match_position = None;
|
||||||
for (i, configuration) in self.language_configs.iter().enumerate() {
|
for (i, configuration) in self.language_configs.iter().enumerate() {
|
||||||
if let Some(injection_regex) = &configuration.injection_regex {
|
if let Some(injection_regex) = &configuration.injection_regex {
|
||||||
if let Some(mat) = injection_regex.find(name) {
|
if let Some(mat) = injection_regex.find(slice.regex_input()) {
|
||||||
let length = mat.end() - mat.start();
|
let length = mat.end() - mat.start();
|
||||||
if length > best_match_length {
|
if length > best_match_length {
|
||||||
best_match_position = Some(i);
|
best_match_position = Some(i);
|
||||||
|
@ -1027,12 +1027,17 @@ impl Loader {
|
||||||
) -> Option<Arc<LanguageConfiguration>> {
|
) -> Option<Arc<LanguageConfiguration>> {
|
||||||
match capture {
|
match capture {
|
||||||
InjectionLanguageMarker::LanguageId(id) => self.language_config_for_language_id(id),
|
InjectionLanguageMarker::LanguageId(id) => self.language_config_for_language_id(id),
|
||||||
InjectionLanguageMarker::Name(string) => self.language_config_for_name(string),
|
InjectionLanguageMarker::Name(name) => self.language_config_for_name(*name),
|
||||||
InjectionLanguageMarker::Filename(file) => self.language_config_for_file_name(file),
|
InjectionLanguageMarker::Filename(file) => {
|
||||||
InjectionLanguageMarker::Shebang(shebang) => self
|
let path_str: Cow<str> = (*file).into();
|
||||||
.language_config_ids_by_shebang
|
self.language_config_for_file_name(Path::new(path_str.as_ref()))
|
||||||
.get(shebang)
|
}
|
||||||
.and_then(|&id| self.language_configs.get(id).cloned()),
|
InjectionLanguageMarker::Shebang(shebang) => {
|
||||||
|
let shebang_str: Cow<str> = (*shebang).into();
|
||||||
|
self.language_config_ids_by_shebang
|
||||||
|
.get(shebang_str.as_ref())
|
||||||
|
.and_then(|&id| self.language_configs.get(id).cloned())
|
||||||
|
}
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@ -2031,12 +2036,13 @@ impl HighlightConfiguration {
|
||||||
for capture in query_match.captures {
|
for capture in query_match.captures {
|
||||||
let index = Some(capture.index);
|
let index = Some(capture.index);
|
||||||
if index == self.injection_language_capture_index {
|
if index == self.injection_language_capture_index {
|
||||||
let name = byte_range_to_str(capture.node.byte_range(), source);
|
injection_capture = Some(InjectionLanguageMarker::Name(
|
||||||
injection_capture = Some(InjectionLanguageMarker::Name(name));
|
source.byte_slice(capture.node.byte_range()),
|
||||||
|
));
|
||||||
} else if index == self.injection_filename_capture_index {
|
} else if index == self.injection_filename_capture_index {
|
||||||
let name = byte_range_to_str(capture.node.byte_range(), source);
|
injection_capture = Some(InjectionLanguageMarker::Filename(
|
||||||
let path = Path::new(name.as_ref()).to_path_buf();
|
source.byte_slice(capture.node.byte_range()),
|
||||||
injection_capture = Some(InjectionLanguageMarker::Filename(path.into()));
|
));
|
||||||
} else if index == self.injection_shebang_capture_index {
|
} else if index == self.injection_shebang_capture_index {
|
||||||
let node_slice = source.byte_slice(capture.node.byte_range());
|
let node_slice = source.byte_slice(capture.node.byte_range());
|
||||||
|
|
||||||
|
@ -2055,7 +2061,7 @@ impl HighlightConfiguration {
|
||||||
.captures_iter(lines.regex_input())
|
.captures_iter(lines.regex_input())
|
||||||
.map(|cap| {
|
.map(|cap| {
|
||||||
let cap = lines.byte_slice(cap.get_group(1).unwrap().range());
|
let cap = lines.byte_slice(cap.get_group(1).unwrap().range());
|
||||||
InjectionLanguageMarker::Shebang(cap.into())
|
InjectionLanguageMarker::Shebang(cap)
|
||||||
})
|
})
|
||||||
.next()
|
.next()
|
||||||
} else if index == self.injection_content_capture_index {
|
} else if index == self.injection_content_capture_index {
|
||||||
|
@ -2533,9 +2539,9 @@ pub enum InjectionLanguageMarker<'a> {
|
||||||
/// looked up by finding the language config that sets an `language_id`, this variant contains
|
/// looked up by finding the language config that sets an `language_id`, this variant contains
|
||||||
/// text from the document being highlighted, so the text is checked against each language's
|
/// text from the document being highlighted, so the text is checked against each language's
|
||||||
/// `injection_regex`.
|
/// `injection_regex`.
|
||||||
Name(Cow<'a, str>),
|
Name(RopeSlice<'a>),
|
||||||
Filename(Cow<'a, Path>),
|
Filename(RopeSlice<'a>),
|
||||||
Shebang(String),
|
Shebang(RopeSlice<'a>),
|
||||||
}
|
}
|
||||||
|
|
||||||
const SHEBANG: &str = r"#!\s*(?:\S*[/\\](?:env\s+(?:\-\S+\s+)*)?)?([^\s\.\d]+)";
|
const SHEBANG: &str = r"#!\s*(?:\S*[/\\](?:env\s+(?:\-\S+\s+)*)?)?([^\s\.\d]+)";
|
||||||
|
|
Loading…
Add table
Add a link
Reference in a new issue