mirror of
https://github.com/helix-editor/helix.git
synced 2025-04-04 19:37:54 +03:00
tmp
This commit is contained in:
parent
0cd8817d06
commit
1bd36f528a
4 changed files with 426 additions and 311 deletions
|
@ -27,9 +27,15 @@ impl std::fmt::Debug for Grammar {
|
||||||
}
|
}
|
||||||
|
|
||||||
impl Grammar {
|
impl Grammar {
|
||||||
|
/// Loads a shared library containg a tree sitter grammar with name `name`
|
||||||
|
// from `library_path`.
|
||||||
|
///
|
||||||
|
/// # Safety
|
||||||
|
///
|
||||||
|
/// `library_path` must be a valid tree sitter grammar
|
||||||
pub unsafe fn new(name: &str, library_path: &Path) -> Result<Grammar, Error> {
|
pub unsafe fn new(name: &str, library_path: &Path) -> Result<Grammar, Error> {
|
||||||
let library = unsafe {
|
let library = unsafe {
|
||||||
Library::new(&library_path).map_err(|err| Error::DlOpen {
|
Library::new(library_path).map_err(|err| Error::DlOpen {
|
||||||
err,
|
err,
|
||||||
path: library_path.to_owned(),
|
path: library_path.to_owned(),
|
||||||
})?
|
})?
|
||||||
|
@ -45,7 +51,7 @@ impl Grammar {
|
||||||
Grammar { ptr: language_fn() }
|
Grammar { ptr: language_fn() }
|
||||||
};
|
};
|
||||||
let version = grammar.version();
|
let version = grammar.version();
|
||||||
if MIN_COMPATIBLE_ABI_VERSION <= version && version <= ABI_VERSION {
|
if (MIN_COMPATIBLE_ABI_VERSION..=ABI_VERSION).contains(&version) {
|
||||||
std::mem::forget(library);
|
std::mem::forget(library);
|
||||||
Ok(grammar)
|
Ok(grammar)
|
||||||
} else {
|
} else {
|
||||||
|
|
|
@ -1,46 +1,30 @@
|
||||||
use std::fmt::Display;
|
use std::fmt::{self, Display};
|
||||||
use std::iter::zip;
|
use std::ops::Range;
|
||||||
use std::path::{Path, PathBuf};
|
use std::path::{Path, PathBuf};
|
||||||
use std::ptr::NonNull;
|
use std::ptr::NonNull;
|
||||||
use std::{slice, str};
|
use std::{slice, str};
|
||||||
|
|
||||||
use regex_cursor::engines::meta::Regex;
|
use crate::tree_sitter::query::predicate::{InvalidPredicateError, Predicate, TextPredicate};
|
||||||
|
use crate::tree_sitter::query::property::QueryProperty;
|
||||||
use crate::tree_sitter::Grammar;
|
use crate::tree_sitter::Grammar;
|
||||||
|
|
||||||
macro_rules! bail {
|
mod predicate;
|
||||||
($($args:tt)*) => {{
|
mod property;
|
||||||
return Err(format!($($args)*))
|
|
||||||
}}
|
|
||||||
}
|
|
||||||
|
|
||||||
macro_rules! ensure {
|
|
||||||
($cond: expr, $($args:tt)*) => {{
|
|
||||||
if !$cond {
|
|
||||||
return Err(format!($($args)*))
|
|
||||||
}
|
|
||||||
}}
|
|
||||||
}
|
|
||||||
|
|
||||||
#[derive(Debug)]
|
|
||||||
enum TextPredicateCaptureKind {
|
|
||||||
EqString(u32),
|
|
||||||
EqCapture(u32),
|
|
||||||
MatchString(Regex),
|
|
||||||
AnyString(Box<[Box<str>]>),
|
|
||||||
}
|
|
||||||
|
|
||||||
struct TextPredicateCapture {
|
|
||||||
capture_idx: u32,
|
|
||||||
kind: TextPredicateCaptureKind,
|
|
||||||
negated: bool,
|
|
||||||
match_all: bool,
|
|
||||||
}
|
|
||||||
|
|
||||||
pub enum QueryData {}
|
pub enum QueryData {}
|
||||||
|
|
||||||
|
pub(super) struct Pattern {
|
||||||
|
text_predicates: Range<u32>,
|
||||||
|
properties: Range<u32>,
|
||||||
|
}
|
||||||
|
|
||||||
pub struct Query {
|
pub struct Query {
|
||||||
raw: NonNull<QueryData>,
|
raw: NonNull<QueryData>,
|
||||||
num_captures: u32,
|
num_captures: u32,
|
||||||
|
num_strings: u32,
|
||||||
|
text_predicates: Vec<TextPredicate>,
|
||||||
|
properties: Vec<QueryProperty>,
|
||||||
|
patterns: Box<[Pattern]>,
|
||||||
}
|
}
|
||||||
|
|
||||||
impl Query {
|
impl Query {
|
||||||
|
@ -50,7 +34,12 @@ impl Query {
|
||||||
/// The query is associated with a particular grammar, and can only be run
|
/// The query is associated with a particular grammar, and can only be run
|
||||||
/// on syntax nodes parsed with that grammar. References to Queries can be
|
/// on syntax nodes parsed with that grammar. References to Queries can be
|
||||||
/// shared between multiple threads.
|
/// shared between multiple threads.
|
||||||
pub fn new(grammar: Grammar, source: &str, path: impl AsRef<Path>) -> Result<Self, ParseError> {
|
pub fn new(
|
||||||
|
grammar: Grammar,
|
||||||
|
source: &str,
|
||||||
|
path: impl AsRef<Path>,
|
||||||
|
mut custom_predicate: impl FnMut(Predicate) -> Result<(), InvalidPredicateError>,
|
||||||
|
) -> Result<Self, ParseError> {
|
||||||
assert!(
|
assert!(
|
||||||
source.len() <= i32::MAX as usize,
|
source.len() <= i32::MAX as usize,
|
||||||
"TreeSitter queries must be smaller then 2 GiB (is {})",
|
"TreeSitter queries must be smaller then 2 GiB (is {})",
|
||||||
|
@ -136,167 +125,52 @@ impl Query {
|
||||||
// I am not going to bother with safety comments here, all of these are
|
// I am not going to bother with safety comments here, all of these are
|
||||||
// safe as long as TS is not buggy because raw is a properly constructed query
|
// safe as long as TS is not buggy because raw is a properly constructed query
|
||||||
let num_captures = unsafe { ts_query_capture_count(raw) };
|
let num_captures = unsafe { ts_query_capture_count(raw) };
|
||||||
|
let num_strings = unsafe { ts_query_string_count(raw) };
|
||||||
|
let num_patterns = unsafe { ts_query_pattern_count(raw) };
|
||||||
|
|
||||||
Ok(Query { raw, num_captures })
|
let mut query = Query {
|
||||||
}
|
raw,
|
||||||
|
num_captures,
|
||||||
fn parse_predicates(&mut self) {
|
num_strings,
|
||||||
let pattern_count = unsafe { ts_query_pattern_count(self.raw) };
|
text_predicates: Vec::new(),
|
||||||
|
properties: Vec::new(),
|
||||||
let mut text_predicates = Vec::with_capacity(pattern_count as usize);
|
patterns: Box::default(),
|
||||||
let mut property_predicates = Vec::with_capacity(pattern_count as usize);
|
|
||||||
let mut property_settings = Vec::with_capacity(pattern_count as usize);
|
|
||||||
let mut general_predicates = Vec::with_capacity(pattern_count as usize);
|
|
||||||
|
|
||||||
for i in 0..pattern_count {}
|
|
||||||
}
|
|
||||||
|
|
||||||
fn parse_predicate(&self, pattern_index: u32) -> Result<(), String> {
|
|
||||||
let mut text_predicates = Vec::new();
|
|
||||||
let mut property_predicates = Vec::new();
|
|
||||||
let mut property_settings = Vec::new();
|
|
||||||
let mut general_predicates = Vec::new();
|
|
||||||
for predicate in self.predicates(pattern_index) {
|
|
||||||
let predicate = unsafe { Predicate::new(self, predicate)? };
|
|
||||||
|
|
||||||
// Build a predicate for each of the known predicate function names.
|
|
||||||
match predicate.operator_name {
|
|
||||||
"eq?" | "not-eq?" | "any-eq?" | "any-not-eq?" => {
|
|
||||||
predicate.check_arg_count(2)?;
|
|
||||||
let capture_idx = predicate.get_arg(0, PredicateArg::Capture)?;
|
|
||||||
let (arg2, arg2_kind) = predicate.get_any_arg(1);
|
|
||||||
|
|
||||||
let negated = matches!(predicate.operator_name, "not-eq?" | "not-any-eq?");
|
|
||||||
let match_all = matches!(predicate.operator_name, "eq?" | "not-eq?");
|
|
||||||
let kind = match arg2_kind {
|
|
||||||
PredicateArg::Capture => TextPredicateCaptureKind::EqCapture(arg2),
|
|
||||||
PredicateArg::String => TextPredicateCaptureKind::EqString(arg2),
|
|
||||||
};
|
|
||||||
text_predicates.push(TextPredicateCapture {
|
|
||||||
capture_idx,
|
|
||||||
kind,
|
|
||||||
negated,
|
|
||||||
match_all,
|
|
||||||
});
|
|
||||||
}
|
|
||||||
|
|
||||||
"match?" | "not-match?" | "any-match?" | "any-not-match?" => {
|
|
||||||
predicate.check_arg_count(2)?;
|
|
||||||
let capture_idx = predicate.get_arg(0, PredicateArg::Capture)?;
|
|
||||||
let regex = predicate.get_str_arg(1)?;
|
|
||||||
|
|
||||||
let negated =
|
|
||||||
matches!(predicate.operator_name, "not-match?" | "any-not-match?");
|
|
||||||
let match_all = matches!(predicate.operator_name, "match?" | "not-match?");
|
|
||||||
let regex = match Regex::new(regex) {
|
|
||||||
Ok(regex) => regex,
|
|
||||||
Err(err) => bail!("invalid regex '{regex}', {err}"),
|
|
||||||
};
|
|
||||||
text_predicates.push(TextPredicateCapture {
|
|
||||||
capture_idx,
|
|
||||||
kind: TextPredicateCaptureKind::MatchString(regex),
|
|
||||||
negated,
|
|
||||||
match_all,
|
|
||||||
});
|
|
||||||
}
|
|
||||||
|
|
||||||
"set!" => property_settings.push(Self::parse_property(
|
|
||||||
row,
|
|
||||||
operator_name,
|
|
||||||
&capture_names,
|
|
||||||
&string_values,
|
|
||||||
&p[1..],
|
|
||||||
)?),
|
|
||||||
|
|
||||||
"is?" | "is-not?" => property_predicates.push((
|
|
||||||
Self::parse_property(
|
|
||||||
row,
|
|
||||||
operator_name,
|
|
||||||
&capture_names,
|
|
||||||
&string_values,
|
|
||||||
&p[1..],
|
|
||||||
)?,
|
|
||||||
operator_name == "is?",
|
|
||||||
)),
|
|
||||||
|
|
||||||
"any-of?" | "not-any-of?" => {
|
|
||||||
if p.len() < 2 {
|
|
||||||
return Err(predicate_error(row, format!(
|
|
||||||
"Wrong number of arguments to #any-of? predicate. Expected at least 1, got {}.",
|
|
||||||
p.len() - 1
|
|
||||||
)));
|
|
||||||
}
|
|
||||||
if p[1].type_ != TYPE_CAPTURE {
|
|
||||||
return Err(predicate_error(row, format!(
|
|
||||||
"First argument to #any-of? predicate must be a capture name. Got literal \"{}\".",
|
|
||||||
string_values[p[1].value_id as usize],
|
|
||||||
)));
|
|
||||||
}
|
|
||||||
|
|
||||||
let is_positive = operator_name == "any-of?";
|
|
||||||
let mut values = Vec::new();
|
|
||||||
for arg in &p[2..] {
|
|
||||||
if arg.type_ == TYPE_CAPTURE {
|
|
||||||
return Err(predicate_error(row, format!(
|
|
||||||
"Arguments to #any-of? predicate must be literals. Got capture @{}.",
|
|
||||||
capture_names[arg.value_id as usize],
|
|
||||||
)));
|
|
||||||
}
|
|
||||||
values.push(string_values[arg.value_id as usize]);
|
|
||||||
}
|
|
||||||
text_predicates.push(TextPredicateCapture::AnyString(
|
|
||||||
p[1].value_id,
|
|
||||||
values
|
|
||||||
.iter()
|
|
||||||
.map(|x| (*x).to_string().into())
|
|
||||||
.collect::<Vec<_>>()
|
|
||||||
.into(),
|
|
||||||
is_positive,
|
|
||||||
));
|
|
||||||
}
|
|
||||||
|
|
||||||
_ => general_predicates.push(QueryPredicate {
|
|
||||||
operator: operator_name.to_string().into(),
|
|
||||||
args: p[1..]
|
|
||||||
.iter()
|
|
||||||
.map(|a| {
|
|
||||||
if a.type_ == TYPE_CAPTURE {
|
|
||||||
QueryPredicateArg::Capture(a.value_id)
|
|
||||||
} else {
|
|
||||||
QueryPredicateArg::String(
|
|
||||||
string_values[a.value_id as usize].to_string().into(),
|
|
||||||
)
|
|
||||||
}
|
|
||||||
})
|
|
||||||
.collect(),
|
|
||||||
}),
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
text_predicates_vec.push(text_predicates.into());
|
|
||||||
property_predicates_vec.push(property_predicates.into());
|
|
||||||
property_settings_vec.push(property_settings.into());
|
|
||||||
general_predicates_vec.push(general_predicates.into());
|
|
||||||
}
|
|
||||||
|
|
||||||
fn predicates<'a>(
|
|
||||||
&'a self,
|
|
||||||
pattern_index: u32,
|
|
||||||
) -> impl Iterator<Item = &'a [PredicateStep]> + 'a {
|
|
||||||
let predicate_steps = unsafe {
|
|
||||||
let mut len = 0u32;
|
|
||||||
let raw_predicates = ts_query_predicates_for_pattern(self.raw, pattern_index, &mut len);
|
|
||||||
(len != 0)
|
|
||||||
.then(|| slice::from_raw_parts(raw_predicates, len as usize))
|
|
||||||
.unwrap_or_default()
|
|
||||||
};
|
};
|
||||||
predicate_steps
|
let patterns: Result<_, ParseError> = (0..num_patterns)
|
||||||
.split(|step| step.kind == PredicateStepKind::Done)
|
.map(|pattern| {
|
||||||
.filter(|predicate| !predicate.is_empty())
|
query
|
||||||
|
.parse_pattern_predicates(pattern, &mut custom_predicate)
|
||||||
|
.map_err(|err| ParseError::InvalidPredicate {
|
||||||
|
message: err.msg.into(),
|
||||||
|
location: ParserErrorLocation::new(
|
||||||
|
source,
|
||||||
|
path.as_ref(),
|
||||||
|
unsafe { ts_query_start_byte_for_pattern(query.raw, pattern) as usize },
|
||||||
|
0,
|
||||||
|
),
|
||||||
|
})
|
||||||
|
})
|
||||||
|
.collect();
|
||||||
|
query.patterns = patterns?;
|
||||||
|
Ok(query)
|
||||||
}
|
}
|
||||||
|
|
||||||
/// Safety: value_idx must be a valid string id (in bounds) for this query and pattern_index
|
// fn parse_predicates(&mut self) {
|
||||||
unsafe fn get_pattern_string(&self, value_id: u32) -> &str {
|
// let pattern_count = unsafe { ts_query_pattern_count(self.raw) };
|
||||||
|
|
||||||
|
// let mut text_predicates = Vec::with_capacity(pattern_count as usize);
|
||||||
|
// let mut property_predicates = Vec::with_capacity(pattern_count as usize);
|
||||||
|
// let mut property_settings = Vec::with_capacity(pattern_count as usize);
|
||||||
|
// let mut general_predicates = Vec::with_capacity(pattern_count as usize);
|
||||||
|
|
||||||
|
// for i in 0..pattern_count {}
|
||||||
|
// }
|
||||||
|
|
||||||
|
#[inline]
|
||||||
|
fn get_string(&self, str: QueryStr) -> &str {
|
||||||
|
let value_id = str.0;
|
||||||
|
// need an assertions because the ts c api does not do bounds check
|
||||||
|
assert!(value_id <= self.num_captures, "invalid value index");
|
||||||
unsafe {
|
unsafe {
|
||||||
let mut len = 0;
|
let mut len = 0;
|
||||||
let ptr = ts_query_string_value_for_id(self.raw, value_id, &mut len);
|
let ptr = ts_query_string_value_for_id(self.raw, value_id, &mut len);
|
||||||
|
@ -309,9 +183,9 @@ impl Query {
|
||||||
}
|
}
|
||||||
|
|
||||||
#[inline]
|
#[inline]
|
||||||
pub fn capture_name(&self, capture_idx: u32) -> &str {
|
pub fn capture_name(&self, capture_idx: Capture) -> &str {
|
||||||
// this one needs an assertions because the ts c api is inconsisent
|
let capture_idx = capture_idx.0;
|
||||||
// and unsafe, other functions do have checks and would return null
|
// need an assertions because the ts c api does not do bounds check
|
||||||
assert!(capture_idx <= self.num_captures, "invalid capture index");
|
assert!(capture_idx <= self.num_captures, "invalid capture index");
|
||||||
let mut length = 0;
|
let mut length = 0;
|
||||||
unsafe {
|
unsafe {
|
||||||
|
@ -323,6 +197,36 @@ impl Query {
|
||||||
str::from_utf8_unchecked(name)
|
str::from_utf8_unchecked(name)
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
|
pub fn pattern_properies(&self, pattern_idx: u32) -> &[QueryProperty] {
|
||||||
|
let range = self.patterns[pattern_idx as usize].properties.clone();
|
||||||
|
&self.properties[range.start as usize..range.end as usize]
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
impl Drop for Query {
|
||||||
|
fn drop(&mut self) {
|
||||||
|
unsafe { ts_query_delete(self.raw) }
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
#[derive(Clone, Copy, Debug, PartialEq, Eq)]
|
||||||
|
pub struct Capture(u32);
|
||||||
|
|
||||||
|
impl Capture {
|
||||||
|
pub fn name(self, query: &Query) -> &str {
|
||||||
|
query.capture_name(self)
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
/// A reference to a string stroed in a query
|
||||||
|
#[derive(Clone, Copy, Debug)]
|
||||||
|
pub struct QueryStr(u32);
|
||||||
|
|
||||||
|
impl QueryStr {
|
||||||
|
pub fn get(self, query: &Query) -> &str {
|
||||||
|
query.get_string(self)
|
||||||
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
#[derive(Debug, PartialEq, Eq)]
|
#[derive(Debug, PartialEq, Eq)]
|
||||||
|
@ -357,7 +261,7 @@ impl ParserErrorLocation {
|
||||||
}
|
}
|
||||||
|
|
||||||
impl Display for ParserErrorLocation {
|
impl Display for ParserErrorLocation {
|
||||||
fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
|
fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
|
||||||
writeln!(
|
writeln!(
|
||||||
f,
|
f,
|
||||||
" --> {}:{}:{}",
|
" --> {}:{}:{}",
|
||||||
|
@ -366,8 +270,8 @@ impl Display for ParserErrorLocation {
|
||||||
self.column
|
self.column
|
||||||
)?;
|
)?;
|
||||||
let line = self.line.to_string();
|
let line = self.line.to_string();
|
||||||
let prefix = format_args!(" {:width$} |", "", width = line.len());
|
let prefix = format!(" {:width$} |", "", width = line.len());
|
||||||
writeln!(f, "{prefix}");
|
writeln!(f, "{prefix}")?;
|
||||||
writeln!(f, " {line} | {}", self.line_content)?;
|
writeln!(f, " {line} | {}", self.line_content)?;
|
||||||
writeln!(
|
writeln!(
|
||||||
f,
|
f,
|
||||||
|
@ -422,87 +326,6 @@ enum RawQueryError {
|
||||||
Language = 6,
|
Language = 6,
|
||||||
}
|
}
|
||||||
|
|
||||||
#[repr(C)]
|
|
||||||
#[derive(Debug, Clone, Copy, PartialEq, Eq)]
|
|
||||||
enum PredicateStepKind {
|
|
||||||
Done = 0,
|
|
||||||
Capture = 1,
|
|
||||||
String = 2,
|
|
||||||
}
|
|
||||||
|
|
||||||
#[repr(C)]
|
|
||||||
struct PredicateStep {
|
|
||||||
kind: PredicateStepKind,
|
|
||||||
value_id: u32,
|
|
||||||
}
|
|
||||||
|
|
||||||
struct Predicate<'a> {
|
|
||||||
operator_name: &'a str,
|
|
||||||
args: &'a [PredicateStep],
|
|
||||||
query: &'a Query,
|
|
||||||
}
|
|
||||||
|
|
||||||
impl<'a> Predicate<'a> {
|
|
||||||
unsafe fn new(
|
|
||||||
query: &'a Query,
|
|
||||||
predicate: &'a [PredicateStep],
|
|
||||||
) -> Result<Predicate<'a>, String> {
|
|
||||||
ensure!(
|
|
||||||
predicate[0].kind == PredicateStepKind::String,
|
|
||||||
"expected predicate to start with a function name. Got @{}.",
|
|
||||||
query.capture_name(predicate[0].value_id)
|
|
||||||
);
|
|
||||||
let operator_name = query.get_pattern_string(predicate[0].value_id);
|
|
||||||
Ok(Predicate {
|
|
||||||
operator_name,
|
|
||||||
args: &predicate[1..],
|
|
||||||
query,
|
|
||||||
})
|
|
||||||
}
|
|
||||||
pub fn check_arg_count(&self, n: usize) -> Result<(), String> {
|
|
||||||
ensure!(
|
|
||||||
self.args.len() == n,
|
|
||||||
"expected {n} arguments for #{}, got {}",
|
|
||||||
self.operator_name,
|
|
||||||
self.args.len()
|
|
||||||
);
|
|
||||||
Ok(())
|
|
||||||
}
|
|
||||||
|
|
||||||
pub fn get_arg(&self, i: usize, expect: PredicateArg) -> Result<u32, String> {
|
|
||||||
let (val, actual) = self.get_any_arg(i);
|
|
||||||
match (actual, expect) {
|
|
||||||
(PredicateArg::Capture, PredicateArg::String) => bail!(
|
|
||||||
"{i}. argument to #{} expected a capture, got literal {val:?}",
|
|
||||||
self.operator_name
|
|
||||||
),
|
|
||||||
(PredicateArg::String, PredicateArg::Capture) => bail!(
|
|
||||||
"{i}. argument to #{} must be a literal, got capture @{val:?}",
|
|
||||||
self.operator_name
|
|
||||||
),
|
|
||||||
_ => (),
|
|
||||||
};
|
|
||||||
Ok(val)
|
|
||||||
}
|
|
||||||
pub fn get_str_arg(&self, i: usize) -> Result<&'a str, String> {
|
|
||||||
let arg = self.get_arg(i, PredicateArg::String)?;
|
|
||||||
unsafe { Ok(self.query.get_pattern_string(arg)) }
|
|
||||||
}
|
|
||||||
|
|
||||||
pub fn get_any_arg(&self, i: usize) -> (u32, PredicateArg) {
|
|
||||||
match self.args[i].kind {
|
|
||||||
PredicateStepKind::String => unsafe { (self.args[i].value_id, PredicateArg::String) },
|
|
||||||
PredicateStepKind::Capture => (self.args[i].value_id, PredicateArg::Capture),
|
|
||||||
PredicateStepKind::Done => unreachable!(),
|
|
||||||
}
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
enum PredicateArg {
|
|
||||||
Capture,
|
|
||||||
String,
|
|
||||||
}
|
|
||||||
|
|
||||||
extern "C" {
|
extern "C" {
|
||||||
/// Create a new query from a string containing one or more S-expression
|
/// Create a new query from a string containing one or more S-expression
|
||||||
/// patterns. The query is associated with a particular language, and can
|
/// patterns. The query is associated with a particular language, and can
|
||||||
|
@ -512,7 +335,7 @@ extern "C" {
|
||||||
/// about the problem: 1. The byte offset of the error is written to
|
/// about the problem: 1. The byte offset of the error is written to
|
||||||
/// the `error_offset` parameter. 2. The type of error is written to the
|
/// the `error_offset` parameter. 2. The type of error is written to the
|
||||||
/// `error_type` parameter.
|
/// `error_type` parameter.
|
||||||
pub fn ts_query_new(
|
fn ts_query_new(
|
||||||
grammar: Grammar,
|
grammar: Grammar,
|
||||||
source: *const u8,
|
source: *const u8,
|
||||||
source_len: u32,
|
source_len: u32,
|
||||||
|
@ -521,52 +344,31 @@ extern "C" {
|
||||||
) -> Option<NonNull<QueryData>>;
|
) -> Option<NonNull<QueryData>>;
|
||||||
|
|
||||||
/// Delete a query, freeing all of the memory that it used.
|
/// Delete a query, freeing all of the memory that it used.
|
||||||
pub fn ts_query_delete(query: NonNull<QueryData>);
|
fn ts_query_delete(query: NonNull<QueryData>);
|
||||||
|
|
||||||
/// Get the number of patterns, captures, or string literals in the query.
|
/// Get the number of patterns, captures, or string literals in the query.
|
||||||
pub fn ts_query_pattern_count(query: NonNull<QueryData>) -> u32;
|
fn ts_query_pattern_count(query: NonNull<QueryData>) -> u32;
|
||||||
pub fn ts_query_capture_count(query: NonNull<QueryData>) -> u32;
|
fn ts_query_capture_count(query: NonNull<QueryData>) -> u32;
|
||||||
pub fn ts_query_string_count(query: NonNull<QueryData>) -> u32;
|
fn ts_query_string_count(query: NonNull<QueryData>) -> u32;
|
||||||
|
|
||||||
/// Get the byte offset where the given pattern starts in the query's
|
/// Get the byte offset where the given pattern starts in the query's
|
||||||
/// source. This can be useful when combining queries by concatenating their
|
/// source. This can be useful when combining queries by concatenating their
|
||||||
/// source code strings.
|
/// source code strings.
|
||||||
pub fn ts_query_start_byte_for_pattern(query: NonNull<QueryData>, pattern_index: u32) -> u32;
|
fn ts_query_start_byte_for_pattern(query: NonNull<QueryData>, pattern_index: u32) -> u32;
|
||||||
|
|
||||||
/// Get all of the predicates for the given pattern in the query. The
|
// fn ts_query_is_pattern_rooted(query: NonNull<QueryData>, pattern_index: u32) -> bool;
|
||||||
/// predicates are represented as a single array of steps. There are three
|
// fn ts_query_is_pattern_non_local(query: NonNull<QueryData>, pattern_index: u32) -> bool;
|
||||||
/// types of steps in this array, which correspond to the three legal values
|
// fn ts_query_is_pattern_guaranteed_at_step(query: NonNull<QueryData>, byte_offset: u32) -> bool;
|
||||||
/// for the `type` field: - `TSQueryPredicateStepTypeCapture` - Steps with
|
|
||||||
/// this type represent names of captures. Their `value_id` can be used
|
|
||||||
/// with the [`ts_query_capture_name_for_id`] function to obtain the name
|
|
||||||
/// of the capture. - `TSQueryPredicateStepTypeString` - Steps with this
|
|
||||||
/// type represent literal strings. Their `value_id` can be used with the
|
|
||||||
/// [`ts_query_string_value_for_id`] function to obtain their string value.
|
|
||||||
/// - `TSQueryPredicateStepTypeDone` - Steps with this type are *sentinels*
|
|
||||||
/// that represent the end of an individual predicate. If a pattern has two
|
|
||||||
/// predicates, then there will be two steps with this `type` in the array.
|
|
||||||
pub fn ts_query_predicates_for_pattern(
|
|
||||||
query: NonNull<QueryData>,
|
|
||||||
pattern_index: u32,
|
|
||||||
step_count: &mut u32,
|
|
||||||
) -> *const PredicateStep;
|
|
||||||
|
|
||||||
pub fn ts_query_is_pattern_rooted(query: NonNull<QueryData>, pattern_index: u32) -> bool;
|
|
||||||
pub fn ts_query_is_pattern_non_local(query: NonNull<QueryData>, pattern_index: u32) -> bool;
|
|
||||||
pub fn ts_query_is_pattern_guaranteed_at_step(
|
|
||||||
query: NonNull<QueryData>,
|
|
||||||
byte_offset: u32,
|
|
||||||
) -> bool;
|
|
||||||
/// Get the name and length of one of the query's captures, or one of the
|
/// Get the name and length of one of the query's captures, or one of the
|
||||||
/// query's string literals. Each capture and string is associated with a
|
/// query's string literals. Each capture and string is associated with a
|
||||||
/// numeric id based on the order that it appeared in the query's source.
|
/// numeric id based on the order that it appeared in the query's source.
|
||||||
pub fn ts_query_capture_name_for_id(
|
fn ts_query_capture_name_for_id(
|
||||||
query: NonNull<QueryData>,
|
query: NonNull<QueryData>,
|
||||||
index: u32,
|
index: u32,
|
||||||
length: &mut u32,
|
length: &mut u32,
|
||||||
) -> *const u8;
|
) -> *const u8;
|
||||||
|
|
||||||
pub fn ts_query_string_value_for_id(
|
fn ts_query_string_value_for_id(
|
||||||
self_: NonNull<QueryData>,
|
self_: NonNull<QueryData>,
|
||||||
index: u32,
|
index: u32,
|
||||||
length: &mut u32,
|
length: &mut u32,
|
||||||
|
|
288
helix-syntax/src/tree_sitter/query/predicate.rs
Normal file
288
helix-syntax/src/tree_sitter/query/predicate.rs
Normal file
|
@ -0,0 +1,288 @@
|
||||||
|
use std::error::Error;
|
||||||
|
use std::ptr::NonNull;
|
||||||
|
use std::{fmt, slice};
|
||||||
|
|
||||||
|
use crate::tree_sitter::query::property::QueryProperty;
|
||||||
|
use crate::tree_sitter::query::{Capture, Pattern, Query, QueryData, QueryStr};
|
||||||
|
|
||||||
|
use regex_cursor::engines::meta::Regex;
|
||||||
|
|
||||||
|
macro_rules! bail {
|
||||||
|
($($args:tt)*) => {{
|
||||||
|
return Err(InvalidPredicateError {msg: format!($($args)*).into() })
|
||||||
|
}}
|
||||||
|
}
|
||||||
|
|
||||||
|
macro_rules! ensure {
|
||||||
|
($cond: expr, $($args:tt)*) => {{
|
||||||
|
if !$cond {
|
||||||
|
return Err(InvalidPredicateError { msg: format!($($args)*).into() })
|
||||||
|
}
|
||||||
|
}}
|
||||||
|
}
|
||||||
|
|
||||||
|
#[derive(Debug)]
|
||||||
|
pub(super) enum TextPredicateKind {
|
||||||
|
EqString(QueryStr),
|
||||||
|
EqCapture(Capture),
|
||||||
|
MatchString(Regex),
|
||||||
|
AnyString(Box<[QueryStr]>),
|
||||||
|
}
|
||||||
|
|
||||||
|
pub(super) struct TextPredicate {
|
||||||
|
capture: Capture,
|
||||||
|
kind: TextPredicateKind,
|
||||||
|
negated: bool,
|
||||||
|
match_all: bool,
|
||||||
|
}
|
||||||
|
|
||||||
|
impl Query {
|
||||||
|
pub(super) fn parse_pattern_predicates(
|
||||||
|
&mut self,
|
||||||
|
pattern_index: u32,
|
||||||
|
mut custom_predicate: impl FnMut(Predicate) -> Result<(), InvalidPredicateError>,
|
||||||
|
) -> Result<Pattern, InvalidPredicateError> {
|
||||||
|
let text_predicate_start = self.text_predicates.len() as u32;
|
||||||
|
let property_start = self.properties.len() as u32;
|
||||||
|
|
||||||
|
let predicate_steps = unsafe {
|
||||||
|
let mut len = 0u32;
|
||||||
|
let raw_predicates = ts_query_predicates_for_pattern(self.raw, pattern_index, &mut len);
|
||||||
|
(len != 0)
|
||||||
|
.then(|| slice::from_raw_parts(raw_predicates, len as usize))
|
||||||
|
.unwrap_or_default()
|
||||||
|
};
|
||||||
|
let predicates = predicate_steps
|
||||||
|
.split(|step| step.kind == PredicateStepKind::Done)
|
||||||
|
.filter(|predicate| !predicate.is_empty());
|
||||||
|
|
||||||
|
for predicate in predicates {
|
||||||
|
let predicate = unsafe { Predicate::new(self, predicate)? };
|
||||||
|
|
||||||
|
match predicate.name() {
|
||||||
|
"eq?" | "not-eq?" | "any-eq?" | "any-not-eq?" => {
|
||||||
|
predicate.check_arg_count(2)?;
|
||||||
|
let capture_idx = predicate.capture_arg(0)?;
|
||||||
|
let arg2 = predicate.arg(1);
|
||||||
|
|
||||||
|
let negated = matches!(predicate.name(), "not-eq?" | "not-any-eq?");
|
||||||
|
let match_all = matches!(predicate.name(), "eq?" | "not-eq?");
|
||||||
|
let kind = match arg2 {
|
||||||
|
PredicateArg::Capture(capture) => TextPredicateKind::EqCapture(capture),
|
||||||
|
PredicateArg::String(str) => TextPredicateKind::EqString(str),
|
||||||
|
};
|
||||||
|
self.text_predicates.push(TextPredicate {
|
||||||
|
capture: capture_idx,
|
||||||
|
kind,
|
||||||
|
negated,
|
||||||
|
match_all,
|
||||||
|
});
|
||||||
|
}
|
||||||
|
|
||||||
|
"match?" | "not-match?" | "any-match?" | "any-not-match?" => {
|
||||||
|
predicate.check_arg_count(2)?;
|
||||||
|
let capture_idx = predicate.capture_arg(0)?;
|
||||||
|
let regex = predicate.str_arg(1)?.get(self);
|
||||||
|
|
||||||
|
let negated = matches!(predicate.name(), "not-match?" | "any-not-match?");
|
||||||
|
let match_all = matches!(predicate.name(), "match?" | "not-match?");
|
||||||
|
let regex = match Regex::new(regex) {
|
||||||
|
Ok(regex) => regex,
|
||||||
|
Err(err) => bail!("invalid regex '{regex}', {err}"),
|
||||||
|
};
|
||||||
|
self.text_predicates.push(TextPredicate {
|
||||||
|
capture: capture_idx,
|
||||||
|
kind: TextPredicateKind::MatchString(regex),
|
||||||
|
negated,
|
||||||
|
match_all,
|
||||||
|
});
|
||||||
|
}
|
||||||
|
|
||||||
|
"set!" => self.properties.push(QueryProperty::parse(&predicate)?),
|
||||||
|
|
||||||
|
"any-of?" | "not-any-of?" => {
|
||||||
|
predicate.check_min_arg_count(1)?;
|
||||||
|
let capture = predicate.capture_arg(0)?;
|
||||||
|
let negated = predicate.name() == "not-any-of?";
|
||||||
|
let values: Result<_, InvalidPredicateError> = (1..predicate.num_args())
|
||||||
|
.map(|i| predicate.str_arg(i))
|
||||||
|
.collect();
|
||||||
|
self.text_predicates.push(TextPredicate {
|
||||||
|
capture,
|
||||||
|
kind: TextPredicateKind::AnyString(values?),
|
||||||
|
negated,
|
||||||
|
match_all: false,
|
||||||
|
});
|
||||||
|
}
|
||||||
|
|
||||||
|
// is and is-not are better handeled as custom predicates since interpreting is context dependent
|
||||||
|
// "is?" => property_predicates.push((QueryProperty::parse(&predicate), false)),
|
||||||
|
// "is-not?" => property_predicates.push((QueryProperty::parse(&predicate), true)),
|
||||||
|
_ => custom_predicate(predicate)?,
|
||||||
|
}
|
||||||
|
}
|
||||||
|
Ok(Pattern {
|
||||||
|
text_predicates: text_predicate_start..self.text_predicates.len() as u32,
|
||||||
|
properties: property_start..self.properties.len() as u32,
|
||||||
|
})
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
pub enum PredicateArg {
|
||||||
|
Capture(Capture),
|
||||||
|
String(QueryStr),
|
||||||
|
}
|
||||||
|
|
||||||
|
pub struct Predicate<'a> {
|
||||||
|
pub name: QueryStr,
|
||||||
|
args: &'a [PredicateStep],
|
||||||
|
query: &'a Query,
|
||||||
|
}
|
||||||
|
|
||||||
|
impl<'a> Predicate<'a> {
|
||||||
|
unsafe fn new(
|
||||||
|
query: &'a Query,
|
||||||
|
predicate: &'a [PredicateStep],
|
||||||
|
) -> Result<Predicate<'a>, InvalidPredicateError> {
|
||||||
|
ensure!(
|
||||||
|
predicate[0].kind == PredicateStepKind::String,
|
||||||
|
"expected predicate to start with a function name. Got @{}.",
|
||||||
|
Capture(predicate[0].value_id).name(query)
|
||||||
|
);
|
||||||
|
let operator_name = QueryStr(predicate[0].value_id);
|
||||||
|
Ok(Predicate {
|
||||||
|
name: operator_name,
|
||||||
|
args: &predicate[1..],
|
||||||
|
query,
|
||||||
|
})
|
||||||
|
}
|
||||||
|
|
||||||
|
pub fn name(&self) -> &str {
|
||||||
|
self.name.get(self.query)
|
||||||
|
}
|
||||||
|
|
||||||
|
pub fn check_arg_count(&self, n: usize) -> Result<(), InvalidPredicateError> {
|
||||||
|
ensure!(
|
||||||
|
self.args.len() == n,
|
||||||
|
"expected {n} arguments for #{}, got {}",
|
||||||
|
self.name(),
|
||||||
|
self.args.len()
|
||||||
|
);
|
||||||
|
Ok(())
|
||||||
|
}
|
||||||
|
|
||||||
|
pub fn check_min_arg_count(&self, n: usize) -> Result<(), InvalidPredicateError> {
|
||||||
|
ensure!(
|
||||||
|
n <= self.args.len(),
|
||||||
|
"expected at least {n} arguments for #{}, got {}",
|
||||||
|
self.name(),
|
||||||
|
self.args.len()
|
||||||
|
);
|
||||||
|
Ok(())
|
||||||
|
}
|
||||||
|
|
||||||
|
pub fn check_max_arg_count(&self, n: usize) -> Result<(), InvalidPredicateError> {
|
||||||
|
ensure!(
|
||||||
|
self.args.len() <= n,
|
||||||
|
"expected at most {n} arguments for #{}, got {}",
|
||||||
|
self.name(),
|
||||||
|
self.args.len()
|
||||||
|
);
|
||||||
|
Ok(())
|
||||||
|
}
|
||||||
|
|
||||||
|
pub fn str_arg(&self, i: usize) -> Result<QueryStr, InvalidPredicateError> {
|
||||||
|
match self.arg(i) {
|
||||||
|
PredicateArg::String(str) => Ok(str),
|
||||||
|
PredicateArg::Capture(capture) => bail!(
|
||||||
|
"{i}. argument to #{} must be a literal, got capture @{:?}",
|
||||||
|
self.name(),
|
||||||
|
capture.name(self.query)
|
||||||
|
),
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
pub fn num_args(&self) -> usize {
|
||||||
|
self.args.len()
|
||||||
|
}
|
||||||
|
|
||||||
|
pub fn capture_arg(&self, i: usize) -> Result<Capture, InvalidPredicateError> {
|
||||||
|
match self.arg(i) {
|
||||||
|
PredicateArg::Capture(capture) => Ok(capture),
|
||||||
|
PredicateArg::String(str) => bail!(
|
||||||
|
"{i}. argument to #{} expected a capture, got literal {:?}",
|
||||||
|
self.name(),
|
||||||
|
str.get(self.query)
|
||||||
|
),
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
pub fn arg(&self, i: usize) -> PredicateArg {
|
||||||
|
self.args[i].try_into().unwrap()
|
||||||
|
}
|
||||||
|
|
||||||
|
pub fn args(&self) -> impl Iterator<Item = PredicateArg> + '_ {
|
||||||
|
self.args.iter().map(|&arg| arg.try_into().unwrap())
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
#[derive(Debug)]
|
||||||
|
pub struct InvalidPredicateError {
|
||||||
|
pub(super) msg: Box<str>,
|
||||||
|
}
|
||||||
|
|
||||||
|
impl fmt::Display for InvalidPredicateError {
|
||||||
|
fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
|
||||||
|
f.write_str(&self.msg)
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
impl Error for InvalidPredicateError {}
|
||||||
|
|
||||||
|
#[repr(C)]
|
||||||
|
#[derive(Debug, Clone, Copy, PartialEq, Eq)]
|
||||||
|
enum PredicateStepKind {
|
||||||
|
Done = 0,
|
||||||
|
Capture = 1,
|
||||||
|
String = 2,
|
||||||
|
}
|
||||||
|
|
||||||
|
#[repr(C)]
|
||||||
|
#[derive(Debug, Clone, Copy)]
|
||||||
|
struct PredicateStep {
|
||||||
|
kind: PredicateStepKind,
|
||||||
|
value_id: u32,
|
||||||
|
}
|
||||||
|
|
||||||
|
impl TryFrom<PredicateStep> for PredicateArg {
|
||||||
|
type Error = ();
|
||||||
|
|
||||||
|
fn try_from(step: PredicateStep) -> Result<Self, Self::Error> {
|
||||||
|
match step.kind {
|
||||||
|
PredicateStepKind::String => Ok(PredicateArg::String(QueryStr(step.value_id))),
|
||||||
|
PredicateStepKind::Capture => Ok(PredicateArg::Capture(Capture(step.value_id))),
|
||||||
|
PredicateStepKind::Done => Err(()),
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
extern "C" {
|
||||||
|
/// Get all of the predicates for the given pattern in the query. The
|
||||||
|
/// predicates are represented as a single array of steps. There are three
|
||||||
|
/// types of steps in this array, which correspond to the three legal values
|
||||||
|
/// for the `type` field: - `TSQueryPredicateStepTypeCapture` - Steps with
|
||||||
|
/// this type represent names of captures. Their `value_id` can be used
|
||||||
|
/// with the [`ts_query_capture_name_for_id`] function to obtain the name
|
||||||
|
/// of the capture. - `TSQueryPredicateStepTypeString` - Steps with this
|
||||||
|
/// type represent literal strings. Their `value_id` can be used with the
|
||||||
|
/// [`ts_query_string_value_for_id`] function to obtain their string value.
|
||||||
|
/// - `TSQueryPredicateStepTypeDone` - Steps with this type are *sentinels*
|
||||||
|
/// that represent the end of an individual predicate. If a pattern has two
|
||||||
|
/// predicates, then there will be two steps with this `type` in the array.
|
||||||
|
fn ts_query_predicates_for_pattern(
|
||||||
|
query: NonNull<QueryData>,
|
||||||
|
pattern_index: u32,
|
||||||
|
step_count: &mut u32,
|
||||||
|
) -> *const PredicateStep;
|
||||||
|
|
||||||
|
}
|
19
helix-syntax/src/tree_sitter/query/property.rs
Normal file
19
helix-syntax/src/tree_sitter/query/property.rs
Normal file
|
@ -0,0 +1,19 @@
|
||||||
|
use crate::tree_sitter::query::predicate::{InvalidPredicateError, Predicate};
|
||||||
|
use crate::tree_sitter::query::QueryStr;
|
||||||
|
|
||||||
|
pub struct QueryProperty {
|
||||||
|
pub key: QueryStr,
|
||||||
|
pub val: Option<QueryStr>,
|
||||||
|
}
|
||||||
|
|
||||||
|
impl QueryProperty {
|
||||||
|
pub fn parse(predicate: &Predicate) -> Result<Self, InvalidPredicateError> {
|
||||||
|
predicate.check_min_arg_count(1)?;
|
||||||
|
predicate.check_max_arg_count(2)?;
|
||||||
|
let key = predicate.str_arg(0)?;
|
||||||
|
let val = (predicate.num_args() == 1)
|
||||||
|
.then(|| predicate.str_arg(1))
|
||||||
|
.transpose()?;
|
||||||
|
Ok(QueryProperty { key, val })
|
||||||
|
}
|
||||||
|
}
|
Loading…
Add table
Add a link
Reference in a new issue