Unnamed repository; edit this file 'description' to name the repository.
Diffstat (limited to 'helix-core/src/indent.rs')
| -rw-r--r-- | helix-core/src/indent.rs | 1322 |
1 files changed, 228 insertions, 1094 deletions
diff --git a/helix-core/src/indent.rs b/helix-core/src/indent.rs index bdf0f405..30f4a340 100644 --- a/helix-core/src/indent.rs +++ b/helix-core/src/indent.rs @@ -1,18 +1,8 @@ -use std::{borrow::Cow, collections::HashMap}; - -use helix_stdx::rope::RopeSliceExt; -use tree_house::TREE_SITTER_MATCH_LIMIT; - use crate::{ chars::{char_is_line_ending, char_is_whitespace}, - graphemes::{grapheme_width, tab_width_at}, - syntax::{self, config::IndentationHeuristic}, - tree_sitter::{ - self, - query::{InvalidPredicateError, UserPredicate}, - Capture, Grammar, InactiveQueryCursor, Node, Pattern, Query, QueryMatch, RopeInput, - }, - Position, Rope, RopeSlice, Syntax, Tendril, + syntax::{IndentQuery, LanguageConfiguration, Syntax}, + tree_sitter::Node, + Rope, RopeSlice, }; /// Enum representing indentation style. @@ -24,10 +14,6 @@ pub enum IndentStyle { Spaces(u8), } -// 16 spaces -const INDENTS: &str = " "; -pub const MAX_INDENT: u8 = 16; - impl IndentStyle { /// Creates an `IndentStyle` from an indentation string. /// @@ -36,10 +22,10 @@ impl IndentStyle { #[inline] pub fn from_str(indent: &str) -> Self { // XXX: do we care about validating the input more than this? Probably not...? - debug_assert!(!indent.is_empty() && indent.len() <= MAX_INDENT as usize); + debug_assert!(!indent.is_empty() && indent.len() <= 8); if indent.starts_with(' ') { - IndentStyle::Spaces(indent.len().clamp(1, MAX_INDENT as usize) as u8) + IndentStyle::Spaces(indent.len() as u8) } else { IndentStyle::Tabs } @@ -49,24 +35,23 @@ impl IndentStyle { pub fn as_str(&self) -> &'static str { match *self { IndentStyle::Tabs => "\t", + IndentStyle::Spaces(1) => " ", + IndentStyle::Spaces(2) => " ", + IndentStyle::Spaces(3) => " ", + IndentStyle::Spaces(4) => " ", + IndentStyle::Spaces(5) => " ", + IndentStyle::Spaces(6) => " ", + IndentStyle::Spaces(7) => " ", + IndentStyle::Spaces(8) => " ", + + // Unsupported indentation style. This should never happen, + // but just in case fall back to two spaces. IndentStyle::Spaces(n) => { - // Unsupported indentation style. This should never happen, - debug_assert!(n > 0 && n <= MAX_INDENT); - - // Either way, clamp to the nearest supported value - let closest_n = n.clamp(1, MAX_INDENT) as usize; - &INDENTS[0..closest_n] + debug_assert!(n > 0 && n <= 8); // Always triggers. `debug_panic!()` wanted. + " " } } } - - #[inline] - pub fn indent_width(&self, tab_width: usize) -> usize { - match *self { - IndentStyle::Tabs => tab_width, - IndentStyle::Spaces(width) => width as usize, - } - } } /// Attempts to detect the indentation style used in a document. @@ -77,9 +62,9 @@ pub fn auto_detect_indent_style(document_text: &Rope) -> Option<IndentStyle> { // Build a histogram of the indentation *increases* between // subsequent lines, ignoring lines that are all whitespace. // - // Index 0 is for tabs, the rest are 1-MAX_INDENT spaces. - let histogram: [usize; MAX_INDENT as usize + 1] = { - let mut histogram = [0; MAX_INDENT as usize + 1]; + // Index 0 is for tabs, the rest are 1-8 spaces. + let histogram: [usize; 9] = { + let mut histogram = [0; 9]; let mut prev_line_is_tabs = false; let mut prev_line_leading_count = 0usize; @@ -138,7 +123,7 @@ pub fn auto_detect_indent_style(document_text: &Rope) -> Option<IndentStyle> { histogram[0] += 1; } else { let amount = leading_count - prev_line_leading_count; - if amount <= MAX_INDENT as usize { + if amount <= 8 { histogram[amount] += 1; } } @@ -153,12 +138,6 @@ pub fn auto_detect_indent_style(document_text: &Rope) -> Option<IndentStyle> { // Give more weight to tabs, because their presence is a very // strong indicator. histogram[0] *= 2; - // Gives less weight to single indent, as single spaces are - // often used in certain languages' comment systems and rarely - // used as the actual document indentation. - if histogram[1] > 1 { - histogram[1] /= 2; - } histogram }; @@ -194,902 +173,122 @@ pub fn auto_detect_indent_style(document_text: &Rope) -> Option<IndentStyle> { /// To determine indentation of a newly inserted line, figure out the indentation at the last col /// of the previous line. -pub fn indent_level_for_line(line: RopeSlice, tab_width: usize, indent_width: usize) -> usize { +pub fn indent_level_for_line(line: RopeSlice, tab_width: usize) -> usize { let mut len = 0; for ch in line.chars() { match ch { - '\t' => len += tab_width_at(len, tab_width as u16), + '\t' => len += tab_width, ' ' => len += 1, _ => break, } } - len / indent_width -} - -/// Create a string of tabs & spaces that has the same visual width as the given RopeSlice (independent of the tab width). -fn whitespace_with_same_width(text: RopeSlice) -> String { - let mut s = String::new(); - for grapheme in text.graphemes() { - if grapheme == "\t" { - s.push('\t'); - } else { - s.extend(std::iter::repeat_n( - ' ', - grapheme_width(&Cow::from(grapheme)), - )); - } - } - s + len / tab_width } -/// normalizes indentation to tabs/spaces based on user configuration -/// This function does not change the actual indentation width, just the character -/// composition. -pub fn normalize_indentation( - prefix: RopeSlice<'_>, - line: RopeSlice<'_>, - dst: &mut Tendril, - indent_style: IndentStyle, - tab_width: usize, -) -> usize { - #[allow(deprecated)] - let off = crate::visual_coords_at_pos(prefix, prefix.len_chars(), tab_width).col; - let mut len = 0; - let mut original_len = 0; - for ch in line.chars() { - match ch { - '\t' => len += tab_width_at(len + off, tab_width as u16), - ' ' => len += 1, - _ => break, - } - original_len += 1; - } - if indent_style == IndentStyle::Tabs { - dst.extend(std::iter::repeat_n('\t', len / tab_width)); - len %= tab_width; - } - dst.extend(std::iter::repeat_n(' ', len)); - original_len -} +/// Find the highest syntax node at position. +/// This is to identify the column where this node (e.g., an HTML closing tag) ends. +fn get_highest_syntax_node_at_bytepos(syntax: &Syntax, pos: usize) -> Option<Node> { + let tree = syntax.tree(); -fn add_indent_level( - mut base_indent: String, - added_indent_level: isize, - indent_style: &IndentStyle, - tab_width: usize, -) -> String { - if added_indent_level >= 0 { - // Adding a non-negative indent is easy, we can simply append the indent string - base_indent.push_str(&indent_style.as_str().repeat(added_indent_level as usize)); - base_indent - } else { - // In this case, we want to return a prefix of `base_indent`. - // Since the width of a tab depends on its offset, we cannot simply iterate over - // the chars of `base_indent` in reverse until we have the desired indent reduction, - // instead we iterate over them twice in forward direction. - let base_indent_rope = RopeSlice::from(base_indent.as_str()); - #[allow(deprecated)] - let base_indent_width = - crate::visual_coords_at_pos(base_indent_rope, base_indent_rope.len_chars(), tab_width) - .col; - let target_indent_width = base_indent_width - .saturating_sub((-added_indent_level) as usize * indent_style.indent_width(tab_width)); - #[allow(deprecated)] - let char_end_idx = crate::pos_at_visual_coords( - base_indent_rope, - Position { - row: 0, - col: target_indent_width, - }, - tab_width, - ); - let byte_end_idx = base_indent_rope.char_to_byte(char_end_idx); - base_indent.truncate(byte_end_idx); - base_indent - } -} + // named_descendant + let mut node = tree.root_node().descendant_for_byte_range(pos, pos)?; -/// Return true if only whitespace comes before the node on its line. -/// If given, new_line_byte_pos is treated the same way as any existing newline. -fn is_first_in_line(node: &Node, text: RopeSlice, new_line_byte_pos: Option<u32>) -> bool { - let line = text.byte_to_line(node.start_byte() as usize); - let mut line_start_byte_pos = text.line_to_byte(line) as u32; - if let Some(pos) = new_line_byte_pos { - if line_start_byte_pos < pos && pos <= node.start_byte() { - line_start_byte_pos = pos; - } - } - text.byte_slice(line_start_byte_pos as usize..node.start_byte() as usize) - .chars() - .all(|c| c.is_whitespace()) -} - -#[derive(Debug, Default)] -pub struct IndentQueryPredicates { - not_kind_eq: Vec<(Capture, Box<str>)>, - same_line: Option<(Capture, Capture, bool)>, - one_line: Option<(Capture, bool)>, -} - -impl IndentQueryPredicates { - fn are_satisfied( - &self, - match_: &QueryMatch, - text: RopeSlice, - new_line_byte_pos: Option<u32>, - ) -> bool { - for (capture, not_expected_kind) in self.not_kind_eq.iter() { - let node = match_.nodes_for_capture(*capture).next(); - if node.is_some_and(|n| n.kind() == not_expected_kind.as_ref()) { - return false; - } - } - - if let Some((capture1, capture2, negated)) = self.same_line { - let n1 = match_.nodes_for_capture(capture1).next(); - let n2 = match_.nodes_for_capture(capture2).next(); - let satisfied = n1.zip(n2).is_some_and(|(n1, n2)| { - let n1_line = get_node_start_line(text, n1, new_line_byte_pos); - let n2_line = get_node_start_line(text, n2, new_line_byte_pos); - let same_line = n1_line == n2_line; - same_line != negated - }); - - if !satisfied { - return false; - } - } - - if let Some((capture, negated)) = self.one_line { - let node = match_.nodes_for_capture(capture).next(); - let satisfied = node.is_some_and(|node| { - let start_line = get_node_start_line(text, node, new_line_byte_pos); - let end_line = get_node_end_line(text, node, new_line_byte_pos); - let one_line = end_line == start_line; - one_line != negated - }); - - if !satisfied { - return false; - } - } - - true - } -} - -#[derive(Debug)] -pub struct IndentQuery { - query: Query, - properties: HashMap<Pattern, IndentScope>, - predicates: HashMap<Pattern, IndentQueryPredicates>, - indent_capture: Option<Capture>, - indent_always_capture: Option<Capture>, - outdent_capture: Option<Capture>, - outdent_always_capture: Option<Capture>, - align_capture: Option<Capture>, - anchor_capture: Option<Capture>, - extend_capture: Option<Capture>, - extend_prevent_once_capture: Option<Capture>, -} - -impl IndentQuery { - pub fn new(grammar: Grammar, source: &str) -> Result<Self, tree_sitter::query::ParseError> { - let mut properties = HashMap::new(); - let mut predicates: HashMap<Pattern, IndentQueryPredicates> = HashMap::new(); - let query = Query::new(grammar, source, |pattern, predicate| match predicate { - UserPredicate::SetProperty { key: "scope", val } => { - let scope = match val { - Some("all") => IndentScope::All, - Some("tail") => IndentScope::Tail, - Some(other) => { - return Err(format!("unknown scope (#set! scope \"{other}\")").into()) - } - None => return Err("missing scope value (#set! scope ...)".into()), - }; - - properties.insert(pattern, scope); - - Ok(()) - } - UserPredicate::Other(predicate) => { - let name = predicate.name(); - match name { - "not-kind-eq?" => { - predicate.check_arg_count(2)?; - let capture = predicate.capture_arg(0)?; - let not_expected_kind = predicate.str_arg(1)?; - - predicates - .entry(pattern) - .or_default() - .not_kind_eq - .push((capture, not_expected_kind.into())); - Ok(()) - } - "same-line?" | "not-same-line?" => { - predicate.check_arg_count(2)?; - let capture1 = predicate.capture_arg(0)?; - let capture2 = predicate.capture_arg(1)?; - let negated = name == "not-same-line?"; - - predicates.entry(pattern).or_default().same_line = - Some((capture1, capture2, negated)); - Ok(()) - } - "one-line?" | "not-one-line?" => { - predicate.check_arg_count(1)?; - let capture = predicate.capture_arg(0)?; - let negated = name == "not-one-line?"; - - predicates.entry(pattern).or_default().one_line = Some((capture, negated)); - Ok(()) - } - _ => Err(InvalidPredicateError::unknown(UserPredicate::Other( - predicate, - ))), - } - } - _ => Err(InvalidPredicateError::unknown(predicate)), - })?; - - Ok(Self { - properties, - predicates, - indent_capture: query.get_capture("indent"), - indent_always_capture: query.get_capture("indent.always"), - outdent_capture: query.get_capture("outdent"), - outdent_always_capture: query.get_capture("outdent.always"), - align_capture: query.get_capture("align"), - anchor_capture: query.get_capture("anchor"), - extend_capture: query.get_capture("extend"), - extend_prevent_once_capture: query.get_capture("extend.prevent-once"), - query, - }) - } -} - -/// The total indent for some line of code. -/// This is usually constructed in one of 2 ways: -/// - Successively add indent captures to get the (added) indent from a single line -/// - Successively add the indent results for each line -/// The string that this indentation defines starts with the string contained in the align field (unless it is None), followed by: -/// - max(0, indent - outdent) tabs, if tabs are used for indentation -/// - max(0, indent - outdent)*indent_width spaces, if spaces are used for indentation -#[derive(Default, Debug, PartialEq, Eq, Clone)] -pub struct Indentation<'a> { - indent: usize, - indent_always: usize, - outdent: usize, - outdent_always: usize, - /// The alignment, as a string containing only tabs & spaces. Storing this as a string instead of e.g. - /// the (visual) width ensures that the alignment is preserved even if the tab width changes. - align: Option<RopeSlice<'a>>, -} - -impl<'a> Indentation<'a> { - /// Add some other [Indentation] to this. - /// The added indent should be the total added indent from one line. - /// Indent should always be added starting from the bottom (or equivalently, the innermost tree-sitter node). - fn add_line(&mut self, added: Indentation<'a>) { - // Align overrides the indent from outer scopes. - if self.align.is_some() { - return; - } - if added.align.is_some() { - self.align = added.align; - return; - } - self.indent += added.indent; - self.indent_always += added.indent_always; - self.outdent += added.outdent; - self.outdent_always += added.outdent_always; - } - - /// Add an indent capture to this indent. - /// Only captures that apply to the same line should be added together in this way (otherwise use `add_line`) - /// and the captures should be added starting from the innermost tree-sitter node (currently this only matters - /// if multiple `@align` patterns occur on the same line). - fn add_capture(&mut self, added: IndentCaptureType<'a>) { - match added { - IndentCaptureType::Indent => { - if self.indent_always == 0 { - self.indent = 1; - } - } - IndentCaptureType::IndentAlways => { - // any time we encounter an `indent.always` on the same line, we - // want to cancel out all regular indents - self.indent_always += 1; - self.indent = 0; - } - IndentCaptureType::Outdent => { - if self.outdent_always == 0 { - self.outdent = 1; - } - } - IndentCaptureType::OutdentAlways => { - self.outdent_always += 1; - self.outdent = 0; - } - IndentCaptureType::Align(align) => { - if self.align.is_none() { - self.align = Some(align); - } - } - } - } - fn net_indent(&self) -> isize { - (self.indent + self.indent_always) as isize - - ((self.outdent + self.outdent_always) as isize) - } - /// Convert `self` into a string, taking into account the computed and actual indentation of some other line. - fn relative_indent( - &self, - other_computed_indent: &Self, - other_leading_whitespace: RopeSlice, - indent_style: &IndentStyle, - tab_width: usize, - ) -> Option<String> { - if self.align == other_computed_indent.align { - // If self and baseline are either not aligned to anything or both aligned the same way, - // we can simply take `other_leading_whitespace` and add some indent / outdent to it (in the second - // case, the alignment should already be accounted for in `other_leading_whitespace`). - let indent_diff = self.net_indent() - other_computed_indent.net_indent(); - Some(add_indent_level( - String::from(other_leading_whitespace), - indent_diff, - indent_style, - tab_width, - )) + while let Some(parent) = node.parent() { + if parent.start_byte() == node.start_byte() { + node = parent } else { - // If the alignment of both lines is different, we cannot compare their indentation in any meaningful way - None - } - } - pub fn to_string(&self, indent_style: &IndentStyle, tab_width: usize) -> String { - add_indent_level( - self.align - .map_or_else(String::new, whitespace_with_same_width), - self.net_indent(), - indent_style, - tab_width, - ) - } -} - -/// An indent definition which corresponds to a capture from the indent query -#[derive(Debug)] -struct IndentCapture<'a> { - capture_type: IndentCaptureType<'a>, - scope: IndentScope, -} -#[derive(Debug, Clone, PartialEq)] -enum IndentCaptureType<'a> { - Indent, - IndentAlways, - Outdent, - OutdentAlways, - /// Alignment given as a string of whitespace - Align(RopeSlice<'a>), -} - -impl IndentCaptureType<'_> { - fn default_scope(&self) -> IndentScope { - match self { - IndentCaptureType::Indent | IndentCaptureType::IndentAlways => IndentScope::Tail, - IndentCaptureType::Outdent | IndentCaptureType::OutdentAlways => IndentScope::All, - IndentCaptureType::Align(_) => IndentScope::All, + break; } } -} -/// This defines which part of a node an [IndentCapture] applies to. -/// Each [IndentCaptureType] has a default scope, but the scope can be changed -/// with `#set!` property declarations. -#[derive(Debug, Clone, Copy)] -enum IndentScope { - /// The indent applies to the whole node - All, - /// The indent applies to everything except for the first line of the node - Tail, -} -/// A capture from the indent query which does not define an indent but extends -/// the range of a node. This is used before the indent is calculated. -#[derive(Debug)] -enum ExtendCapture { - Extend, - PreventOnce, -} - -/// The result of running a tree-sitter indent query. This stores for -/// each node (identified by its ID) the relevant captures (already filtered -/// by predicates). -#[derive(Debug)] -struct IndentQueryResult<'a> { - indent_captures: HashMap<usize, Vec<IndentCapture<'a>>>, - extend_captures: HashMap<usize, Vec<ExtendCapture>>, -} - -fn get_node_start_line(text: RopeSlice, node: &Node, new_line_byte_pos: Option<u32>) -> usize { - let mut node_line = text.byte_to_line(node.start_byte() as usize); - // Adjust for the new line that will be inserted - if new_line_byte_pos.is_some_and(|pos| node.start_byte() >= pos) { - node_line += 1; - } - node_line -} -fn get_node_end_line(text: RopeSlice, node: &Node, new_line_byte_pos: Option<u32>) -> usize { - let mut node_line = text.byte_to_line(node.end_byte() as usize); - // Adjust for the new line that will be inserted (with a strict inequality since end_byte is exclusive) - if new_line_byte_pos.is_some_and(|pos| node.end_byte() > pos) { - node_line += 1; - } - node_line + Some(node) } -fn query_indents<'a>( +/// Calculate the indentation at a given treesitter node. +/// If newline is false, then any "indent" nodes on the line are ignored ("outdent" still applies). +/// This is because the indentation is only increased starting at the second line of the node. +fn calculate_indentation( query: &IndentQuery, - syntax: &Syntax, - text: RopeSlice<'a>, - range: std::ops::Range<u32>, - new_line_byte_pos: Option<u32>, -) -> IndentQueryResult<'a> { - let mut indent_captures: HashMap<usize, Vec<IndentCapture>> = HashMap::new(); - let mut extend_captures: HashMap<usize, Vec<ExtendCapture>> = HashMap::new(); - - let mut cursor = InactiveQueryCursor::new(range, TREE_SITTER_MATCH_LIMIT).execute_query( - &query.query, - &syntax.tree().root_node(), - RopeInput::new(text), - ); - - // Iterate over all captures from the query - while let Some(m) = cursor.next_match() { - // Skip matches where not all custom predicates are fulfilled - if query - .predicates - .get(&m.pattern()) - .is_some_and(|preds| !preds.are_satisfied(&m, text, new_line_byte_pos)) - { - continue; - } - // A list of pairs (node_id, indent_capture) that are added by this match. - // They cannot be added to indent_captures immediately since they may depend on other captures (such as an @anchor). - let mut added_indent_captures: Vec<(usize, IndentCapture)> = Vec::new(); - // The row/column position of the optional anchor in this query - let mut anchor: Option<&Node> = None; - for matched_node in m.matched_nodes() { - let node_id = matched_node.node.id(); - let capture = Some(matched_node.capture); - let capture_type = if capture == query.indent_capture { - IndentCaptureType::Indent - } else if capture == query.indent_always_capture { - IndentCaptureType::IndentAlways - } else if capture == query.outdent_capture { - IndentCaptureType::Outdent - } else if capture == query.outdent_always_capture { - IndentCaptureType::OutdentAlways - } else if capture == query.align_capture { - IndentCaptureType::Align(RopeSlice::from("")) - } else if capture == query.anchor_capture { - if anchor.is_some() { - log::error!("Invalid indent query: Encountered more than one @anchor in the same match.") - } else { - anchor = Some(&matched_node.node); - } - continue; - } else if capture == query.extend_capture { - extend_captures - .entry(node_id) - .or_insert_with(|| Vec::with_capacity(1)) - .push(ExtendCapture::Extend); - continue; - } else if capture == query.extend_prevent_once_capture { - extend_captures - .entry(node_id) - .or_insert_with(|| Vec::with_capacity(1)) - .push(ExtendCapture::PreventOnce); - continue; - } else { - // Ignore any unknown captures (these may be needed for predicates such as #match?) - continue; - }; - - // Apply additional settings for this capture - let scope = query - .properties - .get(&m.pattern()) - .copied() - .unwrap_or_else(|| capture_type.default_scope()); - let indent_capture = IndentCapture { - capture_type, - scope, - }; - added_indent_captures.push((node_id, indent_capture)) - } - for (node_id, mut capture) in added_indent_captures { - // Set the anchor for all align queries. - if let IndentCaptureType::Align(_) = capture.capture_type { - let Some(anchor) = anchor else { - log::error!("Invalid indent query: @align requires an accompanying @anchor."); - continue; - }; - let line = text.byte_to_line(anchor.start_byte() as usize); - let line_start = text.line_to_byte(line); - capture.capture_type = IndentCaptureType::Align( - text.byte_slice(line_start..anchor.start_byte() as usize), - ); - } - indent_captures - .entry(node_id) - .or_insert_with(|| Vec::with_capacity(1)) - .push(capture); - } - } + node: Option<Node>, + line: usize, + newline: bool, +) -> usize { + let mut increment: isize = 0; - let result = IndentQueryResult { - indent_captures, - extend_captures, + let mut node = match node { + Some(node) => node, + None => return 0, }; - log::trace!("indent result = {:?}", result); + let mut current_line = line; + let mut consider_indent = newline; + let mut increment_from_line: isize = 0; - result -} - -/// Handle extend queries. deepest_preceding is the deepest descendant of node that directly precedes the cursor position. -/// Any ancestor of deepest_preceding which is also a descendant of node may be "extended". In that case, node will be updated, -/// so that the indent computation starts with the correct syntax node. -fn extend_nodes<'a>( - node: &mut Node<'a>, - mut deepest_preceding: Node<'a>, - extend_captures: &HashMap<usize, Vec<ExtendCapture>>, - text: RopeSlice, - line: usize, - tab_width: usize, - indent_width: usize, -) { - let mut stop_extend = false; - - while deepest_preceding != *node { - let mut extend_node = false; - // This will be set to true if this node is captured, regardless of whether - // it actually will be extended (e.g. because the cursor isn't indented - // more than the node). - let mut node_captured = false; - if let Some(captures) = extend_captures.get(&deepest_preceding.id()) { - for capture in captures { - match capture { - ExtendCapture::PreventOnce => { - stop_extend = true; - } - ExtendCapture::Extend => { - node_captured = true; - // We extend the node if - // - the cursor is on the same line as the end of the node OR - // - the line that the cursor is on is more indented than the - // first line of the node - if text.byte_to_line(deepest_preceding.end_byte() as usize) == line { - extend_node = true; - } else { - let cursor_indent = - indent_level_for_line(text.line(line), tab_width, indent_width); - let node_indent = indent_level_for_line( - text.line( - text.byte_to_line(deepest_preceding.start_byte() as usize), - ), - tab_width, - indent_width, - ); - if cursor_indent > node_indent { - extend_node = true; - } - } - } - } + loop { + let node_kind = node.kind(); + let start = node.start_position().row; + if current_line != start { + // Indent/dedent by at most one per line: + // .map(|a| { <-- ({ is two scopes + // let len = 1; <-- indents one level + // }) <-- }) is two scopes + if consider_indent || increment_from_line < 0 { + increment += increment_from_line.signum(); } + increment_from_line = 0; + current_line = start; + consider_indent = true; } - // If we encountered some `StopExtend` capture before, we don't - // extend the node even if we otherwise would - if node_captured && stop_extend { - stop_extend = false; - } else if extend_node && !stop_extend { - *node = deepest_preceding.clone(); - break; - } - // If the tree contains a syntax error, `deepest_preceding` may not - // have a parent despite being a descendant of `node`. - deepest_preceding = match deepest_preceding.parent() { - Some(parent) => parent, - None => return, - } - } -} - -/// Prepare an indent query by computing: -/// - The node from which to start the query (this is non-trivial due to `@extend` captures) -/// - The indent captures for all relevant nodes. -#[allow(clippy::too_many_arguments)] -fn init_indent_query<'a, 'b>( - query: &IndentQuery, - syntax: &'a Syntax, - text: RopeSlice<'b>, - tab_width: usize, - indent_width: usize, - line: usize, - byte_pos: u32, - new_line_byte_pos: Option<u32>, -) -> Option<(Node<'a>, HashMap<usize, Vec<IndentCapture<'b>>>)> { - // The innermost tree-sitter node which is considered for the indent - // computation. It may change if some preceding node is extended - let mut node = syntax - .tree() - .root_node() - .descendant_for_byte_range(byte_pos, byte_pos)?; - let (query_result, deepest_preceding) = { - // The query range should intersect with all nodes directly preceding - // the position of the indent query in case one of them is extended. - let mut deepest_preceding = None; // The deepest node preceding the indent query position - for child in node.children() { - if child.byte_range().end <= byte_pos { - deepest_preceding = Some(child.clone()); - } + if query.outdent.contains(node_kind) { + increment_from_line -= 1; } - deepest_preceding = deepest_preceding.map(|mut prec| { - // Get the deepest directly preceding node - while prec.child_count() > 0 { - prec = prec.child(prec.child_count() - 1).unwrap().clone(); - } - prec - }); - let query_range = deepest_preceding - .as_ref() - .map(|prec| prec.byte_range().end - 1..byte_pos + 1) - .unwrap_or(byte_pos..byte_pos + 1); - - let query_result = query_indents(query, syntax, text, query_range, new_line_byte_pos); - (query_result, deepest_preceding) - }; - let extend_captures = query_result.extend_captures; - - // Check for extend captures, potentially changing the node that the indent calculation starts with - if let Some(deepest_preceding) = deepest_preceding { - extend_nodes( - &mut node, - deepest_preceding, - &extend_captures, - text, - line, - tab_width, - indent_width, - ); - } - Some((node, query_result.indent_captures)) -} - -/// Use the syntax tree to determine the indentation for a given position. -/// This can be used in 2 ways: -/// -/// - To get the correct indentation for an existing line (new_line=false), not necessarily equal to the current indentation. -/// - In this case, pos should be inside the first tree-sitter node on that line. -/// In most cases, this can just be the first non-whitespace on that line. -/// - To get the indentation for a new line (new_line=true). This behaves like the first usecase if the part of the current line -/// after pos were moved to a new line. -/// -/// The indentation is determined by traversing all the tree-sitter nodes containing the position. -/// Each of these nodes produces some [Indentation] for: -/// -/// - The line of the (beginning of the) node. This is defined by the scope `all` if this is the first node on its line. -/// - The line after the node. This is defined by: -/// - The scope `tail`. -/// - The scope `all` if this node is not the first node on its line. -/// -/// Intuitively, `all` applies to everything contained in this node while `tail` applies to everything except for the first line of the node. -/// The indents from different nodes for the same line are then combined. -/// The result [Indentation] is simply the sum of the [Indentation] for all lines. -/// -/// Specifying which line exactly an [Indentation] applies to is important because indents on the same line combine differently than indents on different lines: -/// ```ignore -/// some_function(|| { -/// // Both the function parameters as well as the contained block should be indented. -/// // Because they are on the same line, this only yields one indent level -/// }); -/// ``` -/// -/// ```ignore -/// some_function( -/// param1, -/// || { -/// // Here we get 2 indent levels because the 'parameters' and the 'block' node begin on different lines -/// }, -/// ); -/// ``` -#[allow(clippy::too_many_arguments)] -pub fn treesitter_indent_for_pos<'a>( - query: &IndentQuery, - syntax: &Syntax, - tab_width: usize, - indent_width: usize, - text: RopeSlice<'a>, - line: usize, - pos: usize, - new_line: bool, -) -> Option<Indentation<'a>> { - let byte_pos = text.char_to_byte(pos) as u32; - let new_line_byte_pos = new_line.then_some(byte_pos); - let (mut node, mut indent_captures) = init_indent_query( - query, - syntax, - text, - tab_width, - indent_width, - line, - byte_pos, - new_line_byte_pos, - )?; - - let mut result = Indentation::default(); - // We always keep track of all the indent changes on one line, in order to only indent once - // even if there are multiple "indent" nodes on the same line - let mut indent_for_line = Indentation::default(); - let mut indent_for_line_below = Indentation::default(); - - loop { - let is_first = is_first_in_line(&node, text, new_line_byte_pos); - - // Apply all indent definitions for this node. - // Since we only iterate over each node once, we can remove the - // corresponding captures from the HashMap to avoid cloning them. - if let Some(definitions) = indent_captures.remove(&node.id()) { - for definition in definitions { - match definition.scope { - IndentScope::All => { - if is_first { - indent_for_line.add_capture(definition.capture_type); - } else { - indent_for_line_below.add_capture(definition.capture_type); - } - } - IndentScope::Tail => { - indent_for_line_below.add_capture(definition.capture_type); - } - } - } + if query.indent.contains(node_kind) { + increment_from_line += 1; } if let Some(parent) = node.parent() { - let node_line = get_node_start_line(text, &node, new_line_byte_pos); - let parent_line = get_node_start_line(text, &parent, new_line_byte_pos); - - if node_line != parent_line { - // Don't add indent for the line below the line of the query - if node_line < line + (new_line as usize) { - result.add_line(indent_for_line_below); - } - - if node_line == parent_line + 1 { - indent_for_line_below = indent_for_line; - } else { - result.add_line(indent_for_line); - indent_for_line_below = Indentation::default(); - } - - indent_for_line = Indentation::default(); - } - node = parent; } else { - // Only add the indentation for the line below if that line - // is not after the line that the indentation is calculated for. - let node_start_line = text.byte_to_line(node.start_byte() as usize); - if node_start_line < line - || (new_line && node_start_line == line && node.start_byte() < byte_pos) - { - result.add_line(indent_for_line_below); - } - result.add_line(indent_for_line); break; } } - Some(result) + if consider_indent || increment_from_line < 0 { + increment += increment_from_line.signum(); + } + increment.max(0) as usize } -/// Returns the indentation for a new line. -/// This is done either using treesitter, or if that's not available by copying the indentation from the current line -#[allow(clippy::too_many_arguments)] -pub fn indent_for_newline( - loader: &syntax::Loader, +// TODO: two usecases: if we are triggering this for a new, blank line: +// - it should return 0 when mass indenting stuff +// - it should look up the wrapper node and count it too when we press o/O +pub fn suggested_indent_for_pos( + language_config: Option<&LanguageConfiguration>, syntax: Option<&Syntax>, - indent_heuristic: &IndentationHeuristic, - indent_style: &IndentStyle, - tab_width: usize, text: RopeSlice, - line_before: usize, - line_before_end_pos: usize, - current_line: usize, -) -> String { - let indent_width = indent_style.indent_width(tab_width); - if let ( - IndentationHeuristic::TreeSitter | IndentationHeuristic::Hybrid, - Some(query), - Some(syntax), - ) = ( - indent_heuristic, - syntax.and_then(|syntax| loader.indent_query(syntax.root_language())), + pos: usize, + line: usize, + new_line: bool, +) -> Option<usize> { + if let (Some(query), Some(syntax)) = ( + language_config.and_then(|config| config.indent_query()), syntax, ) { - if let Some(indent) = treesitter_indent_for_pos( - query, - syntax, - tab_width, - indent_width, - text, - line_before, - line_before_end_pos, - true, - ) { - if *indent_heuristic == IndentationHeuristic::Hybrid { - // We want to compute the indentation not only based on the - // syntax tree but also on the actual indentation of a previous - // line. This makes indentation computation more resilient to - // incomplete queries, incomplete source code & differing indentation - // styles for the same language. - // However, using the indent of a previous line as a baseline may not - // make sense, e.g. if it has a different alignment than the new line. - // In order to prevent edge cases with long running times, we only try - // a constant number of (non-empty) lines. - const MAX_ATTEMPTS: usize = 4; - let mut num_attempts = 0; - for line_idx in (0..=line_before).rev() { - let line = text.line(line_idx); - let first_non_whitespace_char = match line.first_non_whitespace_char() { - Some(i) => i, - None => { - continue; - } - }; - if let Some(indent) = (|| { - let computed_indent = treesitter_indent_for_pos( - query, - syntax, - tab_width, - indent_width, - text, - line_idx, - text.line_to_char(line_idx) + first_non_whitespace_char, - false, - )?; - let leading_whitespace = line.slice(0..first_non_whitespace_char); - indent.relative_indent( - &computed_indent, - leading_whitespace, - indent_style, - tab_width, - ) - })() { - return indent; - } - num_attempts += 1; - if num_attempts == MAX_ATTEMPTS { - break; - } - } - } - return indent.to_string(indent_style, tab_width); - }; + let byte_start = text.char_to_byte(pos); + let node = get_highest_syntax_node_at_bytepos(syntax, byte_start); + // TODO: special case for comments + // TODO: if preserve_leading_whitespace + Some(calculate_indentation(query, node, line, new_line)) + } else { + None } - // Fallback in case we either don't have indent queries or they failed for some reason - let indent_level = indent_level_for_line(text.line(current_line), tab_width, indent_width); - indent_style.as_str().repeat(indent_level) } -pub fn get_scopes<'a>(syntax: Option<&'a Syntax>, text: RopeSlice, pos: usize) -> Vec<&'a str> { +pub fn get_scopes(syntax: Option<&Syntax>, text: RopeSlice, pos: usize) -> Vec<&'static str> { let mut scopes = Vec::new(); if let Some(syntax) = syntax { - let pos = text.char_to_byte(pos) as u32; + let pos = text.char_to_byte(pos); let mut node = match syntax .tree() .root_node() @@ -1119,229 +318,164 @@ mod test { #[test] fn test_indent_level() { let tab_width = 4; - let indent_width = 4; let line = Rope::from(" fn new"); // 8 spaces - assert_eq!( - indent_level_for_line(line.slice(..), tab_width, indent_width), - 2 - ); + assert_eq!(indent_level_for_line(line.slice(..), tab_width), 2); let line = Rope::from("\t\t\tfn new"); // 3 tabs - assert_eq!( - indent_level_for_line(line.slice(..), tab_width, indent_width), - 3 - ); + assert_eq!(indent_level_for_line(line.slice(..), tab_width), 3); // mixed indentation let line = Rope::from("\t \tfn new"); // 1 tab, 4 spaces, tab - assert_eq!( - indent_level_for_line(line.slice(..), tab_width, indent_width), - 3 - ); + assert_eq!(indent_level_for_line(line.slice(..), tab_width), 3); } #[test] - fn test_large_indent_level() { - let tab_width = 16; - let indent_width = 16; - let line = Rope::from(" fn new"); // 16 spaces - assert_eq!( - indent_level_for_line(line.slice(..), tab_width, indent_width), - 1 - ); - let line = Rope::from(" fn new"); // 32 spaces - assert_eq!( - indent_level_for_line(line.slice(..), tab_width, indent_width), - 2 - ); - } - - #[test] - fn add_capture() { - let indent = || Indentation { - indent: 1, - ..Default::default() - }; - let indent_always = || Indentation { - indent_always: 1, - ..Default::default() - }; - let outdent = || Indentation { - outdent: 1, - ..Default::default() - }; - let outdent_always = || Indentation { - outdent_always: 1, - ..Default::default() - }; + fn test_suggested_indent_for_line() { + let doc = Rope::from( + " +use std::{ + io::{self, stdout, Stdout, Write}, + path::PathBuf, + sync::Arc, + time::Duration, +} +mod test { + fn hello_world() { + 1 + 1; - fn add_capture<'a>( - mut indent: Indentation<'a>, - capture: IndentCaptureType<'a>, - ) -> Indentation<'a> { - indent.add_capture(capture); - indent - } + let does_indentation_work = 1; - // adding an indent to no indent makes an indent - assert_eq!( - indent(), - add_capture(Indentation::default(), IndentCaptureType::Indent) - ); - assert_eq!( - indent_always(), - add_capture(Indentation::default(), IndentCaptureType::IndentAlways) - ); - assert_eq!( - outdent(), - add_capture(Indentation::default(), IndentCaptureType::Outdent) - ); - assert_eq!( - outdent_always(), - add_capture(Indentation::default(), IndentCaptureType::OutdentAlways) + let test_function = function_with_param(this_param, + that_param ); - // adding an indent to an already indented has no effect - assert_eq!(indent(), add_capture(indent(), IndentCaptureType::Indent)); - assert_eq!( - outdent(), - add_capture(outdent(), IndentCaptureType::Outdent) + let test_function = function_with_param( + this_param, + that_param ); - // adding an always to a regular makes it always - assert_eq!( - indent_always(), - add_capture(indent(), IndentCaptureType::IndentAlways) - ); - assert_eq!( - outdent_always(), - add_capture(outdent(), IndentCaptureType::OutdentAlways) + let test_function = function_with_proper_indent(param1, + param2, ); - // adding an always to an always is additive - assert_eq!( - Indentation { - indent_always: 2, - ..Default::default() - }, - add_capture(indent_always(), IndentCaptureType::IndentAlways) - ); - assert_eq!( - Indentation { - outdent_always: 2, - ..Default::default() - }, - add_capture(outdent_always(), IndentCaptureType::OutdentAlways) + let selection = Selection::new( + changes + .clone() + .map(|(start, end, text): (usize, usize, Option<Tendril>)| { + let len = text.map(|text| text.len()).unwrap() - 1; // minus newline + let pos = start + len; + Range::new(pos, pos) + }) + .collect(), + 0, ); - // adding regular to always should be associative - assert_eq!( - Indentation { - indent_always: 1, - ..Default::default() - }, - add_capture( - add_capture(indent(), IndentCaptureType::Indent), - IndentCaptureType::IndentAlways - ) - ); - assert_eq!( - Indentation { - indent_always: 1, - ..Default::default() - }, - add_capture( - add_capture(indent(), IndentCaptureType::IndentAlways), - IndentCaptureType::Indent - ) - ); - assert_eq!( - Indentation { - outdent_always: 1, - ..Default::default() - }, - add_capture( - add_capture(outdent(), IndentCaptureType::Outdent), - IndentCaptureType::OutdentAlways - ) - ); - assert_eq!( - Indentation { - outdent_always: 1, - ..Default::default() - }, - add_capture( - add_capture(outdent(), IndentCaptureType::OutdentAlways), - IndentCaptureType::Outdent - ) - ); + return; } +} - #[test] - fn test_relative_indent() { - let indent_style = IndentStyle::Spaces(4); - let tab_width: usize = 4; - let no_align = [ - Indentation::default(), - Indentation { - indent: 1, - ..Default::default() - }, - Indentation { - indent: 5, - outdent: 1, - ..Default::default() - }, - ]; - let align = no_align.clone().map(|indent| Indentation { - align: Some(RopeSlice::from("12345")), - ..indent - }); - let different_align = Indentation { - align: Some(RopeSlice::from("123456")), - ..Default::default() - }; +impl<A, D> MyTrait<A, D> for YourType +where + A: TraitB + TraitC, + D: TraitE + TraitF, +{ - // Check that relative and absolute indentation computation are the same when the line we compare to is - // indented as we expect. - let check_consistency = |indent: &Indentation, other: &Indentation| { - assert_eq!( - indent.relative_indent( - other, - RopeSlice::from(other.to_string(&indent_style, tab_width).as_str()), - &indent_style, - tab_width - ), - Some(indent.to_string(&indent_style, tab_width)) - ); +} +#[test] +// +match test { + Some(a) => 1, + None => { + unimplemented!() + } +} +std::panic::set_hook(Box::new(move |info| { + hook(info); +})); + +{ { { + 1 +}}} + +pub fn change<I>(document: &Document, changes: I) -> Self +where + I: IntoIterator<Item = Change> + ExactSizeIterator, +{ + [ + 1, + 2, + 3, + ]; + ( + 1, + 2 + ); + true +} +", + ); + + let doc = doc; + use crate::diagnostic::Severity; + use crate::syntax::{ + Configuration, IndentationConfiguration, LanguageConfiguration, Loader, }; - for a in &no_align { - for b in &no_align { - check_consistency(a, b); - } - } - for a in &align { - for b in &align { - check_consistency(a, b); + use once_cell::sync::OnceCell; + let loader = Loader::new(Configuration { + language: vec![LanguageConfiguration { + scope: "source.rust".to_string(), + file_types: vec!["rs".to_string()], + shebangs: vec![], + language_id: "Rust".to_string(), + highlight_config: OnceCell::new(), + config: None, + // + injection_regex: None, + roots: vec![], + comment_token: None, + auto_format: false, + diagnostic_severity: Severity::Warning, + grammar: None, + language_server: None, + indent: Some(IndentationConfiguration { + tab_width: 4, + unit: String::from(" "), + }), + indent_query: OnceCell::new(), + textobject_query: OnceCell::new(), + debugger: None, + auto_pairs: None, + }], + }); + + // set runtime path so we can find the queries + let mut runtime = std::path::PathBuf::from(env!("CARGO_MANIFEST_DIR")); + runtime.push("../runtime"); + std::env::set_var("HELIX_RUNTIME", runtime.to_str().unwrap()); + + let language_config = loader.language_config_for_scope("source.rust").unwrap(); + let highlight_config = language_config.highlight_config(&[]).unwrap(); + let syntax = Syntax::new(&doc, highlight_config, std::sync::Arc::new(loader)); + let text = doc.slice(..); + let tab_width = 4; + + for i in 0..doc.len_lines() { + let line = text.line(i); + if let Some(pos) = crate::find_first_non_whitespace_char(line) { + let indent = indent_level_for_line(line, tab_width); + assert_eq!( + suggested_indent_for_pos( + Some(&language_config), + Some(&syntax), + text, + text.line_to_char(i) + pos, + i, + false + ), + Some(indent), + "line {}: \"{}\"", + i, + line + ); } } - - // Relative indent computation makes no sense if the alignment differs - assert_eq!( - align[0].relative_indent( - &no_align[0], - RopeSlice::from(" "), - &indent_style, - tab_width - ), - None - ); - assert_eq!( - align[0].relative_indent( - &different_align, - RopeSlice::from(" "), - &indent_style, - tab_width - ), - None - ); } } |