RubyGems - rfmt - Versions diffs - 1.5.2 → 1.6.0 - Mend

rfmt 1.5.2 → 1.6.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (33) hide show

checksums.yaml +4 -4
data/CHANGELOG.md +36 -0
data/Cargo.lock +266 -92
data/README.md +22 -18
data/ext/rfmt/Cargo.toml +4 -1
data/ext/rfmt/src/doc/builders.rs +528 -0
data/ext/rfmt/src/doc/mod.rs +220 -0
data/ext/rfmt/src/doc/printer.rs +684 -0
data/ext/rfmt/src/format/context.rs +448 -0
data/ext/rfmt/src/format/formatter.rs +226 -0
data/ext/rfmt/src/format/mod.rs +35 -0
data/ext/rfmt/src/format/registry.rs +195 -0
data/ext/rfmt/src/format/rule.rs +555 -0
data/ext/rfmt/src/format/rules/begin.rs +295 -0
data/ext/rfmt/src/format/rules/body_end.rs +109 -0
data/ext/rfmt/src/format/rules/call.rs +409 -0
data/ext/rfmt/src/format/rules/case.rs +359 -0
data/ext/rfmt/src/format/rules/class.rs +160 -0
data/ext/rfmt/src/format/rules/def.rs +216 -0
data/ext/rfmt/src/format/rules/fallback.rs +116 -0
data/ext/rfmt/src/format/rules/if_unless.rs +407 -0
data/ext/rfmt/src/format/rules/loops.rs +325 -0
data/ext/rfmt/src/format/rules/mod.rs +31 -0
data/ext/rfmt/src/format/rules/module.rs +150 -0
data/ext/rfmt/src/format/rules/singleton_class.rs +202 -0
data/ext/rfmt/src/format/rules/statements.rs +122 -0
data/ext/rfmt/src/format/rules/variable_write.rs +296 -0
data/ext/rfmt/src/lib.rs +8 -5
data/ext/rfmt/src/parser/prism_adapter.rs +157 -2
data/lib/rfmt/version.rb +1 -1
data/lib/ruby_lsp/rfmt/formatter_runner.rb +2 -0
metadata +23 -2
data/ext/rfmt/src/emitter/mod.rs +0 -1760

data/ext/rfmt/src/format/rule.rs ADDED Viewed

@@ -0,0 +1,555 @@
+//! FormatRule trait and helper functions
+//!
+//! This module defines the core FormatRule trait that all formatting rules implement,
+//! along with shared helper functions for common formatting patterns.
+use crate::ast::Node;
+use crate::doc::{concat, hardline, leading_comment, trailing_comment, Doc};
+use crate::error::Result;
+use super::context::FormatContext;
+use super::registry::RuleRegistry;
+/// Trait for formatting rules.
+///
+/// Each rule handles a specific node type (or set of node types) and produces
+/// a Doc IR representation of that node.
+///
+/// Rules are stateless and can be shared across multiple formatting contexts.
+/// The `Send + Sync` supertraits additionally require every implementation to
+/// be safe to share between threads.
+pub trait FormatRule: Send + Sync {
+    /// Formats a node and returns the Doc IR.
+    ///
+    /// # Arguments
+    /// * `node` - The AST node to format
+    /// * `ctx` - The formatting context with source, config, and comment tracking
+    /// * `registry` - The rule registry for recursive formatting
+    ///
+    /// # Returns
+    /// A Doc IR representing the formatted node
+    ///
+    /// # Errors
+    /// Implementations report failure through the crate's `Result` type.
+    fn format(&self, node: &Node, ctx: &mut FormatContext, registry: &RuleRegistry) -> Result<Doc>;
+}
+/// Looks up the rule registered for `child`'s node type and lets it format the node.
+///
+/// Rules call this helper whenever they need to format a nested node, which is
+/// what makes formatting recursive.
+///
+/// # Errors
+/// Propagates whatever error the selected rule returns.
+pub fn format_child(child: &Node, ctx: &mut FormatContext, registry: &RuleRegistry) -> Result<Doc> {
+    registry
+        .get_rule(&child.node_type)
+        .format(child, ctx, registry)
+}
+/// Boxed rule type for dynamic dispatch.
+///
+/// A heap-allocated `dyn FormatRule` trait object, so rules with different
+/// concrete types can be handled through one common type.
+pub type BoxedRule = Box<dyn FormatRule>;
+/// Lightweight comment reference using index instead of cloning.
+///
+/// Only `Copy` data is stored, so a list of these can be gathered while the
+/// formatting context is borrowed immutably and then used after that borrow ends.
+#[derive(Clone, Copy)]
+struct CommentRef {
+    /// Index used to look the comment up again via `FormatContext::get_comment`.
+    idx: usize,
+    /// Copy of the comment's `location.start_line`.
+    start_line: usize,
+    /// Copy of the comment's `location.end_line`.
+    end_line: usize,
+}
+/// Emits the comments that the context reports as lying before `line`.
+///
+/// The comments are taken from `FormatContext::get_comment_indices_before`,
+/// rendered with `leading_comment`, and marked as emitted on the context.
+/// Blank lines found between consecutive comments in the source are kept, and
+/// one extra hardline is appended when the last comment ends more than one line
+/// above `line`.
+///
+/// # Arguments
+/// * `ctx` - The formatting context
+/// * `line` - The line number to get comments before
+///
+/// # Returns
+/// A Doc with the rendered comments, or `Doc::Empty` when there are none
+pub fn format_leading_comments(ctx: &mut FormatContext, line: usize) -> Doc {
+    // Snapshot index and line span of every candidate; only shared borrows of `ctx` here.
+    let mut pending: Vec<CommentRef> = Vec::new();
+    for idx in ctx.get_comment_indices_before(line) {
+        if let Some(c) = ctx.get_comment(idx) {
+            pending.push(CommentRef {
+                idx,
+                start_line: c.location.start_line,
+                end_line: c.location.end_line,
+            });
+        }
+    }
+    if pending.is_empty() {
+        return Doc::Empty;
+    }
+    let mut parts: Vec<Doc> = Vec::with_capacity(pending.len() * 2);
+    let mut emitted: Vec<usize> = Vec::with_capacity(pending.len());
+    let mut previous_end: Option<usize> = None;
+    for entry in pending.iter().copied() {
+        // A distance of N lines between two comments means N - 1 blank lines to keep.
+        let blank_lines = match previous_end {
+            Some(end) => entry.start_line.saturating_sub(end).saturating_sub(1),
+            None => 0,
+        };
+        for _ in 0..blank_lines {
+            parts.push(hardline());
+        }
+        if let Some(comment) = ctx.get_comment(entry.idx) {
+            parts.push(leading_comment(&comment.text, true));
+        }
+        previous_end = Some(entry.end_line);
+        emitted.push(entry.idx);
+    }
+    // Single batched update of the emitted set.
+    ctx.mark_comments_emitted(emitted);
+    // Keep a separating blank line when the source had one between the comments and the node.
+    if previous_end.map_or(false, |end| line > end + 1) {
+        parts.push(hardline());
+    }
+    concat(parts)
+}
+/// Emits the trailing comment(s) the context associates with `line`.
+///
+/// Every index yielded by `FormatContext::get_trailing_comment_indices` is
+/// rendered with `trailing_comment` and then marked as emitted.
+///
+/// # Arguments
+/// * `ctx` - The formatting context
+/// * `line` - The line number to get trailing comments for
+///
+/// # Returns
+/// A Doc containing the trailing comment(s), or `Doc::Empty` if none
+pub fn format_trailing_comment(ctx: &mut FormatContext, line: usize) -> Doc {
+    // Materialize the indices first so the shared borrow ends before marking.
+    let indices: Vec<usize> = ctx.get_trailing_comment_indices(line).collect();
+    if indices.is_empty() {
+        return Doc::Empty;
+    }
+    let mut rendered: Vec<Doc> = Vec::with_capacity(indices.len());
+    rendered.extend(
+        indices
+            .iter()
+            .filter_map(|&idx| ctx.get_comment(idx).map(|c| trailing_comment(&c.text))),
+    );
+    // Single batched update of the emitted set.
+    ctx.mark_comments_emitted(indices);
+    concat(rendered)
+}
+/// Emits standalone comments that sit inside a construct, above its closing `end`.
+///
+/// Candidates come from `FormatContext::get_comment_indices_in_range` called
+/// with `start_line + 1` and `end_line`. A candidate is kept only when
+/// `FormatContext::is_standalone_comment` accepts it and it ends before
+/// `end_line`. The output starts with a hardline, preserves blank lines between
+/// consecutive comments, and the kept comments are marked as emitted.
+///
+/// # Arguments
+/// * `ctx` - The formatting context
+/// * `start_line` - The start line of the construct
+/// * `end_line` - The end line of the construct (where `end` appears)
+///
+/// # Returns
+/// A Doc containing the formatted comments, or `Doc::Empty` when none qualify
+pub fn format_comments_before_end(
+    ctx: &mut FormatContext,
+    start_line: usize,
+    end_line: usize,
+) -> Doc {
+    // Select the qualifying comments and snapshot their line spans in one pass.
+    let selected: Vec<CommentRef> = ctx
+        .get_comment_indices_in_range(start_line + 1, end_line)
+        .filter_map(|idx| {
+            let c = ctx.get_comment(idx)?;
+            let qualifies = ctx.is_standalone_comment(c) && c.location.end_line < end_line;
+            qualifies.then(|| CommentRef {
+                idx,
+                start_line: c.location.start_line,
+                end_line: c.location.end_line,
+            })
+        })
+        .collect();
+    if selected.is_empty() {
+        return Doc::Empty;
+    }
+    let mut parts: Vec<Doc> = vec![hardline()];
+    let mut emitted: Vec<usize> = Vec::with_capacity(selected.len());
+    let mut previous_end: Option<usize> = None;
+    for entry in selected.iter().copied() {
+        // A distance of N lines between two comments means N - 1 blank lines to keep.
+        let blank_lines = match previous_end {
+            Some(end) => entry.start_line.saturating_sub(end).saturating_sub(1),
+            None => 0,
+        };
+        for _ in 0..blank_lines {
+            parts.push(hardline());
+        }
+        if let Some(comment) = ctx.get_comment(entry.idx) {
+            parts.push(leading_comment(&comment.text, true));
+        }
+        previous_end = Some(entry.end_line);
+        emitted.push(entry.idx);
+    }
+    // Single batched update of the emitted set.
+    ctx.mark_comments_emitted(emitted);
+    concat(parts)
+}
+/// Emits every comment the context still reports as remaining.
+///
+/// Intended to run after all nodes have been formatted, so comments that were
+/// never attached to a node still reach the output. Line gaps are measured from
+/// `last_code_line` for the first comment and from the previous comment's end
+/// line afterwards. All processed comments are marked as emitted.
+///
+/// # Arguments
+/// * `ctx` - The formatting context
+/// * `last_code_line` - The last line of code in the file
+///
+/// # Returns
+/// A Doc containing all remaining comments, or `Doc::Empty` when there are none
+pub fn format_remaining_comments(ctx: &mut FormatContext, last_code_line: usize) -> Doc {
+    // Snapshot index and line span of each leftover comment.
+    let mut pending: Vec<CommentRef> = Vec::new();
+    for idx in ctx.get_remaining_comment_indices() {
+        if let Some(c) = ctx.get_comment(idx) {
+            pending.push(CommentRef {
+                idx,
+                start_line: c.location.start_line,
+                end_line: c.location.end_line,
+            });
+        }
+    }
+    if pending.is_empty() {
+        return Doc::Empty;
+    }
+    let mut parts: Vec<Doc> = Vec::with_capacity(pending.len() * 2);
+    let mut emitted: Vec<usize> = Vec::with_capacity(pending.len());
+    let mut anchor_line = last_code_line;
+    for (position, entry) in pending.iter().enumerate() {
+        let gap = entry.start_line.saturating_sub(anchor_line);
+        // The very first comment gets no break when it has no gap to the code;
+        // every other case gets at least one break and otherwise one per line of gap.
+        let breaks = if position == 0 && gap == 0 {
+            0
+        } else {
+            gap.max(1)
+        };
+        for _ in 0..breaks {
+            parts.push(hardline());
+        }
+        if let Some(comment) = ctx.get_comment(entry.idx) {
+            parts.push(leading_comment(&comment.text, false));
+        }
+        anchor_line = entry.end_line;
+        emitted.push(entry.idx);
+    }
+    // Single batched update of the emitted set.
+    ctx.mark_comments_emitted(emitted);
+    concat(parts)
+}
+/// Formats the children of a statements node, one after another.
+///
+/// Each child is formatted through `format_child`. Consecutive children are
+/// separated by one hardline, plus a second one when the next child starts more
+/// than one line after the current child ends (i.e. the source had a blank line
+/// between them).
+///
+/// # Arguments
+/// * `node` - The StatementsNode to format
+/// * `ctx` - The formatting context
+/// * `registry` - The rule registry for recursive formatting
+///
+/// # Returns
+/// A Doc containing all statements with line breaks between them, or
+/// `Doc::Empty` when the node has no children
+///
+/// # Errors
+/// Returns the first error produced while formatting a child.
+pub fn format_statements(
+    node: &Node,
+    ctx: &mut FormatContext,
+    registry: &RuleRegistry,
+) -> Result<Doc> {
+    let statements = &node.children;
+    if statements.is_empty() {
+        return Ok(Doc::Empty);
+    }
+    let mut parts: Vec<Doc> = Vec::with_capacity(statements.len() * 2);
+    // Runs one element ahead of the main loop so each statement can see its successor.
+    let mut successors = statements.iter().skip(1);
+    for current in statements.iter() {
+        parts.push(format_child(current, ctx, registry)?);
+        if let Some(following) = successors.next() {
+            let distance = following
+                .location
+                .start_line
+                .saturating_sub(current.location.end_line);
+            parts.push(hardline());
+            if distance > 1 {
+                parts.push(hardline());
+            }
+        }
+    }
+    Ok(concat(parts))
+}
+/// Rewrites a multiline method chain from aligned style to indented style.
+///
+/// - The first line is kept, with trailing whitespace removed.
+/// - Every later line whose first non-blank characters are `.` or `&.` is
+///   trimmed and re-indented by exactly `indent_width` spaces.
+/// - Any other later line (e.g. heredoc content) is copied unchanged.
+///
+/// The input is returned as `Cow::Borrowed` when it has at most one line or no
+/// chain continuation line. The text is split with `str::lines`, so a rewritten
+/// result joins lines with `\n` and does not carry a trailing line terminator.
+///
+/// # Arguments
+/// * `source_text` - The source text containing a method chain
+/// * `indent_width` - The number of spaces for one level of indentation
+///
+/// # Example
+/// ```text
+/// Input (indent_width=2):  "foo.bar\n                  .baz"
+/// Output:                  "foo.bar\n  .baz"
+/// ```
+pub fn reformat_chain_lines(source_text: &str, indent_width: usize) -> std::borrow::Cow<'_, str> {
+    use std::borrow::Cow;
+
+    /// True when the line, ignoring leading whitespace, begins with `.` or `&.`.
+    fn continues_chain(line: &str) -> bool {
+        let body = line.trim_start();
+        body.starts_with('.') || body.starts_with("&.")
+    }
+
+    let mut remaining = source_text.lines();
+    let head = match remaining.next() {
+        Some(first) => first,
+        None => return Cow::Borrowed(source_text),
+    };
+    // Scan a copy of the iterator so the continuation lines can be walked again below.
+    if !remaining.clone().any(|line| continues_chain(line)) {
+        return Cow::Borrowed(source_text);
+    }
+    let pad = " ".repeat(indent_width);
+    let mut rebuilt = String::with_capacity(source_text.len());
+    rebuilt.push_str(head.trim_end());
+    for line in remaining {
+        rebuilt.push('\n');
+        if continues_chain(line) {
+            rebuilt.push_str(&pad);
+            rebuilt.push_str(line.trim());
+        } else {
+            // Non-chain continuation (e.g., heredoc content): preserve as-is
+            rebuilt.push_str(line);
+        }
+    }
+    Cow::Owned(rebuilt)
+}
+/// Flags every comment the context reports for the given line range as emitted.
+///
+/// Used when source text is copied verbatim: comments inside the copied range
+/// are already part of the output and must not be emitted a second time.
+///
+/// # Arguments
+/// * `ctx` - The formatting context
+/// * `start_line` - The start line of the range
+/// * `end_line` - The end line of the range
+pub fn mark_comments_in_range_emitted(ctx: &mut FormatContext, start_line: usize, end_line: usize) {
+    // Gather the indices first; the shared borrow must end before the mutable call.
+    let mut covered: Vec<usize> = Vec::new();
+    covered.extend(ctx.get_comment_indices_in_range(start_line, end_line));
+    ctx.mark_comments_emitted(covered);
+}
+/// Reports whether `node` belongs to definition syntax rather than to a body.
+///
+/// Structural nodes are the pieces of a class/module/method definition that
+/// must not be emitted as body content: constant nodes and the parameter node
+/// kinds listed below.
+pub fn is_structural_node(node: &Node) -> bool {
+    use crate::ast::NodeType;
+    let kind = &node.node_type;
+    matches!(
+        kind,
+        // Constants
+        NodeType::ConstantReadNode
+            | NodeType::ConstantWriteNode
+            | NodeType::ConstantPathNode
+            // Positional parameters
+            | NodeType::RequiredParameterNode
+            | NodeType::OptionalParameterNode
+            | NodeType::RestParameterNode
+            // Keyword parameters
+            | NodeType::KeywordParameterNode
+            | NodeType::RequiredKeywordParameterNode
+            | NodeType::OptionalKeywordParameterNode
+            | NodeType::KeywordRestParameterNode
+            | NodeType::NoKeywordsParameterNode
+            // Block and forwarding parameters
+            | NodeType::BlockParameterNode
+            | NodeType::ForwardingParameterNode
+    )
+}
+// Unit tests for the helpers in this module.
+#[cfg(test)]
+mod tests {
+    use super::*;
+    use crate::ast::{
+        Comment, CommentPosition, CommentType, FormattingInfo, Location, Node, NodeType,
+    };
+    use crate::config::Config;
+    use std::collections::HashMap;
+    /// Builds a single-line `Leading` line comment on `line`, starting at column 0,
+    /// whose end column and end offset are derived from `text.len()`.
+    fn make_comment(text: &str, line: usize, start_offset: usize) -> Comment {
+        Comment {
+            text: text.to_string(),
+            location: Location::new(
+                line,
+                0,
+                line,
+                text.len(),
+                start_offset,
+                start_offset + text.len(),
+            ),
+            comment_type: CommentType::Line,
+            position: CommentPosition::Leading,
+        }
+    }
+    /// Builds a childless `ProgramNode` that carries the given comments.
+    fn make_node_with_comments(comments: Vec<Comment>) -> Node {
+        Node {
+            node_type: NodeType::ProgramNode,
+            location: Location::new(1, 0, 10, 0, 0, 100),
+            children: Vec::new(),
+            metadata: HashMap::new(),
+            comments,
+            formatting: FormattingInfo::default(),
+        }
+    }
+    /// A comment on line 1 must be emitted when asking for comments before line 5.
+    #[test]
+    fn test_format_leading_comments() {
+        let config = Config::default();
+        let source = "# comment\nclass Foo\nend";
+        let mut ctx = FormatContext::new(&config, source);
+        let comment = make_comment("# comment", 1, 0);
+        let node = make_node_with_comments(vec![comment]);
+        ctx.collect_comments(&node);
+        let doc = format_leading_comments(&mut ctx, 5);
+        assert!(!matches!(doc, Doc::Empty));
+    }
+    /// A `Trailing` comment on line 1 must be emitted for line 1.
+    #[test]
+    fn test_format_trailing_comment() {
+        let config = Config::default();
+        let source = "code # trailing";
+        let mut ctx = FormatContext::new(&config, source);
+        let comment = Comment {
+            text: "# trailing".to_string(),
+            location: Location::new(1, 5, 1, 15, 5, 15),
+            comment_type: CommentType::Line,
+            position: CommentPosition::Trailing,
+        };
+        let node = make_node_with_comments(vec![comment]);
+        ctx.collect_comments(&node);
+        let doc = format_trailing_comment(&mut ctx, 1);
+        assert!(!matches!(doc, Doc::Empty));
+    }
+    /// `ConstantReadNode` is structural; `CallNode` is not.
+    #[test]
+    fn test_is_structural_node() {
+        let structural_node = Node {
+            node_type: NodeType::ConstantReadNode,
+            location: Location::new(1, 0, 1, 3, 0, 3),
+            children: Vec::new(),
+            metadata: HashMap::new(),
+            comments: Vec::new(),
+            formatting: FormattingInfo::default(),
+        };
+        let non_structural_node = Node {
+            node_type: NodeType::CallNode,
+            location: Location::new(1, 0, 1, 10, 0, 10),
+            children: Vec::new(),
+            metadata: HashMap::new(),
+            comments: Vec::new(),
+            formatting: FormattingInfo::default(),
+        };
+        assert!(is_structural_node(&structural_node));
+        assert!(!is_structural_node(&non_structural_node));
+    }
+    /// Formatting a `CallNode` through the default registry yields a non-empty Doc.
+    #[test]
+    fn test_format_child() {
+        let config = Config::default();
+        let source = "puts 'hello'";
+        let mut ctx = FormatContext::new(&config, source);
+        let registry = RuleRegistry::default_registry();
+        let node = Node {
+            node_type: NodeType::CallNode,
+            location: Location::new(1, 0, 1, 12, 0, 12),
+            children: Vec::new(),
+            metadata: HashMap::new(),
+            comments: Vec::new(),
+            formatting: FormattingInfo::default(),
+        };
+        ctx.collect_comments(&node);
+        let doc = format_child(&node, &mut ctx, &registry).unwrap();
+        assert!(!matches!(doc, Doc::Empty));
+    }
+    /// Single-line input comes back unchanged.
+    #[test]
+    fn test_reformat_chain_lines_single_line() {
+        let input = "foo.bar.baz";
+        let result = reformat_chain_lines(input, 2);
+        assert_eq!(result, "foo.bar.baz");
+    }
+    /// Aligned `.method` continuation lines are re-indented to `indent_width` spaces.
+    #[test]
+    fn test_reformat_chain_lines_multiline_chain() {
+        let input = "foo.bar\n                  .baz\n                  .qux";
+        let result = reformat_chain_lines(input, 2);
+        assert_eq!(result, "foo.bar\n  .baz\n  .qux");
+    }
+    /// Safe-navigation (`&.`) continuation lines are re-indented as well.
+    #[test]
+    fn test_reformat_chain_lines_safe_navigation() {
+        let input = "foo&.bar\n                  &.baz";
+        let result = reformat_chain_lines(input, 2);
+        assert_eq!(result, "foo&.bar\n  &.baz");
+    }
+    /// Multiline input without any chain continuation line is left as-is.
+    #[test]
+    fn test_reformat_chain_lines_no_chain() {
+        let input = "foo(\n  arg1,\n  arg2\n)";
+        let result = reformat_chain_lines(input, 2);
+        assert_eq!(result, input);
+    }
+}