gitingest 0.3.1 → 0.5.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
checksums.yaml CHANGED
@@ -1,7 +1,7 @@
1
1
  ---
2
2
  SHA256:
3
- metadata.gz: 14bcb35132327c7725e69a895d56b4e88fb21db78fa5473c9afb4d08b879b7ee
4
- data.tar.gz: f3a5e06bec7566a268342678887bac14989d69d26f10cbb590e1f594c6779b89
3
+ metadata.gz: c754bbf3a24a049ce269017c82ef90b295b0503cb05cc0e652c0101ce68df484
4
+ data.tar.gz: c3df8efb661ff08e0525da943062882a7a2b467302895f09cbb5dbab38383927
5
5
  SHA512:
6
- metadata.gz: 1aed7d97acae8b6a1c2b15757cdc9852d802c99b83aa73caf114dfc904d0b05c44b70c853cd453fc12868310c09b15bf6bf71dcac203c01b5dfde241dc7ab0f5
7
- data.tar.gz: 07145ca986675723ad0371c873c176384631da660bed227b31ef4cf2680d72cc98479b4da8fb990fedb3dce0eab74ca5114c1222eea0ca1890a85d73726a8d4b
6
+ metadata.gz: 803d3a5bb7ca76c9f51a268d22d485c1455b8ba7ebbe16aa3c5af8eabd63fddef273810ec10fa682b7cf606094b30c1ce681468d2a48a190d546c81a6eb779ca
7
+ data.tar.gz: 6781db79ba3fce1c75f13e8587ceffe8e26d0da276c0c1bbf175f942a9e8e9f1b742884413aabcc6b719a2c010c4156e601aa4577b9604e6edcd7959c67447ec
data/CHANGELOG.md CHANGED
@@ -1,5 +1,39 @@
1
1
  # Changelog
2
2
 
3
+ ## [0.5.0] - 2025-03-10
4
+
5
+ ### Added
6
+ - Added repository directory structure visualization with `--show-structure` / `-s` option
7
+ - Created `DirectoryStructureBuilder` class to generate tree views of repositories
8
+ - Added `generate_directory_structure` method to the Generator class
9
+ - Added tests for directory structure visualization
10
+
11
+ ### Changed
12
+ - Enhanced documentation with directory structure visualization examples
13
+ - Updated CLI help with the new option
14
+
15
+ ---
16
+
17
+ ## [0.4.0] - 2025-03-03
18
+
19
+ ### Added
20
+ - Added `generate_prompt` method for in-memory content generation without file I/O
21
+ - Integrated visual progress bar with file processing rate reporting
22
+ - Added human-readable time formatting for progress estimates
23
+ - Enhanced test coverage for multithreaded operations
24
+
25
+ ### Changed
26
+ - Refactored `process_content_to_output` for better code reuse between file and string output
27
+ - Improved thread management to handle various error conditions more gracefully
28
+ - Enhanced documentation with programmatic usage examples
29
+
30
+ ### Fixed
31
+ - Resolved thread pool shutdown issues in test environment
32
+ - Fixed race conditions in progress indicator updates
33
+ - Addressed timing inconsistencies in multithreaded test scenarios
34
+
35
+ ---
36
+
3
37
  ## [0.3.1] - 2025-03-03
4
38
 
5
39
  ### Added
data/README.md CHANGED
@@ -1,3 +1,6 @@
1
+ [![Gem Version](https://badge.fury.io/rb/gitingest.svg?icon=si%3Arubygems)](https://badge.fury.io/rb/gitingest)
2
+ ![Gem Total Downloads](https://img.shields.io/gem/dt/gitingest?style=flat-square&link=https%3A%2F%2Frubygems.org%2Fgems%2Fgitingest)
3
+
1
4
  # Gitingest
2
5
 
3
6
  Gitingest is a Ruby gem that fetches files from a GitHub repository and generates a consolidated text prompt, which can be used as input for large language models, documentation generation, or other purposes.
@@ -39,6 +42,18 @@ gitingest --repository user/repo --branch develop
39
42
  # Exclude additional patterns
40
43
  gitingest --repository user/repo --exclude "*.md,docs/"
41
44
 
45
+ # Control the number of threads
46
+ gitingest --repository user/repo -T 4
47
+
48
+ # Set thread pool shutdown timeout
49
+ gitingest --repository user/repo -W 120
50
+
51
+ # Show repository directory structure
52
+ gitingest --repository user/repo -s
53
+
54
+ # Combine threading options
55
+ gitingest --repository user/repo -T 8 -W 90
56
+
42
57
  # Quiet mode
43
58
  gitingest --repository user/repo --quiet
44
59
 
@@ -53,20 +68,41 @@ gitingest --repository user/repo --verbose
53
68
  - `-o, --output FILE`: Output file for the prompt [Default: reponame_prompt.txt]
54
69
  - `-e, --exclude PATTERN`: File patterns to exclude (comma separated)
55
70
  - `-b, --branch BRANCH`: Repository branch [Default: main]
71
+ - `-s, --show-structure`: Show repository directory structure instead of generating prompt
72
+ - `-T, --threads COUNT`: Number of concurrent threads [Default: auto-detected]
73
+ - `-W, --thread-timeout SECONDS`: Thread pool shutdown timeout [Default: 60]
74
+ - `-q, --quiet`: Reduce logging to errors only
75
+ - `-v, --verbose`: Increase logging verbosity
56
76
  - `-h, --help`: Show help message
57
77
 
78
+ ### Directory Structure Visualization
79
+
80
+ ```bash
81
+ gitingest --repository user/repo --show-structure
82
+ ```
83
+
84
+ This will display a tree view of the repository's structure:
85
+
58
86
  ### As a Library
59
87
 
60
88
  ```ruby
61
89
  require "gitingest"
62
90
 
63
- # Basic usage
91
+ # Basic usage - write to a file
64
92
  generator = Gitingest::Generator.new(
65
93
  repository: "user/repo",
66
94
  token: "YOUR_GITHUB_TOKEN" # optional
67
95
  )
96
+
97
+ # Run the full workflow (fetch repository and generate file)
68
98
  generator.run
69
99
 
100
+ # OR generate file only (if you need the output path)
101
+ output_path = generator.generate_file
102
+
103
+ # Get content as a string (for in-memory processing)
104
+ content = generator.generate_prompt
105
+
70
106
  # With custom options
71
107
  generator = Gitingest::Generator.new(
72
108
  repository: "user/repo",
@@ -74,9 +110,10 @@ generator = Gitingest::Generator.new(
74
110
  output_file: "my_prompt.txt",
75
111
  branch: "develop",
76
112
  exclude: ["*.md", "docs/"],
77
- quiet: true # or verbose: true
113
+ threads: 4, # control concurrency
114
+ thread_timeout: 120, # custom thread timeout
115
+ quiet: true # or verbose: true
78
116
  )
79
- generator.run
80
117
 
81
118
  # With custom logger
82
119
  custom_logger = Logger.new("gitingest.log")
@@ -84,7 +121,6 @@ generator = Gitingest::Generator.new(
84
121
  repository: "user/repo",
85
122
  logger: custom_logger
86
123
  )
87
- generator.run
88
124
  ```
89
125
 
90
126
  ## Features
@@ -124,4 +160,4 @@ Inspired by [`cyclotruc/gitingest`](https://github.com/cyclotruc/gitingest).
124
160
 
125
161
  ## License
126
162
 
127
- The gem is available as open source under the terms of the [MIT License](https://opensource.org/licenses/MIT).
163
+ The gem is available as open source under the terms of the [MIT License](https://opensource.org/licenses/MIT).
data/bin/gitingest CHANGED
@@ -22,7 +22,7 @@ parser = OptionParser.new do |opts|
22
22
  options[:output_file] = file
23
23
  end
24
24
 
25
- opts.on("-b", "--branch BRANCH", "Repository branch") do |branch|
25
+ opts.on("-b", "--branch BRANCH", "Repository branch [Default: main]") do |branch|
26
26
  options[:branch] = branch
27
27
  end
28
28
 
@@ -30,11 +30,24 @@ parser = OptionParser.new do |opts|
30
30
  options[:exclude] = pattern.split(",")
31
31
  end
32
32
 
33
- opts.on("-q", "--quiet", "Disable all output except errors") do
33
+ opts.on("-T", "--threads COUNT", Integer, "Number of concurrent threads [Default: auto-detected]") do |threads|
34
+ options[:threads] = threads
35
+ end
36
+
37
+ opts.on("-W", "--thread-timeout SECONDS", Integer,
38
+ "Thread pool shutdown timeout in seconds [Default: 60]") do |timeout|
39
+ options[:thread_timeout] = timeout
40
+ end
41
+
42
+ opts.on("-s", "--show-structure", "Show repository directory structure") do
43
+ options[:show_structure] = true
44
+ end
45
+
46
+ opts.on("-q", "--quiet", "Reduce logging to errors only") do
34
47
  options[:quiet] = true
35
48
  end
36
49
 
37
- opts.on("-v", "--verbose", "Enable verbose output") do
50
+ opts.on("-v", "--verbose", "Increase logging verbosity") do
38
51
  options[:verbose] = true
39
52
  end
40
53
 
@@ -42,6 +55,14 @@ parser = OptionParser.new do |opts|
42
55
  puts opts
43
56
  exit
44
57
  end
58
+
59
+ opts.separator ""
60
+ opts.separator "Examples:"
61
+ opts.separator " gitingest -r user/repo # Basic usage with public repository"
62
+ opts.separator " gitingest -r user/repo -t YOUR_TOKEN # With GitHub token for private repositories"
63
+ opts.separator " gitingest -r user/repo -o custom_prompt.txt # Custom output file"
64
+ opts.separator " gitingest -r user/repo -T 8 # Use 8 threads for processing"
65
+ opts.separator " gitingest -r user/repo -s # Show repository directory structure"
45
66
  end
46
67
 
47
68
  begin
data/index.html CHANGED
@@ -6,6 +6,7 @@
6
6
  <title>Gitingest - GitHub Repository Fetcher and Prompt Generator</title>
7
7
  <link rel="stylesheet" href="https://cdnjs.cloudflare.com/ajax/libs/github-markdown-css/5.2.0/github-markdown.min.css">
8
8
  <style>
9
+ /* Styles remain the same */
9
10
  :root {
10
11
  --bg-color: #0d1117;
11
12
  --text-color: #c9d1d9;
@@ -176,7 +177,7 @@
176
177
  <div class="header">
177
178
  <div class="logo">G</div>
178
179
  <div>
179
- <h1>Gitingest <span class="version-badge">v0.3.0</span></h1>
180
+ <h1>Gitingest <span class="version-badge">v0.5.0</span></h1>
180
181
  <p>A Ruby gem that fetches files from a GitHub repository and generates a consolidated text prompt for LLMs</p>
181
182
  </div>
182
183
  </div>
@@ -213,6 +214,18 @@ gitingest --repository user/repo --branch develop
213
214
  # Exclude additional patterns
214
215
  gitingest --repository user/repo --exclude "*.md,docs/"
215
216
 
217
+ # Show repository directory structure
218
+ gitingest --repository user/repo -s
219
+
220
+ # Control the number of threads
221
+ gitingest --repository user/repo -T 4
222
+
223
+ # Set thread pool shutdown timeout
224
+ gitingest --repository user/repo -W 120
225
+
226
+ # Combine threading options
227
+ gitingest --repository user/repo -T 8 -W 90
228
+
216
229
  # Quiet mode
217
230
  gitingest --repository user/repo --quiet
218
231
 
@@ -226,19 +239,54 @@ gitingest --repository user/repo --verbose</code></pre>
226
239
  <li><code>-o, --output FILE</code>: Output file for the prompt [Default: reponame_prompt.txt]</li>
227
240
  <li><code>-e, --exclude PATTERN</code>: File patterns to exclude (comma separated)</li>
228
241
  <li><code>-b, --branch BRANCH</code>: Repository branch [Default: main]</li>
242
+ <li><code>-s, --show-structure</code>: Show repository directory structure</li>
243
+ <li><code>-T, --threads COUNT</code>: Number of concurrent threads [Default: auto-detected]</li>
244
+ <li><code>-W, --thread-timeout SECONDS</code>: Thread pool shutdown timeout [Default: 60]</li>
245
+ <li><code>-q, --quiet</code>: Reduce logging to errors only</li>
246
+ <li><code>-v, --verbose</code>: Increase logging verbosity</li>
229
247
  <li><code>-h, --help</code>: Show help message</li>
230
248
  </ul>
231
249
 
250
+ <h3>Directory Structure Visualization</h3>
251
+ <p>You can visualize the structure of a repository using the <code>--show-structure</code> option:</p>
252
+ <pre><code>gitingest --repository user/repo --show-structure</code></pre>
253
+
254
+ <p>This will display a tree view of the repository's structure, for example:</p>
255
+ <pre><code>Directory structure:
256
+ └── repo-name/
257
+ ├── README.md
258
+ ├── LICENSE
259
+ ├── lib/
260
+ │ ├── repo-name.rb
261
+ │ └── repo-name/
262
+ │ └── version.rb
263
+ ├── bin/
264
+ │ └── console
265
+ └── spec/
266
+ ├── spec_helper.rb
267
+ └── repo-name_spec.rb</code></pre>
268
+
232
269
  <h3>As a Library</h3>
233
270
  <pre><code>require "gitingest"
234
271
 
235
- # Basic usage
272
+ # Basic usage - write to a file
236
273
  generator = Gitingest::Generator.new(
237
274
  repository: "user/repo",
238
275
  token: "YOUR_GITHUB_TOKEN" # optional
239
276
  )
277
+
278
+ # Run the full workflow (fetch repository and generate file)
240
279
  generator.run
241
280
 
281
+ # OR generate file only (if you need the output path)
282
+ output_path = generator.generate_file
283
+
284
+ # Get content as a string (for in-memory processing)
285
+ content = generator.generate_prompt
286
+
287
+ # Generate and get repository directory structure
288
+ structure = generator.generate_directory_structure
289
+
242
290
  # With custom options
243
291
  generator = Gitingest::Generator.new(
244
292
  repository: "user/repo",
@@ -246,26 +294,32 @@ generator = Gitingest::Generator.new(
246
294
  output_file: "my_prompt.txt",
247
295
  branch: "develop",
248
296
  exclude: ["*.md", "docs/"],
249
- quiet: true # or verbose: true
297
+ threads: 4, # control concurrency
298
+ thread_timeout: 120, # custom thread timeout
299
+ quiet: true, # or verbose: true
300
+ show_structure: true # show directory structure instead of generating prompt
250
301
  )
251
- generator.run
252
302
 
253
303
  # With custom logger
254
304
  custom_logger = Logger.new("gitingest.log")
255
305
  generator = Gitingest::Generator.new(
256
306
  repository: "user/repo",
257
307
  logger: custom_logger
258
- )
259
- generator.run</code></pre>
308
+ )</code></pre>
260
309
 
261
310
  <h2>Features</h2>
262
311
  <ul>
263
312
  <li>Fetches all files from a GitHub repository based on the given branch</li>
264
313
  <li>Automatically excludes common binary files and system files by default</li>
265
314
  <li>Allows custom exclusion patterns for specific file extensions or directories</li>
266
- <li>Uses concurrent processing for faster downloads</li>
267
- <li>Handles GitHub API rate limiting with automatic retry</li>
315
+ <li>Uses concurrent processing with configurable thread count for faster downloads</li>
316
+ <li>Shows real-time progress with visual bar, ETA, and processing rate</li>
317
+ <li>Handles GitHub API rate limiting with automatic retry and exponential backoff</li>
318
+ <li>Optimizes memory usage with buffered writes and thread-local buffers</li>
319
+ <li>Intelligently prioritizes files for better thread distribution</li>
268
320
  <li>Generates a clean, formatted output file with file paths and content</li>
321
+ <li>Provides both file-based and string-based output options</li>
322
+ <li>Visualizes repository directory structure in a tree format</li>
269
323
  </ul>
270
324
 
271
325
  <h2>Default Exclusion Patterns</h2>
@@ -290,6 +344,52 @@ generator.run</code></pre>
290
344
  <div class="changelog">
291
345
  <h2>Changelog</h2>
292
346
 
347
+ <div class="changelog-item">
348
+ <div>
349
+ <span class="changelog-version">v0.5.0</span>
350
+ <span class="changelog-date">- March 4, 2025</span>
351
+ </div>
352
+ <ul class="changelog-list">
353
+ <li>Added repository directory structure visualization with <code>--show-structure</code> option</li>
354
+ <li>Created <code>DirectoryStructureBuilder</code> class to generate tree views of repositories</li>
355
+ <li>Added <code>generate_directory_structure</code> method to the Generator class</li>
356
+ <li>Added tests for the directory structure visualization</li>
357
+ <li>Updated documentation with directory structure visualization examples</li>
358
+ </ul>
359
+ </div>
360
+
361
+ <div class="changelog-item">
362
+ <div>
363
+ <span class="changelog-version">v0.4.0</span>
364
+ <span class="changelog-date">- March 4, 2025</span>
365
+ </div>
366
+ <ul class="changelog-list">
367
+ <li>Added <code>generate_prompt</code> method for in-memory content generation without file I/O</li>
368
+ <li>Integrated visual progress bar with file processing rate reporting</li>
369
+ <li>Added human-readable time formatting for progress estimates</li>
370
+ <li>Enhanced test coverage for multithreaded operations</li>
371
+ <li>Refactored <code>process_content_to_output</code> for better code reuse</li>
372
+ <li>Improved thread management to handle various error conditions gracefully</li>
373
+ <li>Fixed thread pool shutdown issues and race conditions</li>
374
+ </ul>
375
+ </div>
376
+
377
+ <div class="changelog-item">
378
+ <div>
379
+ <span class="changelog-version">v0.3.1</span>
380
+ <span class="changelog-date">- March 3, 2025</span>
381
+ </div>
382
+ <ul class="changelog-list">
383
+ <li>Introduced configurable threading options with <code>:threads</code> and <code>:thread_timeout</code></li>
384
+ <li>Implemented thread-local buffers to reduce mutex contention during file processing</li>
385
+ <li>Added exponential backoff with jitter for rate-limited API requests</li>
386
+ <li>Improved progress indicator with estimated time remaining</li>
387
+ <li>Increased <code>BUFFER_SIZE</code> from 100 to 250 to reduce I/O operations</li>
388
+ <li>Optimized file exclusion check using a combined regex for faster matching</li>
389
+ <li>Improved thread pool efficiency by prioritizing smaller files first</li>
390
+ </ul>
391
+ </div>
392
+
293
393
  <div class="changelog-item">
294
394
  <div>
295
395
  <span class="changelog-version">v0.3.0</span>
@@ -298,7 +398,7 @@ generator.run</code></pre>
298
398
  <ul class="changelog-list">
299
399
  <li>Added <code>faraday-retry</code> gem dependency for better API rate limit handling</li>
300
400
  <li>Implemented thread-safe buffer management with mutex locks</li>
301
- <li>Added new <code>ProgressIndicator</code> class for better CLI progress reporting (showing percentages)</li>
401
+ <li>Added new <code>ProgressIndicator</code> class for better CLI progress reporting</li>
302
402
  <li>Improved memory efficiency with configurable buffer size</li>
303
403
  <li>Enhanced code organization with dedicated methods for file content formatting</li>
304
404
  <li>Added comprehensive method documentation and parameter descriptions</li>
@@ -323,26 +423,6 @@ generator.run</code></pre>
323
423
  <li>Enforced a 1000 file limit to prevent memory overload</li>
324
424
  </ul>
325
425
  </div>
326
-
327
- <div class="changelog-item">
328
- <div>
329
- <span class="changelog-version">v0.1.0</span>
330
- <span class="changelog-date">- March 2, 2025</span>
331
- </div>
332
- <ul class="changelog-list">
333
- <li>Initial release of Gitingest</li>
334
- <li>Core functionality to fetch and process GitHub repository files</li>
335
- <li>Command-line interface for easy interaction</li>
336
- <li>Smart file filtering with default exclusions for common non-code files</li>
337
- <li>Concurrent processing for improved performance</li>
338
- <li>Custom exclude patterns support</li>
339
- <li>GitHub authentication via access tokens</li>
340
- <li>Automatic rate limit handling with retry mechanism</li>
341
- <li>Repository prompt generation with file separation markers</li>
342
- <li>Support for custom branch selection</li>
343
- <li>Custom output file naming options</li>
344
- </ul>
345
- </div>
346
426
  </div>
347
427
 
348
428
  <h2>Contributing</h2>
@@ -357,7 +437,7 @@ generator.run</code></pre>
357
437
 
358
438
  <footer>
359
439
  <p>© 2025 David Santangelo</p>
360
- <p>Last updated: March 2, 2025</p>
440
+ <p>Last updated: March 4, 2025</p>
361
441
  </footer>
362
442
  </body>
363
443
  </html>
@@ -96,6 +96,7 @@ module Gitingest
96
96
  # @option options [Logger] :logger Custom logger instance
97
97
  # @option options [Integer] :threads Number of threads to use (default: auto-detected)
98
98
  # @option options [Integer] :thread_timeout Seconds to wait for thread pool shutdown (default: 60)
99
+ # @option options [Boolean] :show_structure Show repository directory structure (default: false)
99
100
  def initialize(options = {})
100
101
  @options = options
101
102
  @repo_files = []
@@ -106,10 +107,63 @@ module Gitingest
106
107
  compile_excluded_patterns
107
108
  end
108
109
 
109
- # Main execution method
110
+ # Main execution method for command line
110
111
  def run
111
112
  fetch_repository_contents
112
- generate_prompt
113
+
114
+ if @options[:show_structure]
115
+ puts generate_directory_structure
116
+ return
117
+ end
118
+
119
+ generate_file
120
+ end
121
+
122
+ # Generate content and save it to a file
123
+ #
124
+ # @return [String] Path to the generated file
125
+ def generate_file
126
+ fetch_repository_contents if @repo_files.empty?
127
+
128
+ @logger.info "Generating file for #{@options[:repository]}"
129
+ File.open(@options[:output_file], "w") do |file|
130
+ process_content_to_output(file)
131
+ end
132
+
133
+ @logger.info "Prompt generated and saved to #{@options[:output_file]}"
134
+ @options[:output_file]
135
+ end
136
+
137
+ # Generate content and return it as a string
138
+ # Useful for programmatic usage
139
+ #
140
+ # @return [String] The generated repository content
141
+ def generate_prompt
142
+ @logger.info "Generating in-memory prompt for #{@options[:repository]}"
143
+
144
+ fetch_repository_contents if @repo_files.empty?
145
+
146
+ content = StringIO.new
147
+ process_content_to_output(content)
148
+
149
+ result = content.string
150
+ @logger.info "Generated #{result.size} bytes of content in memory"
151
+ result
152
+ end
153
+
154
+ # Generate a textual representation of the repository's directory structure
155
+ #
156
+ # @return [String] The directory structure as a formatted string
157
+ def generate_directory_structure
158
+ fetch_repository_contents if @repo_files.empty?
159
+
160
+ @logger.info "Generating directory structure for #{@options[:repository]}"
161
+
162
+ repo_name = @options[:repository].split("/").last
163
+ structure = DirectoryStructureBuilder.new(repo_name, @repo_files).build
164
+
165
+ @logger.info "\n"
166
+ structure
113
167
  end
114
168
 
115
169
  private
@@ -137,6 +191,7 @@ module Gitingest
137
191
  @options[:exclude] ||= []
138
192
  @options[:threads] ||= DEFAULT_THREAD_COUNT
139
193
  @options[:thread_timeout] ||= DEFAULT_THREAD_TIMEOUT
194
+ @options[:show_structure] ||= false
140
195
  @excluded_patterns = DEFAULT_EXCLUDES + @options[:exclude]
141
196
  end
142
197
 
@@ -202,89 +257,82 @@ module Gitingest
202
257
  path.match?(@combined_exclude_regex)
203
258
  end
204
259
 
205
- # Generate the consolidated prompt file with optimized threading
206
- def generate_prompt
207
- @logger.info "Generating prompt..."
260
+ # Common implementation for both file and string output
261
+ def process_content_to_output(output)
208
262
  @logger.debug "Using thread pool with #{@options[:threads]} threads"
209
263
 
210
264
  buffer = []
211
265
  progress = ProgressIndicator.new(@repo_files.size, @logger)
212
266
 
213
- # Optimization: thread-local buffers to reduce mutex contention
267
+ # Thread-local buffers to reduce mutex contention
214
268
  thread_buffers = {}
215
269
  mutex = Mutex.new
216
270
  errors = []
217
271
 
218
- # Dynamic thread pool based on configuration
272
+ # Thread pool based on configuration
219
273
  pool = Concurrent::FixedThreadPool.new(@options[:threads])
220
274
 
221
- # Group files by priority (smaller files first for better parallelism)
275
+ # Group files by priority
222
276
  prioritized_files = prioritize_files(@repo_files)
223
277
 
224
- File.open(@options[:output_file], "w") do |file|
225
- prioritized_files.each_with_index do |repo_file, index|
226
- pool.post do
227
- # Optimization: Use thread-local buffers
228
- thread_id = Thread.current.object_id
229
- thread_buffers[thread_id] ||= []
230
- local_buffer = thread_buffers[thread_id]
231
-
232
- begin
233
- content = fetch_file_content_with_retry(repo_file.path)
234
- result = format_file_content(repo_file.path, content)
235
- local_buffer << result
236
-
237
- # Optimization: Only acquire mutex when local buffer reaches threshold
238
- if local_buffer.size >= LOCAL_BUFFER_THRESHOLD
239
- mutex.synchronize do
240
- buffer.concat(local_buffer)
241
- write_buffer(file, buffer) if buffer.size >= BUFFER_SIZE
242
- local_buffer.clear
243
- end
244
- end
278
+ prioritized_files.each_with_index do |repo_file, index|
279
+ pool.post do
280
+ thread_id = Thread.current.object_id
281
+ thread_buffers[thread_id] ||= []
282
+ local_buffer = thread_buffers[thread_id]
245
283
 
246
- progress.update(index + 1)
247
- rescue Octokit::Error => e
248
- mutex.synchronize do
249
- errors << "Error fetching #{repo_file.path}: #{e.message}"
250
- @logger.error "Error fetching #{repo_file.path}: #{e.message}"
251
- end
252
- rescue StandardError => e
284
+ begin
285
+ content = fetch_file_content_with_retry(repo_file.path)
286
+ result = format_file_content(repo_file.path, content)
287
+ local_buffer << result
288
+
289
+ if local_buffer.size >= LOCAL_BUFFER_THRESHOLD
253
290
  mutex.synchronize do
254
- errors << "Unexpected error processing #{repo_file.path}: #{e.message}"
255
- @logger.error "Unexpected error processing #{repo_file.path}: #{e.message}"
291
+ buffer.concat(local_buffer)
292
+ write_buffer(output, buffer) if buffer.size >= BUFFER_SIZE
293
+ local_buffer.clear
256
294
  end
257
295
  end
296
+
297
+ progress.update(index + 1)
298
+ rescue Octokit::Error => e
299
+ mutex.synchronize do
300
+ errors << "Error fetching #{repo_file.path}: #{e.message}"
301
+ @logger.error "Error fetching #{repo_file.path}: #{e.message}"
302
+ end
303
+ rescue StandardError => e
304
+ mutex.synchronize do
305
+ errors << "Unexpected error processing #{repo_file.path}: #{e.message}"
306
+ @logger.error "Unexpected error processing #{repo_file.path}: #{e.message}"
307
+ end
258
308
  end
259
309
  end
310
+ end
260
311
 
261
- begin
262
- pool.shutdown
263
- wait_success = pool.wait_for_termination(@options[:thread_timeout])
312
+ begin
313
+ pool.shutdown
314
+ wait_success = pool.wait_for_termination(@options[:thread_timeout])
264
315
 
265
- unless wait_success
266
- @logger.warn "Thread pool did not shut down within #{@options[:thread_timeout]} seconds, forcing termination"
267
- pool.kill
268
- end
269
- rescue StandardError => e
270
- @logger.error "Error during thread pool shutdown: #{e.message}"
316
+ unless wait_success
317
+ @logger.warn "Thread pool did not shut down within #{@options[:thread_timeout]} seconds, forcing termination"
318
+ pool.kill
271
319
  end
320
+ rescue StandardError => e
321
+ @logger.error "Error during thread pool shutdown: #{e.message}"
322
+ end
272
323
 
273
- # Process remaining files in thread-local buffers
274
- mutex.synchronize do
275
- thread_buffers.each_value do |local_buffer|
276
- buffer.concat(local_buffer) unless local_buffer.empty?
277
- end
278
- write_buffer(file, buffer) unless buffer.empty?
324
+ # Process remaining files in thread-local buffers
325
+ mutex.synchronize do
326
+ thread_buffers.each_value do |local_buffer|
327
+ buffer.concat(local_buffer) unless local_buffer.empty?
279
328
  end
329
+ write_buffer(output, buffer) unless buffer.empty?
280
330
  end
281
331
 
282
- if errors.any?
283
- @logger.warn "Completed with #{errors.size} errors"
284
- @logger.debug "First few errors: #{errors.first(3).join(", ")}" if @logger.debug?
285
- end
332
+ return unless errors.any?
286
333
 
287
- @logger.info "Prompt generated and saved to #{@options[:output_file]}"
334
+ @logger.warn "Completed with #{errors.size} errors"
335
+ @logger.debug "First few errors: #{errors.first(3).join(", ")}" if @logger.debug?
288
336
  end
289
337
 
290
338
  # Format a file's content for the prompt
@@ -416,4 +464,57 @@ module Gitingest
416
464
  end
417
465
  end
418
466
  end
467
+
468
+ # Helper class to build directory structure visualization
469
+ class DirectoryStructureBuilder
470
+ def initialize(root_name, files)
471
+ @root_name = root_name
472
+ @files = files.map(&:path)
473
+ end
474
+
475
+ def build
476
+ tree = { @root_name => {} }
477
+
478
+ @files.sort.each do |path|
479
+ parts = path.split("/")
480
+ current = tree[@root_name]
481
+
482
+ parts.each do |part|
483
+ if part == parts.last
484
+ current[part] = nil
485
+ else
486
+ current[part] ||= {}
487
+ current = current[part]
488
+ end
489
+ end
490
+ end
491
+
492
+ output = ["Directory structure:"]
493
+ render_tree(tree, "", output)
494
+ output.join("\n")
495
+ end
496
+
497
+ private
498
+
499
+ def render_tree(tree, prefix, output)
500
+ return if tree.nil?
501
+
502
+ tree.keys.each_with_index do |key, index|
503
+ is_last = index == tree.keys.size - 1
504
+ current_prefix = prefix
505
+
506
+ if prefix.empty?
507
+ output << "└── #{key}/"
508
+ current_prefix = " "
509
+ else
510
+ connector = is_last ? "└── " : "├── "
511
+ item = tree[key].is_a?(Hash) ? "#{key}/" : key
512
+ output << "#{prefix}#{connector}#{item}"
513
+ current_prefix = prefix + (is_last ? " " : "│ ")
514
+ end
515
+
516
+ render_tree(tree[key], current_prefix, output) if tree[key].is_a?(Hash)
517
+ end
518
+ end
519
+ end
419
520
  end
@@ -1,5 +1,5 @@
1
1
  # frozen_string_literal: true
2
2
 
3
3
  module Gitingest
4
- VERSION = "0.3.1"
4
+ VERSION = "0.5.0"
5
5
  end
metadata CHANGED
@@ -1,14 +1,14 @@
1
1
  --- !ruby/object:Gem::Specification
2
2
  name: gitingest
3
3
  version: !ruby/object:Gem::Version
4
- version: 0.3.1
4
+ version: 0.5.0
5
5
  platform: ruby
6
6
  authors:
7
7
  - Davide Santangelo
8
8
  autorequire:
9
9
  bindir: bin
10
10
  cert_chain: []
11
- date: 2025-03-02 00:00:00.000000000 Z
11
+ date: 2025-03-10 00:00:00.000000000 Z
12
12
  dependencies:
13
13
  - !ruby/object:Gem::Dependency
14
14
  name: concurrent-ruby