gitingest 0.4.0 → 0.5.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
checksums.yaml CHANGED
@@ -1,7 +1,7 @@
1
1
  ---
2
2
  SHA256:
3
- metadata.gz: 114b6d8e954843f88917f556760e7fab89753126cb5fd059ed6cfe55c8f2e6c6
4
- data.tar.gz: 39873c0d14eff9d6e615f6e2f13e7e30331f0e97db1162b613047782a582ff6c
3
+ metadata.gz: c754bbf3a24a049ce269017c82ef90b295b0503cb05cc0e652c0101ce68df484
4
+ data.tar.gz: c3df8efb661ff08e0525da943062882a7a2b467302895f09cbb5dbab38383927
5
5
  SHA512:
6
- metadata.gz: f35ffb41ddd9990cd1c2e8c4ad08018a5bdd63c8ec222bfce021ede2c67dfa9355fbc7f1102f014c555d0df46501877b01f2767aadf674896635bd7fa5bab355
7
- data.tar.gz: e431693ee45cf65ab3c63931c5c4a69675ddafc8038f90cda3dfb7dacec7449f48a65a41bc12f56996f8e697f80d1a896243e97aa37c96085107491099dabc05
6
+ metadata.gz: 803d3a5bb7ca76c9f51a268d22d485c1455b8ba7ebbe16aa3c5af8eabd63fddef273810ec10fa682b7cf606094b30c1ce681468d2a48a190d546c81a6eb779ca
7
+ data.tar.gz: 6781db79ba3fce1c75f13e8587ceffe8e26d0da276c0c1bbf175f942a9e8e9f1b742884413aabcc6b719a2c010c4156e601aa4577b9604e6edcd7959c67447ec
data/CHANGELOG.md CHANGED
@@ -1,5 +1,19 @@
1
1
  # Changelog
2
2
 
3
+ ## [0.5.0] - 2025-03-10
4
+
5
+ ### Added
6
+ - Added repository directory structure visualization with `--show-structure` / `-s` option
7
+ - Created `DirectoryStructureBuilder` class to generate tree views of repositories
8
+ - Added `generate_directory_structure` method to the Generator class
9
+ - Added tests for directory structure visualization
10
+
11
+ ### Changed
12
+ - Enhanced documentation with directory structure visualization examples
13
+ - Updated CLI help with the new option
14
+
15
+ ---
16
+
3
17
  ## [0.4.0] - 2025-03-03
4
18
 
5
19
  ### Added
data/README.md CHANGED
@@ -1,3 +1,6 @@
1
+ [![Gem Version](https://badge.fury.io/rb/gitingest.svg?icon=si%3Arubygems)](https://badge.fury.io/rb/gitingest)
2
+ ![Gem Total Downloads](https://img.shields.io/gem/dt/gitingest?style=flat-square&link=https%3A%2F%2Frubygems.org%2Fgems%2Fgitingest)
3
+
1
4
  # Gitingest
2
5
 
3
6
  Gitingest is a Ruby gem that fetches files from a GitHub repository and generates a consolidated text prompt, which can be used as input for large language models, documentation generation, or other purposes.
@@ -45,6 +48,9 @@ gitingest --repository user/repo -T 4
45
48
  # Set thread pool shutdown timeout
46
49
  gitingest --repository user/repo -W 120
47
50
 
51
+ # Show repository directory structure
52
+ gitingest --repository user/repo -s
53
+
48
54
  # Combine threading options
49
55
  gitingest --repository user/repo -T 8 -W 90
50
56
 
@@ -62,12 +68,21 @@ gitingest --repository user/repo --verbose
62
68
  - `-o, --output FILE`: Output file for the prompt [Default: reponame_prompt.txt]
63
69
  - `-e, --exclude PATTERN`: File patterns to exclude (comma separated)
64
70
  - `-b, --branch BRANCH`: Repository branch [Default: main]
71
+ - `-s, --show-structure`: Show repository directory structure instead of generating prompt
65
72
  - `-T, --threads COUNT`: Number of concurrent threads [Default: auto-detected]
66
73
  - `-W, --thread-timeout SECONDS`: Thread pool shutdown timeout [Default: 60]
67
74
  - `-q, --quiet`: Reduce logging to errors only
68
75
  - `-v, --verbose`: Increase logging verbosity
69
76
  - `-h, --help`: Show help message
70
77
 
78
+ ### Directory Structure Visualization
79
+
80
+ ```bash
81
+ gitingest --repository user/repo --show-structure
82
+ ```
83
+
84
+ This will display a tree view of the repository's structure:
85
+
71
86
  ### As a Library
72
87
 
73
88
  ```ruby
@@ -145,4 +160,4 @@ Inspired by [`cyclotruc/gitingest`](https://github.com/cyclotruc/gitingest).
145
160
 
146
161
  ## License
147
162
 
148
- The gem is available as open source under the terms of the [MIT License](https://opensource.org/licenses/MIT).
163
+ The gem is available as open source under the terms of the [MIT License](https://opensource.org/licenses/MIT).
data/bin/gitingest CHANGED
@@ -39,6 +39,10 @@ parser = OptionParser.new do |opts|
39
39
  options[:thread_timeout] = timeout
40
40
  end
41
41
 
42
+ opts.on("-s", "--show-structure", "Show repository directory structure") do
43
+ options[:show_structure] = true
44
+ end
45
+
42
46
  opts.on("-q", "--quiet", "Reduce logging to errors only") do
43
47
  options[:quiet] = true
44
48
  end
@@ -58,6 +62,7 @@ parser = OptionParser.new do |opts|
58
62
  opts.separator " gitingest -r user/repo -t YOUR_TOKEN # With GitHub token for private repositories"
59
63
  opts.separator " gitingest -r user/repo -o custom_prompt.txt # Custom output file"
60
64
  opts.separator " gitingest -r user/repo -T 8 # Use 8 threads for processing"
65
+ opts.separator " gitingest -r user/repo -s # Show repository directory structure"
61
66
  end
62
67
 
63
68
  begin
data/index.html CHANGED
@@ -6,6 +6,7 @@
6
6
  <title>Gitingest - GitHub Repository Fetcher and Prompt Generator</title>
7
7
  <link rel="stylesheet" href="https://cdnjs.cloudflare.com/ajax/libs/github-markdown-css/5.2.0/github-markdown.min.css">
8
8
  <style>
9
+ /* Styles remain the same */
9
10
  :root {
10
11
  --bg-color: #0d1117;
11
12
  --text-color: #c9d1d9;
@@ -176,7 +177,7 @@
176
177
  <div class="header">
177
178
  <div class="logo">G</div>
178
179
  <div>
179
- <h1>Gitingest <span class="version-badge">v0.3.0</span></h1>
180
+ <h1>Gitingest <span class="version-badge">v0.5.0</span></h1>
180
181
  <p>A Ruby gem that fetches files from a GitHub repository and generates a consolidated text prompt for LLMs</p>
181
182
  </div>
182
183
  </div>
@@ -213,6 +214,18 @@ gitingest --repository user/repo --branch develop
213
214
  # Exclude additional patterns
214
215
  gitingest --repository user/repo --exclude "*.md,docs/"
215
216
 
217
+ # Show repository directory structure
218
+ gitingest --repository user/repo -s
219
+
220
+ # Control the number of threads
221
+ gitingest --repository user/repo -T 4
222
+
223
+ # Set thread pool shutdown timeout
224
+ gitingest --repository user/repo -W 120
225
+
226
+ # Combine threading options
227
+ gitingest --repository user/repo -T 8 -W 90
228
+
216
229
  # Quiet mode
217
230
  gitingest --repository user/repo --quiet
218
231
 
@@ -226,19 +239,54 @@ gitingest --repository user/repo --verbose</code></pre>
226
239
  <li><code>-o, --output FILE</code>: Output file for the prompt [Default: reponame_prompt.txt]</li>
227
240
  <li><code>-e, --exclude PATTERN</code>: File patterns to exclude (comma separated)</li>
228
241
  <li><code>-b, --branch BRANCH</code>: Repository branch [Default: main]</li>
242
+ <li><code>-s, --show-structure</code>: Show repository directory structure</li>
243
+ <li><code>-T, --threads COUNT</code>: Number of concurrent threads [Default: auto-detected]</li>
244
+ <li><code>-W, --thread-timeout SECONDS</code>: Thread pool shutdown timeout [Default: 60]</li>
245
+ <li><code>-q, --quiet</code>: Reduce logging to errors only</li>
246
+ <li><code>-v, --verbose</code>: Increase logging verbosity</li>
229
247
  <li><code>-h, --help</code>: Show help message</li>
230
248
  </ul>
231
249
 
250
+ <h3>Directory Structure Visualization</h3>
251
+ <p>You can visualize the structure of a repository using the <code>--show-structure</code> option:</p>
252
+ <pre><code>gitingest --repository user/repo --show-structure</code></pre>
253
+
254
+ <p>This will display a tree view of the repository's structure, for example:</p>
255
+ <pre><code>Directory structure:
256
+ └── repo-name/
257
+ ├── README.md
258
+ ├── LICENSE
259
+ ├── lib/
260
+ │ ├── repo-name.rb
261
+ │ └── repo-name/
262
+ │ └── version.rb
263
+ ├── bin/
264
+ │ └── console
265
+ └── spec/
266
+ ├── spec_helper.rb
267
+ └── repo-name_spec.rb</code></pre>
268
+
232
269
  <h3>As a Library</h3>
233
270
  <pre><code>require "gitingest"
234
271
 
235
- # Basic usage
272
+ # Basic usage - write to a file
236
273
  generator = Gitingest::Generator.new(
237
274
  repository: "user/repo",
238
275
  token: "YOUR_GITHUB_TOKEN" # optional
239
276
  )
277
+
278
+ # Run the full workflow (fetch repository and generate file)
240
279
  generator.run
241
280
 
281
+ # OR generate file only (if you need the output path)
282
+ output_path = generator.generate_file
283
+
284
+ # Get content as a string (for in-memory processing)
285
+ content = generator.generate_prompt
286
+
287
+ # Generate and get repository directory structure
288
+ structure = generator.generate_directory_structure
289
+
242
290
  # With custom options
243
291
  generator = Gitingest::Generator.new(
244
292
  repository: "user/repo",
@@ -246,26 +294,32 @@ generator = Gitingest::Generator.new(
246
294
  output_file: "my_prompt.txt",
247
295
  branch: "develop",
248
296
  exclude: ["*.md", "docs/"],
249
- quiet: true # or verbose: true
297
+ threads: 4, # control concurrency
298
+ thread_timeout: 120, # custom thread timeout
299
+ quiet: true, # or verbose: true
300
+ show_structure: true # show directory structure instead of generating prompt
250
301
  )
251
- generator.run
252
302
 
253
303
  # With custom logger
254
304
  custom_logger = Logger.new("gitingest.log")
255
305
  generator = Gitingest::Generator.new(
256
306
  repository: "user/repo",
257
307
  logger: custom_logger
258
- )
259
- generator.run</code></pre>
308
+ )</code></pre>
260
309
 
261
310
  <h2>Features</h2>
262
311
  <ul>
263
312
  <li>Fetches all files from a GitHub repository based on the given branch</li>
264
313
  <li>Automatically excludes common binary files and system files by default</li>
265
314
  <li>Allows custom exclusion patterns for specific file extensions or directories</li>
266
- <li>Uses concurrent processing for faster downloads</li>
267
- <li>Handles GitHub API rate limiting with automatic retry</li>
315
+ <li>Uses concurrent processing with configurable thread count for faster downloads</li>
316
+ <li>Shows real-time progress with visual bar, ETA, and processing rate</li>
317
+ <li>Handles GitHub API rate limiting with automatic retry and exponential backoff</li>
318
+ <li>Optimizes memory usage with buffered writes and thread-local buffers</li>
319
+ <li>Intelligently prioritizes files for better thread distribution</li>
268
320
  <li>Generates a clean, formatted output file with file paths and content</li>
321
+ <li>Provides both file-based and string-based output options</li>
322
+ <li>Visualizes repository directory structure in a tree format</li>
269
323
  </ul>
270
324
 
271
325
  <h2>Default Exclusion Patterns</h2>
@@ -290,6 +344,52 @@ generator.run</code></pre>
290
344
  <div class="changelog">
291
345
  <h2>Changelog</h2>
292
346
 
347
+ <div class="changelog-item">
348
+ <div>
349
+ <span class="changelog-version">v0.5.0</span>
350
+ <span class="changelog-date">- March 4, 2025</span>
351
+ </div>
352
+ <ul class="changelog-list">
353
+ <li>Added repository directory structure visualization with <code>--show-structure</code> option</li>
354
+ <li>Created <code>DirectoryStructureBuilder</code> class to generate tree views of repositories</li>
355
+ <li>Added <code>generate_directory_structure</code> method to the Generator class</li>
356
+ <li>Added tests for the directory structure visualization</li>
357
+ <li>Updated documentation with directory structure visualization examples</li>
358
+ </ul>
359
+ </div>
360
+
361
+ <div class="changelog-item">
362
+ <div>
363
+ <span class="changelog-version">v0.4.0</span>
364
+ <span class="changelog-date">- March 4, 2025</span>
365
+ </div>
366
+ <ul class="changelog-list">
367
+ <li>Added <code>generate_prompt</code> method for in-memory content generation without file I/O</li>
368
+ <li>Integrated visual progress bar with file processing rate reporting</li>
369
+ <li>Added human-readable time formatting for progress estimates</li>
370
+ <li>Enhanced test coverage for multithreaded operations</li>
371
+ <li>Refactored <code>process_content_to_output</code> for better code reuse</li>
372
+ <li>Improved thread management to handle various error conditions gracefully</li>
373
+ <li>Fixed thread pool shutdown issues and race conditions</li>
374
+ </ul>
375
+ </div>
376
+
377
+ <div class="changelog-item">
378
+ <div>
379
+ <span class="changelog-version">v0.3.1</span>
380
+ <span class="changelog-date">- March 3, 2025</span>
381
+ </div>
382
+ <ul class="changelog-list">
383
+ <li>Introduced configurable threading options with <code>:threads</code> and <code>:thread_timeout</code></li>
384
+ <li>Implemented thread-local buffers to reduce mutex contention during file processing</li>
385
+ <li>Added exponential backoff with jitter for rate-limited API requests</li>
386
+ <li>Improved progress indicator with estimated time remaining</li>
387
+ <li>Increased <code>BUFFER_SIZE</code> from 100 to 250 to reduce I/O operations</li>
388
+ <li>Optimized file exclusion check using a combined regex for faster matching</li>
389
+ <li>Improved thread pool efficiency by prioritizing smaller files first</li>
390
+ </ul>
391
+ </div>
392
+
293
393
  <div class="changelog-item">
294
394
  <div>
295
395
  <span class="changelog-version">v0.3.0</span>
@@ -298,7 +398,7 @@ generator.run</code></pre>
298
398
  <ul class="changelog-list">
299
399
  <li>Added <code>faraday-retry</code> gem dependency for better API rate limit handling</li>
300
400
  <li>Implemented thread-safe buffer management with mutex locks</li>
301
- <li>Added new <code>ProgressIndicator</code> class for better CLI progress reporting (showing percentages)</li>
401
+ <li>Added new <code>ProgressIndicator</code> class for better CLI progress reporting</li>
302
402
  <li>Improved memory efficiency with configurable buffer size</li>
303
403
  <li>Enhanced code organization with dedicated methods for file content formatting</li>
304
404
  <li>Added comprehensive method documentation and parameter descriptions</li>
@@ -323,26 +423,6 @@ generator.run</code></pre>
323
423
  <li>Enforced a 1000 file limit to prevent memory overload</li>
324
424
  </ul>
325
425
  </div>
326
-
327
- <div class="changelog-item">
328
- <div>
329
- <span class="changelog-version">v0.1.0</span>
330
- <span class="changelog-date">- March 2, 2025</span>
331
- </div>
332
- <ul class="changelog-list">
333
- <li>Initial release of Gitingest</li>
334
- <li>Core functionality to fetch and process GitHub repository files</li>
335
- <li>Command-line interface for easy interaction</li>
336
- <li>Smart file filtering with default exclusions for common non-code files</li>
337
- <li>Concurrent processing for improved performance</li>
338
- <li>Custom exclude patterns support</li>
339
- <li>GitHub authentication via access tokens</li>
340
- <li>Automatic rate limit handling with retry mechanism</li>
341
- <li>Repository prompt generation with file separation markers</li>
342
- <li>Support for custom branch selection</li>
343
- <li>Custom output file naming options</li>
344
- </ul>
345
- </div>
346
426
  </div>
347
427
 
348
428
  <h2>Contributing</h2>
@@ -357,7 +437,7 @@ generator.run</code></pre>
357
437
 
358
438
  <footer>
359
439
  <p>© 2025 David Santangelo</p>
360
- <p>Last updated: March 2, 2025</p>
440
+ <p>Last updated: March 4, 2025</p>
361
441
  </footer>
362
442
  </body>
363
443
  </html>
@@ -96,6 +96,7 @@ module Gitingest
96
96
  # @option options [Logger] :logger Custom logger instance
97
97
  # @option options [Integer] :threads Number of threads to use (default: auto-detected)
98
98
  # @option options [Integer] :thread_timeout Seconds to wait for thread pool shutdown (default: 60)
99
+ # @option options [Boolean] :show_structure Show repository directory structure (default: false)
99
100
  def initialize(options = {})
100
101
  @options = options
101
102
  @repo_files = []
@@ -109,6 +110,12 @@ module Gitingest
109
110
  # Main execution method for command line
110
111
  def run
111
112
  fetch_repository_contents
113
+
114
+ if @options[:show_structure]
115
+ puts generate_directory_structure
116
+ return
117
+ end
118
+
112
119
  generate_file
113
120
  end
114
121
 
@@ -144,6 +151,21 @@ module Gitingest
144
151
  result
145
152
  end
146
153
 
154
+ # Generate a textual representation of the repository's directory structure
155
+ #
156
+ # @return [String] The directory structure as a formatted string
157
+ def generate_directory_structure
158
+ fetch_repository_contents if @repo_files.empty?
159
+
160
+ @logger.info "Generating directory structure for #{@options[:repository]}"
161
+
162
+ repo_name = @options[:repository].split("/").last
163
+ structure = DirectoryStructureBuilder.new(repo_name, @repo_files).build
164
+
165
+ @logger.info "\n"
166
+ structure
167
+ end
168
+
147
169
  private
148
170
 
149
171
  # Set up logging based on verbosity options
@@ -169,6 +191,7 @@ module Gitingest
169
191
  @options[:exclude] ||= []
170
192
  @options[:threads] ||= DEFAULT_THREAD_COUNT
171
193
  @options[:thread_timeout] ||= DEFAULT_THREAD_TIMEOUT
194
+ @options[:show_structure] ||= false
172
195
  @excluded_patterns = DEFAULT_EXCLUDES + @options[:exclude]
173
196
  end
174
197
 
@@ -441,4 +464,57 @@ module Gitingest
441
464
  end
442
465
  end
443
466
  end
467
+
468
+ # Helper class to build directory structure visualization
469
+ class DirectoryStructureBuilder
470
+ def initialize(root_name, files)
471
+ @root_name = root_name
472
+ @files = files.map(&:path)
473
+ end
474
+
475
+ def build
476
+ tree = { @root_name => {} }
477
+
478
+ @files.sort.each do |path|
479
+ parts = path.split("/")
480
+ current = tree[@root_name]
481
+
482
+ parts.each do |part|
483
+ if part == parts.last
484
+ current[part] = nil
485
+ else
486
+ current[part] ||= {}
487
+ current = current[part]
488
+ end
489
+ end
490
+ end
491
+
492
+ output = ["Directory structure:"]
493
+ render_tree(tree, "", output)
494
+ output.join("\n")
495
+ end
496
+
497
+ private
498
+
499
+ def render_tree(tree, prefix, output)
500
+ return if tree.nil?
501
+
502
+ tree.keys.each_with_index do |key, index|
503
+ is_last = index == tree.keys.size - 1
504
+ current_prefix = prefix
505
+
506
+ if prefix.empty?
507
+ output << "└── #{key}/"
508
+ current_prefix = " "
509
+ else
510
+ connector = is_last ? "└── " : "├── "
511
+ item = tree[key].is_a?(Hash) ? "#{key}/" : key
512
+ output << "#{prefix}#{connector}#{item}"
513
+ current_prefix = prefix + (is_last ? " " : "│ ")
514
+ end
515
+
516
+ render_tree(tree[key], current_prefix, output) if tree[key].is_a?(Hash)
517
+ end
518
+ end
519
+ end
444
520
  end
@@ -1,5 +1,5 @@
1
1
  # frozen_string_literal: true
2
2
 
3
3
  module Gitingest
4
- VERSION = "0.4.0"
4
+ VERSION = "0.5.0"
5
5
  end
metadata CHANGED
@@ -1,14 +1,14 @@
1
1
  --- !ruby/object:Gem::Specification
2
2
  name: gitingest
3
3
  version: !ruby/object:Gem::Version
4
- version: 0.4.0
4
+ version: 0.5.0
5
5
  platform: ruby
6
6
  authors:
7
7
  - Davide Santangelo
8
8
  autorequire:
9
9
  bindir: bin
10
10
  cert_chain: []
11
- date: 2025-03-03 00:00:00.000000000 Z
11
+ date: 2025-03-10 00:00:00.000000000 Z
12
12
  dependencies:
13
13
  - !ruby/object:Gem::Dependency
14
14
  name: concurrent-ruby