gitingest 0.4.0 → 0.5.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +4 -4
- data/CHANGELOG.md +14 -0
- data/README.md +16 -1
- data/bin/gitingest +5 -0
- data/index.html +110 -30
- data/lib/gitingest/generator.rb +76 -0
- data/lib/gitingest/version.rb +1 -1
- metadata +2 -2
checksums.yaml
CHANGED
@@ -1,7 +1,7 @@
|
|
1
1
|
---
|
2
2
|
SHA256:
|
3
|
-
metadata.gz:
|
4
|
-
data.tar.gz:
|
3
|
+
metadata.gz: c754bbf3a24a049ce269017c82ef90b295b0503cb05cc0e652c0101ce68df484
|
4
|
+
data.tar.gz: c3df8efb661ff08e0525da943062882a7a2b467302895f09cbb5dbab38383927
|
5
5
|
SHA512:
|
6
|
-
metadata.gz:
|
7
|
-
data.tar.gz:
|
6
|
+
metadata.gz: 803d3a5bb7ca76c9f51a268d22d485c1455b8ba7ebbe16aa3c5af8eabd63fddef273810ec10fa682b7cf606094b30c1ce681468d2a48a190d546c81a6eb779ca
|
7
|
+
data.tar.gz: 6781db79ba3fce1c75f13e8587ceffe8e26d0da276c0c1bbf175f942a9e8e9f1b742884413aabcc6b719a2c010c4156e601aa4577b9604e6edcd7959c67447ec
|
data/CHANGELOG.md
CHANGED
@@ -1,5 +1,19 @@
|
|
1
1
|
# Changelog
|
2
2
|
|
3
|
+
## [0.5.0] - 2025-03-10
|
4
|
+
|
5
|
+
### Added
|
6
|
+
- Added repository directory structure visualization with `--show-structure` / `-s` option
|
7
|
+
- Created `DirectoryStructureBuilder` class to generate tree views of repositories
|
8
|
+
- Added `generate_directory_structure` method to the Generator class
|
9
|
+
- Added tests for directory structure visualization
|
10
|
+
|
11
|
+
### Changed
|
12
|
+
- Enhanced documentation with directory structure visualization examples
|
13
|
+
- Updated CLI help with the new option
|
14
|
+
|
15
|
+
---
|
16
|
+
|
3
17
|
## [0.4.0] - 2025-03-03
|
4
18
|
|
5
19
|
### Added
|
data/README.md
CHANGED
@@ -1,3 +1,6 @@
|
|
1
|
+
[](https://badge.fury.io/rb/gitingest)
|
2
|
+

|
3
|
+
|
1
4
|
# Gitingest
|
2
5
|
|
3
6
|
Gitingest is a Ruby gem that fetches files from a GitHub repository and generates a consolidated text prompt, which can be used as input for large language models, documentation generation, or other purposes.
|
@@ -45,6 +48,9 @@ gitingest --repository user/repo -T 4
|
|
45
48
|
# Set thread pool shutdown timeout
|
46
49
|
gitingest --repository user/repo -W 120
|
47
50
|
|
51
|
+
# Show repository directory structure
|
52
|
+
gitingest --repository user/repo -s
|
53
|
+
|
48
54
|
# Combine threading options
|
49
55
|
gitingest --repository user/repo -T 8 -W 90
|
50
56
|
|
@@ -62,12 +68,21 @@ gitingest --repository user/repo --verbose
|
|
62
68
|
- `-o, --output FILE`: Output file for the prompt [Default: reponame_prompt.txt]
|
63
69
|
- `-e, --exclude PATTERN`: File patterns to exclude (comma separated)
|
64
70
|
- `-b, --branch BRANCH`: Repository branch [Default: main]
|
71
|
+
- `-s, --show-structure`: Show repository directory structure instead of generating prompt
|
65
72
|
- `-T, --threads COUNT`: Number of concurrent threads [Default: auto-detected]
|
66
73
|
- `-W, --thread-timeout SECONDS`: Thread pool shutdown timeout [Default: 60]
|
67
74
|
- `-q, --quiet`: Reduce logging to errors only
|
68
75
|
- `-v, --verbose`: Increase logging verbosity
|
69
76
|
- `-h, --help`: Show help message
|
70
77
|
|
78
|
+
### Directory Structure Visualization
|
79
|
+
|
80
|
+
```bash
|
81
|
+
gitingest --repository user/repo --show-structure
|
82
|
+
```
|
83
|
+
|
84
|
+
This will display a tree view of the repository's structure:
|
85
|
+
|
71
86
|
### As a Library
|
72
87
|
|
73
88
|
```ruby
|
@@ -145,4 +160,4 @@ Inspired by [`cyclotruc/gitingest`](https://github.com/cyclotruc/gitingest).
|
|
145
160
|
|
146
161
|
## License
|
147
162
|
|
148
|
-
The gem is available as open source under the terms of the [MIT License](https://opensource.org/licenses/MIT).
|
163
|
+
The gem is available as open source under the terms of the [MIT License](https://opensource.org/licenses/MIT).
|
data/bin/gitingest
CHANGED
@@ -39,6 +39,10 @@ parser = OptionParser.new do |opts|
|
|
39
39
|
options[:thread_timeout] = timeout
|
40
40
|
end
|
41
41
|
|
42
|
+
opts.on("-s", "--show-structure", "Show repository directory structure") do
|
43
|
+
options[:show_structure] = true
|
44
|
+
end
|
45
|
+
|
42
46
|
opts.on("-q", "--quiet", "Reduce logging to errors only") do
|
43
47
|
options[:quiet] = true
|
44
48
|
end
|
@@ -58,6 +62,7 @@ parser = OptionParser.new do |opts|
|
|
58
62
|
opts.separator " gitingest -r user/repo -t YOUR_TOKEN # With GitHub token for private repositories"
|
59
63
|
opts.separator " gitingest -r user/repo -o custom_prompt.txt # Custom output file"
|
60
64
|
opts.separator " gitingest -r user/repo -T 8 # Use 8 threads for processing"
|
65
|
+
opts.separator " gitingest -r user/repo -s # Show repository directory structure"
|
61
66
|
end
|
62
67
|
|
63
68
|
begin
|
data/index.html
CHANGED
@@ -6,6 +6,7 @@
|
|
6
6
|
<title>Gitingest - GitHub Repository Fetcher and Prompt Generator</title>
|
7
7
|
<link rel="stylesheet" href="https://cdnjs.cloudflare.com/ajax/libs/github-markdown-css/5.2.0/github-markdown.min.css">
|
8
8
|
<style>
|
9
|
+
/* Styles remain the same */
|
9
10
|
:root {
|
10
11
|
--bg-color: #0d1117;
|
11
12
|
--text-color: #c9d1d9;
|
@@ -176,7 +177,7 @@
|
|
176
177
|
<div class="header">
|
177
178
|
<div class="logo">G</div>
|
178
179
|
<div>
|
179
|
-
<h1>Gitingest <span class="version-badge">v0.
|
180
|
+
<h1>Gitingest <span class="version-badge">v0.5.0</span></h1>
|
180
181
|
<p>A Ruby gem that fetches files from a GitHub repository and generates a consolidated text prompt for LLMs</p>
|
181
182
|
</div>
|
182
183
|
</div>
|
@@ -213,6 +214,18 @@ gitingest --repository user/repo --branch develop
|
|
213
214
|
# Exclude additional patterns
|
214
215
|
gitingest --repository user/repo --exclude "*.md,docs/"
|
215
216
|
|
217
|
+
# Show repository directory structure
|
218
|
+
gitingest --repository user/repo -s
|
219
|
+
|
220
|
+
# Control the number of threads
|
221
|
+
gitingest --repository user/repo -T 4
|
222
|
+
|
223
|
+
# Set thread pool shutdown timeout
|
224
|
+
gitingest --repository user/repo -W 120
|
225
|
+
|
226
|
+
# Combine threading options
|
227
|
+
gitingest --repository user/repo -T 8 -W 90
|
228
|
+
|
216
229
|
# Quiet mode
|
217
230
|
gitingest --repository user/repo --quiet
|
218
231
|
|
@@ -226,19 +239,54 @@ gitingest --repository user/repo --verbose</code></pre>
|
|
226
239
|
<li><code>-o, --output FILE</code>: Output file for the prompt [Default: reponame_prompt.txt]</li>
|
227
240
|
<li><code>-e, --exclude PATTERN</code>: File patterns to exclude (comma separated)</li>
|
228
241
|
<li><code>-b, --branch BRANCH</code>: Repository branch [Default: main]</li>
|
242
|
+
<li><code>-s, --show-structure</code>: Show repository directory structure</li>
|
243
|
+
<li><code>-T, --threads COUNT</code>: Number of concurrent threads [Default: auto-detected]</li>
|
244
|
+
<li><code>-W, --thread-timeout SECONDS</code>: Thread pool shutdown timeout [Default: 60]</li>
|
245
|
+
<li><code>-q, --quiet</code>: Reduce logging to errors only</li>
|
246
|
+
<li><code>-v, --verbose</code>: Increase logging verbosity</li>
|
229
247
|
<li><code>-h, --help</code>: Show help message</li>
|
230
248
|
</ul>
|
231
249
|
|
250
|
+
<h3>Directory Structure Visualization</h3>
|
251
|
+
<p>You can visualize the structure of a repository using the <code>--show-structure</code> option:</p>
|
252
|
+
<pre><code>gitingest --repository user/repo --show-structure</code></pre>
|
253
|
+
|
254
|
+
<p>This will display a tree view of the repository's structure, for example:</p>
|
255
|
+
<pre><code>Directory structure:
|
256
|
+
└── repo-name/
|
257
|
+
├── README.md
|
258
|
+
├── LICENSE
|
259
|
+
├── lib/
|
260
|
+
│ ├── repo-name.rb
|
261
|
+
│ └── repo-name/
|
262
|
+
│ └── version.rb
|
263
|
+
├── bin/
|
264
|
+
│ └── console
|
265
|
+
└── spec/
|
266
|
+
├── spec_helper.rb
|
267
|
+
└── repo-name_spec.rb</code></pre>
|
268
|
+
|
232
269
|
<h3>As a Library</h3>
|
233
270
|
<pre><code>require "gitingest"
|
234
271
|
|
235
|
-
# Basic usage
|
272
|
+
# Basic usage - write to a file
|
236
273
|
generator = Gitingest::Generator.new(
|
237
274
|
repository: "user/repo",
|
238
275
|
token: "YOUR_GITHUB_TOKEN" # optional
|
239
276
|
)
|
277
|
+
|
278
|
+
# Run the full workflow (fetch repository and generate file)
|
240
279
|
generator.run
|
241
280
|
|
281
|
+
# OR generate file only (if you need the output path)
|
282
|
+
output_path = generator.generate_file
|
283
|
+
|
284
|
+
# Get content as a string (for in-memory processing)
|
285
|
+
content = generator.generate_prompt
|
286
|
+
|
287
|
+
# Generate and get repository directory structure
|
288
|
+
structure = generator.generate_directory_structure
|
289
|
+
|
242
290
|
# With custom options
|
243
291
|
generator = Gitingest::Generator.new(
|
244
292
|
repository: "user/repo",
|
@@ -246,26 +294,32 @@ generator = Gitingest::Generator.new(
|
|
246
294
|
output_file: "my_prompt.txt",
|
247
295
|
branch: "develop",
|
248
296
|
exclude: ["*.md", "docs/"],
|
249
|
-
|
297
|
+
threads: 4, # control concurrency
|
298
|
+
thread_timeout: 120, # custom thread timeout
|
299
|
+
quiet: true, # or verbose: true
|
300
|
+
show_structure: true # show directory structure instead of generating prompt
|
250
301
|
)
|
251
|
-
generator.run
|
252
302
|
|
253
303
|
# With custom logger
|
254
304
|
custom_logger = Logger.new("gitingest.log")
|
255
305
|
generator = Gitingest::Generator.new(
|
256
306
|
repository: "user/repo",
|
257
307
|
logger: custom_logger
|
258
|
-
)
|
259
|
-
generator.run</code></pre>
|
308
|
+
)</code></pre>
|
260
309
|
|
261
310
|
<h2>Features</h2>
|
262
311
|
<ul>
|
263
312
|
<li>Fetches all files from a GitHub repository based on the given branch</li>
|
264
313
|
<li>Automatically excludes common binary files and system files by default</li>
|
265
314
|
<li>Allows custom exclusion patterns for specific file extensions or directories</li>
|
266
|
-
<li>Uses concurrent processing for faster downloads</li>
|
267
|
-
<li>
|
315
|
+
<li>Uses concurrent processing with configurable thread count for faster downloads</li>
|
316
|
+
<li>Shows real-time progress with visual bar, ETA, and processing rate</li>
|
317
|
+
<li>Handles GitHub API rate limiting with automatic retry and exponential backoff</li>
|
318
|
+
<li>Optimizes memory usage with buffered writes and thread-local buffers</li>
|
319
|
+
<li>Intelligently prioritizes files for better thread distribution</li>
|
268
320
|
<li>Generates a clean, formatted output file with file paths and content</li>
|
321
|
+
<li>Provides both file-based and string-based output options</li>
|
322
|
+
<li>Visualizes repository directory structure in a tree format</li>
|
269
323
|
</ul>
|
270
324
|
|
271
325
|
<h2>Default Exclusion Patterns</h2>
|
@@ -290,6 +344,52 @@ generator.run</code></pre>
|
|
290
344
|
<div class="changelog">
|
291
345
|
<h2>Changelog</h2>
|
292
346
|
|
347
|
+
<div class="changelog-item">
|
348
|
+
<div>
|
349
|
+
<span class="changelog-version">v0.5.0</span>
|
350
|
+
<span class="changelog-date">- March 4, 2025</span>
|
351
|
+
</div>
|
352
|
+
<ul class="changelog-list">
|
353
|
+
<li>Added repository directory structure visualization with <code>--show-structure</code> option</li>
|
354
|
+
<li>Created <code>DirectoryStructureBuilder</code> class to generate tree views of repositories</li>
|
355
|
+
<li>Added <code>generate_directory_structure</code> method to the Generator class</li>
|
356
|
+
<li>Added tests for the directory structure visualization</li>
|
357
|
+
<li>Updated documentation with directory structure visualization examples</li>
|
358
|
+
</ul>
|
359
|
+
</div>
|
360
|
+
|
361
|
+
<div class="changelog-item">
|
362
|
+
<div>
|
363
|
+
<span class="changelog-version">v0.4.0</span>
|
364
|
+
<span class="changelog-date">- March 4, 2025</span>
|
365
|
+
</div>
|
366
|
+
<ul class="changelog-list">
|
367
|
+
<li>Added <code>generate_prompt</code> method for in-memory content generation without file I/O</li>
|
368
|
+
<li>Integrated visual progress bar with file processing rate reporting</li>
|
369
|
+
<li>Added human-readable time formatting for progress estimates</li>
|
370
|
+
<li>Enhanced test coverage for multithreaded operations</li>
|
371
|
+
<li>Refactored <code>process_content_to_output</code> for better code reuse</li>
|
372
|
+
<li>Improved thread management to handle various error conditions gracefully</li>
|
373
|
+
<li>Fixed thread pool shutdown issues and race conditions</li>
|
374
|
+
</ul>
|
375
|
+
</div>
|
376
|
+
|
377
|
+
<div class="changelog-item">
|
378
|
+
<div>
|
379
|
+
<span class="changelog-version">v0.3.1</span>
|
380
|
+
<span class="changelog-date">- March 3, 2025</span>
|
381
|
+
</div>
|
382
|
+
<ul class="changelog-list">
|
383
|
+
<li>Introduced configurable threading options with <code>:threads</code> and <code>:thread_timeout</code></li>
|
384
|
+
<li>Implemented thread-local buffers to reduce mutex contention during file processing</li>
|
385
|
+
<li>Added exponential backoff with jitter for rate-limited API requests</li>
|
386
|
+
<li>Improved progress indicator with estimated time remaining</li>
|
387
|
+
<li>Increased <code>BUFFER_SIZE</code> from 100 to 250 to reduce I/O operations</li>
|
388
|
+
<li>Optimized file exclusion check using a combined regex for faster matching</li>
|
389
|
+
<li>Improved thread pool efficiency by prioritizing smaller files first</li>
|
390
|
+
</ul>
|
391
|
+
</div>
|
392
|
+
|
293
393
|
<div class="changelog-item">
|
294
394
|
<div>
|
295
395
|
<span class="changelog-version">v0.3.0</span>
|
@@ -298,7 +398,7 @@ generator.run</code></pre>
|
|
298
398
|
<ul class="changelog-list">
|
299
399
|
<li>Added <code>faraday-retry</code> gem dependency for better API rate limit handling</li>
|
300
400
|
<li>Implemented thread-safe buffer management with mutex locks</li>
|
301
|
-
<li>Added new <code>ProgressIndicator</code> class for better CLI progress reporting
|
401
|
+
<li>Added new <code>ProgressIndicator</code> class for better CLI progress reporting</li>
|
302
402
|
<li>Improved memory efficiency with configurable buffer size</li>
|
303
403
|
<li>Enhanced code organization with dedicated methods for file content formatting</li>
|
304
404
|
<li>Added comprehensive method documentation and parameter descriptions</li>
|
@@ -323,26 +423,6 @@ generator.run</code></pre>
|
|
323
423
|
<li>Enforced a 1000 file limit to prevent memory overload</li>
|
324
424
|
</ul>
|
325
425
|
</div>
|
326
|
-
|
327
|
-
<div class="changelog-item">
|
328
|
-
<div>
|
329
|
-
<span class="changelog-version">v0.1.0</span>
|
330
|
-
<span class="changelog-date">- March 2, 2025</span>
|
331
|
-
</div>
|
332
|
-
<ul class="changelog-list">
|
333
|
-
<li>Initial release of Gitingest</li>
|
334
|
-
<li>Core functionality to fetch and process GitHub repository files</li>
|
335
|
-
<li>Command-line interface for easy interaction</li>
|
336
|
-
<li>Smart file filtering with default exclusions for common non-code files</li>
|
337
|
-
<li>Concurrent processing for improved performance</li>
|
338
|
-
<li>Custom exclude patterns support</li>
|
339
|
-
<li>GitHub authentication via access tokens</li>
|
340
|
-
<li>Automatic rate limit handling with retry mechanism</li>
|
341
|
-
<li>Repository prompt generation with file separation markers</li>
|
342
|
-
<li>Support for custom branch selection</li>
|
343
|
-
<li>Custom output file naming options</li>
|
344
|
-
</ul>
|
345
|
-
</div>
|
346
426
|
</div>
|
347
427
|
|
348
428
|
<h2>Contributing</h2>
|
@@ -357,7 +437,7 @@ generator.run</code></pre>
|
|
357
437
|
|
358
438
|
<footer>
|
359
439
|
<p>© 2025 David Santangelo</p>
|
360
|
-
<p>Last updated: March
|
440
|
+
<p>Last updated: March 4, 2025</p>
|
361
441
|
</footer>
|
362
442
|
</body>
|
363
443
|
</html>
|
data/lib/gitingest/generator.rb
CHANGED
@@ -96,6 +96,7 @@ module Gitingest
|
|
96
96
|
# @option options [Logger] :logger Custom logger instance
|
97
97
|
# @option options [Integer] :threads Number of threads to use (default: auto-detected)
|
98
98
|
# @option options [Integer] :thread_timeout Seconds to wait for thread pool shutdown (default: 60)
|
99
|
+
# @option options [Boolean] :show_structure Show repository directory structure (default: false)
|
99
100
|
def initialize(options = {})
|
100
101
|
@options = options
|
101
102
|
@repo_files = []
|
@@ -109,6 +110,12 @@ module Gitingest
|
|
109
110
|
# Main execution method for command line
|
110
111
|
def run
|
111
112
|
fetch_repository_contents
|
113
|
+
|
114
|
+
if @options[:show_structure]
|
115
|
+
puts generate_directory_structure
|
116
|
+
return
|
117
|
+
end
|
118
|
+
|
112
119
|
generate_file
|
113
120
|
end
|
114
121
|
|
@@ -144,6 +151,21 @@ module Gitingest
|
|
144
151
|
result
|
145
152
|
end
|
146
153
|
|
154
|
+
# Generate a textual representation of the repository's directory structure
|
155
|
+
#
|
156
|
+
# @return [String] The directory structure as a formatted string
|
157
|
+
def generate_directory_structure
|
158
|
+
fetch_repository_contents if @repo_files.empty?
|
159
|
+
|
160
|
+
@logger.info "Generating directory structure for #{@options[:repository]}"
|
161
|
+
|
162
|
+
repo_name = @options[:repository].split("/").last
|
163
|
+
structure = DirectoryStructureBuilder.new(repo_name, @repo_files).build
|
164
|
+
|
165
|
+
@logger.info "\n"
|
166
|
+
structure
|
167
|
+
end
|
168
|
+
|
147
169
|
private
|
148
170
|
|
149
171
|
# Set up logging based on verbosity options
|
@@ -169,6 +191,7 @@ module Gitingest
|
|
169
191
|
@options[:exclude] ||= []
|
170
192
|
@options[:threads] ||= DEFAULT_THREAD_COUNT
|
171
193
|
@options[:thread_timeout] ||= DEFAULT_THREAD_TIMEOUT
|
194
|
+
@options[:show_structure] ||= false
|
172
195
|
@excluded_patterns = DEFAULT_EXCLUDES + @options[:exclude]
|
173
196
|
end
|
174
197
|
|
@@ -441,4 +464,57 @@ module Gitingest
|
|
441
464
|
end
|
442
465
|
end
|
443
466
|
end
|
467
|
+
|
468
|
+
# Helper class to build directory structure visualization
|
469
|
+
class DirectoryStructureBuilder
|
470
|
+
def initialize(root_name, files)
|
471
|
+
@root_name = root_name
|
472
|
+
@files = files.map(&:path)
|
473
|
+
end
|
474
|
+
|
475
|
+
def build
|
476
|
+
tree = { @root_name => {} }
|
477
|
+
|
478
|
+
@files.sort.each do |path|
|
479
|
+
parts = path.split("/")
|
480
|
+
current = tree[@root_name]
|
481
|
+
|
482
|
+
parts.each do |part|
|
483
|
+
if part == parts.last
|
484
|
+
current[part] = nil
|
485
|
+
else
|
486
|
+
current[part] ||= {}
|
487
|
+
current = current[part]
|
488
|
+
end
|
489
|
+
end
|
490
|
+
end
|
491
|
+
|
492
|
+
output = ["Directory structure:"]
|
493
|
+
render_tree(tree, "", output)
|
494
|
+
output.join("\n")
|
495
|
+
end
|
496
|
+
|
497
|
+
private
|
498
|
+
|
499
|
+
def render_tree(tree, prefix, output)
|
500
|
+
return if tree.nil?
|
501
|
+
|
502
|
+
tree.keys.each_with_index do |key, index|
|
503
|
+
is_last = index == tree.keys.size - 1
|
504
|
+
current_prefix = prefix
|
505
|
+
|
506
|
+
if prefix.empty?
|
507
|
+
output << "└── #{key}/"
|
508
|
+
current_prefix = " "
|
509
|
+
else
|
510
|
+
connector = is_last ? "└── " : "├── "
|
511
|
+
item = tree[key].is_a?(Hash) ? "#{key}/" : key
|
512
|
+
output << "#{prefix}#{connector}#{item}"
|
513
|
+
current_prefix = prefix + (is_last ? " " : "│ ")
|
514
|
+
end
|
515
|
+
|
516
|
+
render_tree(tree[key], current_prefix, output) if tree[key].is_a?(Hash)
|
517
|
+
end
|
518
|
+
end
|
519
|
+
end
|
444
520
|
end
|
data/lib/gitingest/version.rb
CHANGED
metadata
CHANGED
@@ -1,14 +1,14 @@
|
|
1
1
|
--- !ruby/object:Gem::Specification
|
2
2
|
name: gitingest
|
3
3
|
version: !ruby/object:Gem::Version
|
4
|
-
version: 0.
|
4
|
+
version: 0.5.0
|
5
5
|
platform: ruby
|
6
6
|
authors:
|
7
7
|
- Davide Santangelo
|
8
8
|
autorequire:
|
9
9
|
bindir: bin
|
10
10
|
cert_chain: []
|
11
|
-
date: 2025-03-
|
11
|
+
date: 2025-03-10 00:00:00.000000000 Z
|
12
12
|
dependencies:
|
13
13
|
- !ruby/object:Gem::Dependency
|
14
14
|
name: concurrent-ruby
|