gitingest 0.3.1 → 0.5.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +4 -4
- data/CHANGELOG.md +34 -0
- data/README.md +41 -5
- data/bin/gitingest +24 -3
- data/index.html +110 -30
- data/lib/gitingest/generator.rb +159 -58
- data/lib/gitingest/version.rb +1 -1
- metadata +2 -2
checksums.yaml
CHANGED
@@ -1,7 +1,7 @@
|
|
1
1
|
---
|
2
2
|
SHA256:
|
3
|
-
metadata.gz:
|
4
|
-
data.tar.gz:
|
3
|
+
metadata.gz: c754bbf3a24a049ce269017c82ef90b295b0503cb05cc0e652c0101ce68df484
|
4
|
+
data.tar.gz: c3df8efb661ff08e0525da943062882a7a2b467302895f09cbb5dbab38383927
|
5
5
|
SHA512:
|
6
|
-
metadata.gz:
|
7
|
-
data.tar.gz:
|
6
|
+
metadata.gz: 803d3a5bb7ca76c9f51a268d22d485c1455b8ba7ebbe16aa3c5af8eabd63fddef273810ec10fa682b7cf606094b30c1ce681468d2a48a190d546c81a6eb779ca
|
7
|
+
data.tar.gz: 6781db79ba3fce1c75f13e8587ceffe8e26d0da276c0c1bbf175f942a9e8e9f1b742884413aabcc6b719a2c010c4156e601aa4577b9604e6edcd7959c67447ec
|
data/CHANGELOG.md
CHANGED
@@ -1,5 +1,39 @@
|
|
1
1
|
# Changelog
|
2
2
|
|
3
|
+
## [0.5.0] - 2025-03-10
|
4
|
+
|
5
|
+
### Added
|
6
|
+
- Added repository directory structure visualization with `--show-structure` / `-s` option
|
7
|
+
- Created `DirectoryStructureBuilder` class to generate tree views of repositories
|
8
|
+
- Added `generate_directory_structure` method to the Generator class
|
9
|
+
- Added tests for directory structure visualization
|
10
|
+
|
11
|
+
### Changed
|
12
|
+
- Enhanced documentation with directory structure visualization examples
|
13
|
+
- Updated CLI help with the new option
|
14
|
+
|
15
|
+
---
|
16
|
+
|
17
|
+
## [0.4.0] - 2025-03-03
|
18
|
+
|
19
|
+
### Added
|
20
|
+
- Added `generate_prompt` method for in-memory content generation without file I/O
|
21
|
+
- Integrated visual progress bar with file processing rate reporting
|
22
|
+
- Added human-readable time formatting for progress estimates
|
23
|
+
- Enhanced test coverage for multithreaded operations
|
24
|
+
|
25
|
+
### Changed
|
26
|
+
- Refactored `process_content_to_output` for better code reuse between file and string output
|
27
|
+
- Improved thread management to handle various error conditions more gracefully
|
28
|
+
- Enhanced documentation with programmatic usage examples
|
29
|
+
|
30
|
+
### Fixed
|
31
|
+
- Resolved thread pool shutdown issues in test environment
|
32
|
+
- Fixed race conditions in progress indicator updates
|
33
|
+
- Addressed timing inconsistencies in multithreaded test scenarios
|
34
|
+
|
35
|
+
---
|
36
|
+
|
3
37
|
## [0.3.1] - 2025-03-03
|
4
38
|
|
5
39
|
### Added
|
data/README.md
CHANGED
@@ -1,3 +1,6 @@
|
|
1
|
+
[](https://badge.fury.io/rb/gitingest)
|
2
|
+

|
3
|
+
|
1
4
|
# Gitingest
|
2
5
|
|
3
6
|
Gitingest is a Ruby gem that fetches files from a GitHub repository and generates a consolidated text prompt, which can be used as input for large language models, documentation generation, or other purposes.
|
@@ -39,6 +42,18 @@ gitingest --repository user/repo --branch develop
|
|
39
42
|
# Exclude additional patterns
|
40
43
|
gitingest --repository user/repo --exclude "*.md,docs/"
|
41
44
|
|
45
|
+
# Control the number of threads
|
46
|
+
gitingest --repository user/repo -T 4
|
47
|
+
|
48
|
+
# Set thread pool shutdown timeout
|
49
|
+
gitingest --repository user/repo -W 120
|
50
|
+
|
51
|
+
# Show repository directory structure
|
52
|
+
gitingest --repository user/repo -s
|
53
|
+
|
54
|
+
# Combine threading options
|
55
|
+
gitingest --repository user/repo -T 8 -W 90
|
56
|
+
|
42
57
|
# Quiet mode
|
43
58
|
gitingest --repository user/repo --quiet
|
44
59
|
|
@@ -53,20 +68,41 @@ gitingest --repository user/repo --verbose
|
|
53
68
|
- `-o, --output FILE`: Output file for the prompt [Default: reponame_prompt.txt]
|
54
69
|
- `-e, --exclude PATTERN`: File patterns to exclude (comma separated)
|
55
70
|
- `-b, --branch BRANCH`: Repository branch [Default: main]
|
71
|
+
- `-s, --show-structure`: Show repository directory structure instead of generating prompt
|
72
|
+
- `-T, --threads COUNT`: Number of concurrent threads [Default: auto-detected]
|
73
|
+
- `-W, --thread-timeout SECONDS`: Thread pool shutdown timeout [Default: 60]
|
74
|
+
- `-q, --quiet`: Reduce logging to errors only
|
75
|
+
- `-v, --verbose`: Increase logging verbosity
|
56
76
|
- `-h, --help`: Show help message
|
57
77
|
|
78
|
+
### Directory Structure Visualization
|
79
|
+
|
80
|
+
```bash
|
81
|
+
gitingest --repository user/repo --show-structure
|
82
|
+
```
|
83
|
+
|
84
|
+
This will display a tree view of the repository's structure:
|
85
|
+
|
58
86
|
### As a Library
|
59
87
|
|
60
88
|
```ruby
|
61
89
|
require "gitingest"
|
62
90
|
|
63
|
-
# Basic usage
|
91
|
+
# Basic usage - write to a file
|
64
92
|
generator = Gitingest::Generator.new(
|
65
93
|
repository: "user/repo",
|
66
94
|
token: "YOUR_GITHUB_TOKEN" # optional
|
67
95
|
)
|
96
|
+
|
97
|
+
# Run the full workflow (fetch repository and generate file)
|
68
98
|
generator.run
|
69
99
|
|
100
|
+
# OR generate file only (if you need the output path)
|
101
|
+
output_path = generator.generate_file
|
102
|
+
|
103
|
+
# Get content as a string (for in-memory processing)
|
104
|
+
content = generator.generate_prompt
|
105
|
+
|
70
106
|
# With custom options
|
71
107
|
generator = Gitingest::Generator.new(
|
72
108
|
repository: "user/repo",
|
@@ -74,9 +110,10 @@ generator = Gitingest::Generator.new(
|
|
74
110
|
output_file: "my_prompt.txt",
|
75
111
|
branch: "develop",
|
76
112
|
exclude: ["*.md", "docs/"],
|
77
|
-
|
113
|
+
threads: 4, # control concurrency
|
114
|
+
thread_timeout: 120, # custom thread timeout
|
115
|
+
quiet: true # or verbose: true
|
78
116
|
)
|
79
|
-
generator.run
|
80
117
|
|
81
118
|
# With custom logger
|
82
119
|
custom_logger = Logger.new("gitingest.log")
|
@@ -84,7 +121,6 @@ generator = Gitingest::Generator.new(
|
|
84
121
|
repository: "user/repo",
|
85
122
|
logger: custom_logger
|
86
123
|
)
|
87
|
-
generator.run
|
88
124
|
```
|
89
125
|
|
90
126
|
## Features
|
@@ -124,4 +160,4 @@ Inspired by [`cyclotruc/gitingest`](https://github.com/cyclotruc/gitingest).
|
|
124
160
|
|
125
161
|
## License
|
126
162
|
|
127
|
-
The gem is available as open source under the terms of the [MIT License](https://opensource.org/licenses/MIT).
|
163
|
+
The gem is available as open source under the terms of the [MIT License](https://opensource.org/licenses/MIT).
|
data/bin/gitingest
CHANGED
@@ -22,7 +22,7 @@ parser = OptionParser.new do |opts|
|
|
22
22
|
options[:output_file] = file
|
23
23
|
end
|
24
24
|
|
25
|
-
opts.on("-b", "--branch BRANCH", "Repository branch") do |branch|
|
25
|
+
opts.on("-b", "--branch BRANCH", "Repository branch [Default: main]") do |branch|
|
26
26
|
options[:branch] = branch
|
27
27
|
end
|
28
28
|
|
@@ -30,11 +30,24 @@ parser = OptionParser.new do |opts|
|
|
30
30
|
options[:exclude] = pattern.split(",")
|
31
31
|
end
|
32
32
|
|
33
|
-
opts.on("-
|
33
|
+
opts.on("-T", "--threads COUNT", Integer, "Number of concurrent threads [Default: auto-detected]") do |threads|
|
34
|
+
options[:threads] = threads
|
35
|
+
end
|
36
|
+
|
37
|
+
opts.on("-W", "--thread-timeout SECONDS", Integer,
|
38
|
+
"Thread pool shutdown timeout in seconds [Default: 60]") do |timeout|
|
39
|
+
options[:thread_timeout] = timeout
|
40
|
+
end
|
41
|
+
|
42
|
+
opts.on("-s", "--show-structure", "Show repository directory structure") do
|
43
|
+
options[:show_structure] = true
|
44
|
+
end
|
45
|
+
|
46
|
+
opts.on("-q", "--quiet", "Reduce logging to errors only") do
|
34
47
|
options[:quiet] = true
|
35
48
|
end
|
36
49
|
|
37
|
-
opts.on("-v", "--verbose", "
|
50
|
+
opts.on("-v", "--verbose", "Increase logging verbosity") do
|
38
51
|
options[:verbose] = true
|
39
52
|
end
|
40
53
|
|
@@ -42,6 +55,14 @@ parser = OptionParser.new do |opts|
|
|
42
55
|
puts opts
|
43
56
|
exit
|
44
57
|
end
|
58
|
+
|
59
|
+
opts.separator ""
|
60
|
+
opts.separator "Examples:"
|
61
|
+
opts.separator " gitingest -r user/repo # Basic usage with public repository"
|
62
|
+
opts.separator " gitingest -r user/repo -t YOUR_TOKEN # With GitHub token for private repositories"
|
63
|
+
opts.separator " gitingest -r user/repo -o custom_prompt.txt # Custom output file"
|
64
|
+
opts.separator " gitingest -r user/repo -T 8 # Use 8 threads for processing"
|
65
|
+
opts.separator " gitingest -r user/repo -s # Show repository directory structure"
|
45
66
|
end
|
46
67
|
|
47
68
|
begin
|
data/index.html
CHANGED
@@ -6,6 +6,7 @@
|
|
6
6
|
<title>Gitingest - GitHub Repository Fetcher and Prompt Generator</title>
|
7
7
|
<link rel="stylesheet" href="https://cdnjs.cloudflare.com/ajax/libs/github-markdown-css/5.2.0/github-markdown.min.css">
|
8
8
|
<style>
|
9
|
+
/* Styles remain the same */
|
9
10
|
:root {
|
10
11
|
--bg-color: #0d1117;
|
11
12
|
--text-color: #c9d1d9;
|
@@ -176,7 +177,7 @@
|
|
176
177
|
<div class="header">
|
177
178
|
<div class="logo">G</div>
|
178
179
|
<div>
|
179
|
-
<h1>Gitingest <span class="version-badge">v0.
|
180
|
+
<h1>Gitingest <span class="version-badge">v0.5.0</span></h1>
|
180
181
|
<p>A Ruby gem that fetches files from a GitHub repository and generates a consolidated text prompt for LLMs</p>
|
181
182
|
</div>
|
182
183
|
</div>
|
@@ -213,6 +214,18 @@ gitingest --repository user/repo --branch develop
|
|
213
214
|
# Exclude additional patterns
|
214
215
|
gitingest --repository user/repo --exclude "*.md,docs/"
|
215
216
|
|
217
|
+
# Show repository directory structure
|
218
|
+
gitingest --repository user/repo -s
|
219
|
+
|
220
|
+
# Control the number of threads
|
221
|
+
gitingest --repository user/repo -T 4
|
222
|
+
|
223
|
+
# Set thread pool shutdown timeout
|
224
|
+
gitingest --repository user/repo -W 120
|
225
|
+
|
226
|
+
# Combine threading options
|
227
|
+
gitingest --repository user/repo -T 8 -W 90
|
228
|
+
|
216
229
|
# Quiet mode
|
217
230
|
gitingest --repository user/repo --quiet
|
218
231
|
|
@@ -226,19 +239,54 @@ gitingest --repository user/repo --verbose</code></pre>
|
|
226
239
|
<li><code>-o, --output FILE</code>: Output file for the prompt [Default: reponame_prompt.txt]</li>
|
227
240
|
<li><code>-e, --exclude PATTERN</code>: File patterns to exclude (comma separated)</li>
|
228
241
|
<li><code>-b, --branch BRANCH</code>: Repository branch [Default: main]</li>
|
242
|
+
<li><code>-s, --show-structure</code>: Show repository directory structure</li>
|
243
|
+
<li><code>-T, --threads COUNT</code>: Number of concurrent threads [Default: auto-detected]</li>
|
244
|
+
<li><code>-W, --thread-timeout SECONDS</code>: Thread pool shutdown timeout [Default: 60]</li>
|
245
|
+
<li><code>-q, --quiet</code>: Reduce logging to errors only</li>
|
246
|
+
<li><code>-v, --verbose</code>: Increase logging verbosity</li>
|
229
247
|
<li><code>-h, --help</code>: Show help message</li>
|
230
248
|
</ul>
|
231
249
|
|
250
|
+
<h3>Directory Structure Visualization</h3>
|
251
|
+
<p>You can visualize the structure of a repository using the <code>--show-structure</code> option:</p>
|
252
|
+
<pre><code>gitingest --repository user/repo --show-structure</code></pre>
|
253
|
+
|
254
|
+
<p>This will display a tree view of the repository's structure, for example:</p>
|
255
|
+
<pre><code>Directory structure:
|
256
|
+
└── repo-name/
|
257
|
+
├── README.md
|
258
|
+
├── LICENSE
|
259
|
+
├── lib/
|
260
|
+
│ ├── repo-name.rb
|
261
|
+
│ └── repo-name/
|
262
|
+
│ └── version.rb
|
263
|
+
├── bin/
|
264
|
+
│ └── console
|
265
|
+
└── spec/
|
266
|
+
├── spec_helper.rb
|
267
|
+
└── repo-name_spec.rb</code></pre>
|
268
|
+
|
232
269
|
<h3>As a Library</h3>
|
233
270
|
<pre><code>require "gitingest"
|
234
271
|
|
235
|
-
# Basic usage
|
272
|
+
# Basic usage - write to a file
|
236
273
|
generator = Gitingest::Generator.new(
|
237
274
|
repository: "user/repo",
|
238
275
|
token: "YOUR_GITHUB_TOKEN" # optional
|
239
276
|
)
|
277
|
+
|
278
|
+
# Run the full workflow (fetch repository and generate file)
|
240
279
|
generator.run
|
241
280
|
|
281
|
+
# OR generate file only (if you need the output path)
|
282
|
+
output_path = generator.generate_file
|
283
|
+
|
284
|
+
# Get content as a string (for in-memory processing)
|
285
|
+
content = generator.generate_prompt
|
286
|
+
|
287
|
+
# Generate and get repository directory structure
|
288
|
+
structure = generator.generate_directory_structure
|
289
|
+
|
242
290
|
# With custom options
|
243
291
|
generator = Gitingest::Generator.new(
|
244
292
|
repository: "user/repo",
|
@@ -246,26 +294,32 @@ generator = Gitingest::Generator.new(
|
|
246
294
|
output_file: "my_prompt.txt",
|
247
295
|
branch: "develop",
|
248
296
|
exclude: ["*.md", "docs/"],
|
249
|
-
|
297
|
+
threads: 4, # control concurrency
|
298
|
+
thread_timeout: 120, # custom thread timeout
|
299
|
+
quiet: true, # or verbose: true
|
300
|
+
show_structure: true # show directory structure instead of generating prompt
|
250
301
|
)
|
251
|
-
generator.run
|
252
302
|
|
253
303
|
# With custom logger
|
254
304
|
custom_logger = Logger.new("gitingest.log")
|
255
305
|
generator = Gitingest::Generator.new(
|
256
306
|
repository: "user/repo",
|
257
307
|
logger: custom_logger
|
258
|
-
)
|
259
|
-
generator.run</code></pre>
|
308
|
+
)</code></pre>
|
260
309
|
|
261
310
|
<h2>Features</h2>
|
262
311
|
<ul>
|
263
312
|
<li>Fetches all files from a GitHub repository based on the given branch</li>
|
264
313
|
<li>Automatically excludes common binary files and system files by default</li>
|
265
314
|
<li>Allows custom exclusion patterns for specific file extensions or directories</li>
|
266
|
-
<li>Uses concurrent processing for faster downloads</li>
|
267
|
-
<li>
|
315
|
+
<li>Uses concurrent processing with configurable thread count for faster downloads</li>
|
316
|
+
<li>Shows real-time progress with visual bar, ETA, and processing rate</li>
|
317
|
+
<li>Handles GitHub API rate limiting with automatic retry and exponential backoff</li>
|
318
|
+
<li>Optimizes memory usage with buffered writes and thread-local buffers</li>
|
319
|
+
<li>Intelligently prioritizes files for better thread distribution</li>
|
268
320
|
<li>Generates a clean, formatted output file with file paths and content</li>
|
321
|
+
<li>Provides both file-based and string-based output options</li>
|
322
|
+
<li>Visualizes repository directory structure in a tree format</li>
|
269
323
|
</ul>
|
270
324
|
|
271
325
|
<h2>Default Exclusion Patterns</h2>
|
@@ -290,6 +344,52 @@ generator.run</code></pre>
|
|
290
344
|
<div class="changelog">
|
291
345
|
<h2>Changelog</h2>
|
292
346
|
|
347
|
+
<div class="changelog-item">
|
348
|
+
<div>
|
349
|
+
<span class="changelog-version">v0.5.0</span>
|
350
|
+
<span class="changelog-date">- March 4, 2025</span>
|
351
|
+
</div>
|
352
|
+
<ul class="changelog-list">
|
353
|
+
<li>Added repository directory structure visualization with <code>--show-structure</code> option</li>
|
354
|
+
<li>Created <code>DirectoryStructureBuilder</code> class to generate tree views of repositories</li>
|
355
|
+
<li>Added <code>generate_directory_structure</code> method to the Generator class</li>
|
356
|
+
<li>Added tests for the directory structure visualization</li>
|
357
|
+
<li>Updated documentation with directory structure visualization examples</li>
|
358
|
+
</ul>
|
359
|
+
</div>
|
360
|
+
|
361
|
+
<div class="changelog-item">
|
362
|
+
<div>
|
363
|
+
<span class="changelog-version">v0.4.0</span>
|
364
|
+
<span class="changelog-date">- March 4, 2025</span>
|
365
|
+
</div>
|
366
|
+
<ul class="changelog-list">
|
367
|
+
<li>Added <code>generate_prompt</code> method for in-memory content generation without file I/O</li>
|
368
|
+
<li>Integrated visual progress bar with file processing rate reporting</li>
|
369
|
+
<li>Added human-readable time formatting for progress estimates</li>
|
370
|
+
<li>Enhanced test coverage for multithreaded operations</li>
|
371
|
+
<li>Refactored <code>process_content_to_output</code> for better code reuse</li>
|
372
|
+
<li>Improved thread management to handle various error conditions gracefully</li>
|
373
|
+
<li>Fixed thread pool shutdown issues and race conditions</li>
|
374
|
+
</ul>
|
375
|
+
</div>
|
376
|
+
|
377
|
+
<div class="changelog-item">
|
378
|
+
<div>
|
379
|
+
<span class="changelog-version">v0.3.1</span>
|
380
|
+
<span class="changelog-date">- March 3, 2025</span>
|
381
|
+
</div>
|
382
|
+
<ul class="changelog-list">
|
383
|
+
<li>Introduced configurable threading options with <code>:threads</code> and <code>:thread_timeout</code></li>
|
384
|
+
<li>Implemented thread-local buffers to reduce mutex contention during file processing</li>
|
385
|
+
<li>Added exponential backoff with jitter for rate-limited API requests</li>
|
386
|
+
<li>Improved progress indicator with estimated time remaining</li>
|
387
|
+
<li>Increased <code>BUFFER_SIZE</code> from 100 to 250 to reduce I/O operations</li>
|
388
|
+
<li>Optimized file exclusion check using a combined regex for faster matching</li>
|
389
|
+
<li>Improved thread pool efficiency by prioritizing smaller files first</li>
|
390
|
+
</ul>
|
391
|
+
</div>
|
392
|
+
|
293
393
|
<div class="changelog-item">
|
294
394
|
<div>
|
295
395
|
<span class="changelog-version">v0.3.0</span>
|
@@ -298,7 +398,7 @@ generator.run</code></pre>
|
|
298
398
|
<ul class="changelog-list">
|
299
399
|
<li>Added <code>faraday-retry</code> gem dependency for better API rate limit handling</li>
|
300
400
|
<li>Implemented thread-safe buffer management with mutex locks</li>
|
301
|
-
<li>Added new <code>ProgressIndicator</code> class for better CLI progress reporting
|
401
|
+
<li>Added new <code>ProgressIndicator</code> class for better CLI progress reporting</li>
|
302
402
|
<li>Improved memory efficiency with configurable buffer size</li>
|
303
403
|
<li>Enhanced code organization with dedicated methods for file content formatting</li>
|
304
404
|
<li>Added comprehensive method documentation and parameter descriptions</li>
|
@@ -323,26 +423,6 @@ generator.run</code></pre>
|
|
323
423
|
<li>Enforced a 1000 file limit to prevent memory overload</li>
|
324
424
|
</ul>
|
325
425
|
</div>
|
326
|
-
|
327
|
-
<div class="changelog-item">
|
328
|
-
<div>
|
329
|
-
<span class="changelog-version">v0.1.0</span>
|
330
|
-
<span class="changelog-date">- March 2, 2025</span>
|
331
|
-
</div>
|
332
|
-
<ul class="changelog-list">
|
333
|
-
<li>Initial release of Gitingest</li>
|
334
|
-
<li>Core functionality to fetch and process GitHub repository files</li>
|
335
|
-
<li>Command-line interface for easy interaction</li>
|
336
|
-
<li>Smart file filtering with default exclusions for common non-code files</li>
|
337
|
-
<li>Concurrent processing for improved performance</li>
|
338
|
-
<li>Custom exclude patterns support</li>
|
339
|
-
<li>GitHub authentication via access tokens</li>
|
340
|
-
<li>Automatic rate limit handling with retry mechanism</li>
|
341
|
-
<li>Repository prompt generation with file separation markers</li>
|
342
|
-
<li>Support for custom branch selection</li>
|
343
|
-
<li>Custom output file naming options</li>
|
344
|
-
</ul>
|
345
|
-
</div>
|
346
426
|
</div>
|
347
427
|
|
348
428
|
<h2>Contributing</h2>
|
@@ -357,7 +437,7 @@ generator.run</code></pre>
|
|
357
437
|
|
358
438
|
<footer>
|
359
439
|
<p>© 2025 David Santangelo</p>
|
360
|
-
<p>Last updated: March
|
440
|
+
<p>Last updated: March 4, 2025</p>
|
361
441
|
</footer>
|
362
442
|
</body>
|
363
443
|
</html>
|
data/lib/gitingest/generator.rb
CHANGED
@@ -96,6 +96,7 @@ module Gitingest
|
|
96
96
|
# @option options [Logger] :logger Custom logger instance
|
97
97
|
# @option options [Integer] :threads Number of threads to use (default: auto-detected)
|
98
98
|
# @option options [Integer] :thread_timeout Seconds to wait for thread pool shutdown (default: 60)
|
99
|
+
# @option options [Boolean] :show_structure Show repository directory structure (default: false)
|
99
100
|
def initialize(options = {})
|
100
101
|
@options = options
|
101
102
|
@repo_files = []
|
@@ -106,10 +107,63 @@ module Gitingest
|
|
106
107
|
compile_excluded_patterns
|
107
108
|
end
|
108
109
|
|
109
|
-
# Main execution method
|
110
|
+
# Main execution method for command line
|
110
111
|
def run
|
111
112
|
fetch_repository_contents
|
112
|
-
|
113
|
+
|
114
|
+
if @options[:show_structure]
|
115
|
+
puts generate_directory_structure
|
116
|
+
return
|
117
|
+
end
|
118
|
+
|
119
|
+
generate_file
|
120
|
+
end
|
121
|
+
|
122
|
+
# Generate content and save it to a file
|
123
|
+
#
|
124
|
+
# @return [String] Path to the generated file
|
125
|
+
def generate_file
|
126
|
+
fetch_repository_contents if @repo_files.empty?
|
127
|
+
|
128
|
+
@logger.info "Generating file for #{@options[:repository]}"
|
129
|
+
File.open(@options[:output_file], "w") do |file|
|
130
|
+
process_content_to_output(file)
|
131
|
+
end
|
132
|
+
|
133
|
+
@logger.info "Prompt generated and saved to #{@options[:output_file]}"
|
134
|
+
@options[:output_file]
|
135
|
+
end
|
136
|
+
|
137
|
+
# Generate content and return it as a string
|
138
|
+
# Useful for programmatic usage
|
139
|
+
#
|
140
|
+
# @return [String] The generated repository content
|
141
|
+
def generate_prompt
|
142
|
+
@logger.info "Generating in-memory prompt for #{@options[:repository]}"
|
143
|
+
|
144
|
+
fetch_repository_contents if @repo_files.empty?
|
145
|
+
|
146
|
+
content = StringIO.new
|
147
|
+
process_content_to_output(content)
|
148
|
+
|
149
|
+
result = content.string
|
150
|
+
@logger.info "Generated #{result.size} bytes of content in memory"
|
151
|
+
result
|
152
|
+
end
|
153
|
+
|
154
|
+
# Generate a textual representation of the repository's directory structure
|
155
|
+
#
|
156
|
+
# @return [String] The directory structure as a formatted string
|
157
|
+
def generate_directory_structure
|
158
|
+
fetch_repository_contents if @repo_files.empty?
|
159
|
+
|
160
|
+
@logger.info "Generating directory structure for #{@options[:repository]}"
|
161
|
+
|
162
|
+
repo_name = @options[:repository].split("/").last
|
163
|
+
structure = DirectoryStructureBuilder.new(repo_name, @repo_files).build
|
164
|
+
|
165
|
+
@logger.info "\n"
|
166
|
+
structure
|
113
167
|
end
|
114
168
|
|
115
169
|
private
|
@@ -137,6 +191,7 @@ module Gitingest
|
|
137
191
|
@options[:exclude] ||= []
|
138
192
|
@options[:threads] ||= DEFAULT_THREAD_COUNT
|
139
193
|
@options[:thread_timeout] ||= DEFAULT_THREAD_TIMEOUT
|
194
|
+
@options[:show_structure] ||= false
|
140
195
|
@excluded_patterns = DEFAULT_EXCLUDES + @options[:exclude]
|
141
196
|
end
|
142
197
|
|
@@ -202,89 +257,82 @@ module Gitingest
|
|
202
257
|
path.match?(@combined_exclude_regex)
|
203
258
|
end
|
204
259
|
|
205
|
-
#
|
206
|
-
def
|
207
|
-
@logger.info "Generating prompt..."
|
260
|
+
# Common implementation for both file and string output
|
261
|
+
def process_content_to_output(output)
|
208
262
|
@logger.debug "Using thread pool with #{@options[:threads]} threads"
|
209
263
|
|
210
264
|
buffer = []
|
211
265
|
progress = ProgressIndicator.new(@repo_files.size, @logger)
|
212
266
|
|
213
|
-
#
|
267
|
+
# Thread-local buffers to reduce mutex contention
|
214
268
|
thread_buffers = {}
|
215
269
|
mutex = Mutex.new
|
216
270
|
errors = []
|
217
271
|
|
218
|
-
#
|
272
|
+
# Thread pool based on configuration
|
219
273
|
pool = Concurrent::FixedThreadPool.new(@options[:threads])
|
220
274
|
|
221
|
-
# Group files by priority
|
275
|
+
# Group files by priority
|
222
276
|
prioritized_files = prioritize_files(@repo_files)
|
223
277
|
|
224
|
-
|
225
|
-
|
226
|
-
|
227
|
-
|
228
|
-
|
229
|
-
thread_buffers[thread_id] ||= []
|
230
|
-
local_buffer = thread_buffers[thread_id]
|
231
|
-
|
232
|
-
begin
|
233
|
-
content = fetch_file_content_with_retry(repo_file.path)
|
234
|
-
result = format_file_content(repo_file.path, content)
|
235
|
-
local_buffer << result
|
236
|
-
|
237
|
-
# Optimization: Only acquire mutex when local buffer reaches threshold
|
238
|
-
if local_buffer.size >= LOCAL_BUFFER_THRESHOLD
|
239
|
-
mutex.synchronize do
|
240
|
-
buffer.concat(local_buffer)
|
241
|
-
write_buffer(file, buffer) if buffer.size >= BUFFER_SIZE
|
242
|
-
local_buffer.clear
|
243
|
-
end
|
244
|
-
end
|
278
|
+
prioritized_files.each_with_index do |repo_file, index|
|
279
|
+
pool.post do
|
280
|
+
thread_id = Thread.current.object_id
|
281
|
+
thread_buffers[thread_id] ||= []
|
282
|
+
local_buffer = thread_buffers[thread_id]
|
245
283
|
|
246
|
-
|
247
|
-
|
248
|
-
|
249
|
-
|
250
|
-
|
251
|
-
|
252
|
-
rescue StandardError => e
|
284
|
+
begin
|
285
|
+
content = fetch_file_content_with_retry(repo_file.path)
|
286
|
+
result = format_file_content(repo_file.path, content)
|
287
|
+
local_buffer << result
|
288
|
+
|
289
|
+
if local_buffer.size >= LOCAL_BUFFER_THRESHOLD
|
253
290
|
mutex.synchronize do
|
254
|
-
|
255
|
-
|
291
|
+
buffer.concat(local_buffer)
|
292
|
+
write_buffer(output, buffer) if buffer.size >= BUFFER_SIZE
|
293
|
+
local_buffer.clear
|
256
294
|
end
|
257
295
|
end
|
296
|
+
|
297
|
+
progress.update(index + 1)
|
298
|
+
rescue Octokit::Error => e
|
299
|
+
mutex.synchronize do
|
300
|
+
errors << "Error fetching #{repo_file.path}: #{e.message}"
|
301
|
+
@logger.error "Error fetching #{repo_file.path}: #{e.message}"
|
302
|
+
end
|
303
|
+
rescue StandardError => e
|
304
|
+
mutex.synchronize do
|
305
|
+
errors << "Unexpected error processing #{repo_file.path}: #{e.message}"
|
306
|
+
@logger.error "Unexpected error processing #{repo_file.path}: #{e.message}"
|
307
|
+
end
|
258
308
|
end
|
259
309
|
end
|
310
|
+
end
|
260
311
|
|
261
|
-
|
262
|
-
|
263
|
-
|
312
|
+
begin
|
313
|
+
pool.shutdown
|
314
|
+
wait_success = pool.wait_for_termination(@options[:thread_timeout])
|
264
315
|
|
265
|
-
|
266
|
-
|
267
|
-
|
268
|
-
end
|
269
|
-
rescue StandardError => e
|
270
|
-
@logger.error "Error during thread pool shutdown: #{e.message}"
|
316
|
+
unless wait_success
|
317
|
+
@logger.warn "Thread pool did not shut down within #{@options[:thread_timeout]} seconds, forcing termination"
|
318
|
+
pool.kill
|
271
319
|
end
|
320
|
+
rescue StandardError => e
|
321
|
+
@logger.error "Error during thread pool shutdown: #{e.message}"
|
322
|
+
end
|
272
323
|
|
273
|
-
|
274
|
-
|
275
|
-
|
276
|
-
|
277
|
-
end
|
278
|
-
write_buffer(file, buffer) unless buffer.empty?
|
324
|
+
# Process remaining files in thread-local buffers
|
325
|
+
mutex.synchronize do
|
326
|
+
thread_buffers.each_value do |local_buffer|
|
327
|
+
buffer.concat(local_buffer) unless local_buffer.empty?
|
279
328
|
end
|
329
|
+
write_buffer(output, buffer) unless buffer.empty?
|
280
330
|
end
|
281
331
|
|
282
|
-
|
283
|
-
@logger.warn "Completed with #{errors.size} errors"
|
284
|
-
@logger.debug "First few errors: #{errors.first(3).join(", ")}" if @logger.debug?
|
285
|
-
end
|
332
|
+
return unless errors.any?
|
286
333
|
|
287
|
-
@logger.
|
334
|
+
@logger.warn "Completed with #{errors.size} errors"
|
335
|
+
@logger.debug "First few errors: #{errors.first(3).join(", ")}" if @logger.debug?
|
288
336
|
end
|
289
337
|
|
290
338
|
# Format a file's content for the prompt
|
@@ -416,4 +464,57 @@ module Gitingest
|
|
416
464
|
end
|
417
465
|
end
|
418
466
|
end
|
467
|
+
|
468
|
+
# Helper class to build directory structure visualization
|
469
|
+
class DirectoryStructureBuilder
|
470
|
+
def initialize(root_name, files)
|
471
|
+
@root_name = root_name
|
472
|
+
@files = files.map(&:path)
|
473
|
+
end
|
474
|
+
|
475
|
+
def build
|
476
|
+
tree = { @root_name => {} }
|
477
|
+
|
478
|
+
@files.sort.each do |path|
|
479
|
+
parts = path.split("/")
|
480
|
+
current = tree[@root_name]
|
481
|
+
|
482
|
+
parts.each do |part|
|
483
|
+
if part == parts.last
|
484
|
+
current[part] = nil
|
485
|
+
else
|
486
|
+
current[part] ||= {}
|
487
|
+
current = current[part]
|
488
|
+
end
|
489
|
+
end
|
490
|
+
end
|
491
|
+
|
492
|
+
output = ["Directory structure:"]
|
493
|
+
render_tree(tree, "", output)
|
494
|
+
output.join("\n")
|
495
|
+
end
|
496
|
+
|
497
|
+
private
|
498
|
+
|
499
|
+
def render_tree(tree, prefix, output)
|
500
|
+
return if tree.nil?
|
501
|
+
|
502
|
+
tree.keys.each_with_index do |key, index|
|
503
|
+
is_last = index == tree.keys.size - 1
|
504
|
+
current_prefix = prefix
|
505
|
+
|
506
|
+
if prefix.empty?
|
507
|
+
output << "└── #{key}/"
|
508
|
+
current_prefix = " "
|
509
|
+
else
|
510
|
+
connector = is_last ? "└── " : "├── "
|
511
|
+
item = tree[key].is_a?(Hash) ? "#{key}/" : key
|
512
|
+
output << "#{prefix}#{connector}#{item}"
|
513
|
+
current_prefix = prefix + (is_last ? " " : "│ ")
|
514
|
+
end
|
515
|
+
|
516
|
+
render_tree(tree[key], current_prefix, output) if tree[key].is_a?(Hash)
|
517
|
+
end
|
518
|
+
end
|
519
|
+
end
|
419
520
|
end
|
data/lib/gitingest/version.rb
CHANGED
metadata
CHANGED
@@ -1,14 +1,14 @@
|
|
1
1
|
--- !ruby/object:Gem::Specification
|
2
2
|
name: gitingest
|
3
3
|
version: !ruby/object:Gem::Version
|
4
|
-
version: 0.
|
4
|
+
version: 0.5.0
|
5
5
|
platform: ruby
|
6
6
|
authors:
|
7
7
|
- Davide Santangelo
|
8
8
|
autorequire:
|
9
9
|
bindir: bin
|
10
10
|
cert_chain: []
|
11
|
-
date: 2025-03-
|
11
|
+
date: 2025-03-10 00:00:00.000000000 Z
|
12
12
|
dependencies:
|
13
13
|
- !ruby/object:Gem::Dependency
|
14
14
|
name: concurrent-ruby
|