gffkit 0.1.0__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
gffkit-0.1.0/LICENSE ADDED
@@ -0,0 +1,21 @@
1
+ MIT License
2
+
3
+ Copyright (c) 2026 Qunjie Zhang
4
+
5
+ Permission is hereby granted, free of charge, to any person obtaining a copy
6
+ of this software and associated documentation files (the "Software"), to deal
7
+ in the Software without restriction, including without limitation the rights
8
+ to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
9
+ copies of the Software, and to permit persons to whom the Software is
10
+ furnished to do so, subject to the following conditions:
11
+
12
+ The above copyright notice and this permission notice shall be included in all
13
+ copies or substantial portions of the Software.
14
+
15
+ THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16
+ IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17
+ FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
18
+ AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19
+ LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
20
+ OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
21
+ SOFTWARE.
@@ -0,0 +1,3 @@
1
+ include README.md
2
+ include LICENSE
3
+ recursive-include src/gffkit *.py
gffkit-0.1.0/PKG-INFO ADDED
@@ -0,0 +1,96 @@
1
+ Metadata-Version: 2.1
2
+ Name: gffkit
3
+ Version: 0.1.0
4
+ Summary: Region-aware GFF annotation integration toolkit
5
+ Author: Qunjie Zhang
6
+ License: MIT
7
+ Project-URL: Homepage, https://github.com/qunjie-zhang/gffkit
8
+ Project-URL: Repository, https://github.com/qunjie-zhang/gffkit
9
+ Project-URL: Issues, https://github.com/qunjie-zhang/gffkit/issues
10
+ Keywords: GFF3,GTF,genome annotation,bioinformatics,UTR,gene annotation
11
+ Classifier: Development Status :: 3 - Alpha
12
+ Classifier: Intended Audience :: Science/Research
13
+ Classifier: Topic :: Scientific/Engineering :: Bio-Informatics
14
+ Classifier: License :: OSI Approved :: MIT License
15
+ Classifier: Programming Language :: Python :: 3
16
+ Classifier: Programming Language :: Python :: 3.8
17
+ Classifier: Programming Language :: Python :: 3.9
18
+ Classifier: Programming Language :: Python :: 3.10
19
+ Classifier: Programming Language :: Python :: 3.11
20
+ Classifier: Programming Language :: Python :: 3.12
21
+ Classifier: Operating System :: OS Independent
22
+ Requires-Python: >=3.8
23
+ Description-Content-Type: text/markdown
24
+ License-File: LICENSE
25
+
26
+ # gffkit
27
+
28
+ `gffkit` is a lightweight toolkit for region-aware GFF/GTF annotation integration.
29
+ It combines three utilities:
30
+
31
+ 1. `detect-bridge`: detect suspicious merged-gene artifacts caused by bridge transcripts.
32
+ 2. `complement`: complement/merge annotations, with optional region-swap mode.
33
+ 3. `add-utr`: reconstruct `five_prime_UTR` and `three_prime_UTR` features from exon/CDS coordinates.
34
+
35
+ ## Installation
36
+
37
+ ```bash
38
+ pip install gffkit
39
+ ```
40
+
41
+
42
+ ## Quick start
43
+
44
+ ### Full integration pipeline
45
+
46
+ ```bash
47
+ gffkit integrate \
48
+ --annotation-a EviAnn.gff3 \
49
+ --annotation-b ANNEVO.gff3 \
50
+ --outdir gffkit_out \
51
+ --prefix sample
52
+ ```
53
+
54
+ Outputs:
55
+
56
+ - `gffkit_out/sample.suspicious.tsv`
57
+ - `gffkit_out/sample.merged.gff3`
58
+ - `gffkit_out/sample.final.withUTR.gff3`
59
+
60
+ ### Step-by-step usage
61
+
62
+ ```bash
63
+ # 1. Detect suspicious merged genes in Annotation A
64
+ gffkit detect-bridge -i EviAnn.gff3 -o suspicious.tsv
65
+
66
+ # 2. Use A as the global reference, but switch to B in suspicious regions
67
+ gffkit complement \
68
+ --ref EviAnn.gff3 \
69
+ --add ANNEVO.gff3 \
70
+ --swap_region_tsv suspicious.tsv \
71
+ --swap_region_flank 100 \
72
+ --output merged.gff3
73
+
74
+ # 3. Add UTR features
75
+ gffkit add-utr -i merged.gff3 -o final.annotation.withUTR.gff3
76
+ ```
77
+
78
+ ## Command overview
79
+
80
+ ```bash
81
+ gffkit --help
82
+ gffkit detect-bridge --help
83
+ gffkit complement --help
84
+ gffkit add-utr --help
85
+ gffkit integrate --help
86
+ ```
87
+
88
+ ## Annotation integration strategy
89
+
90
+ - Annotation A, for example EviAnn/RNA-seq-supported GFF, is used as the global primary reference.
91
+ - Annotation B, for example ANNEVO/deep-learning GFF, is used as the local primary reference only in suspicious merged-gene regions.
92
+ - UTR features are reconstructed after merging using an exon-minus-CDS strategy.
93
+
94
+ ## License
95
+
96
+ MIT License.
gffkit-0.1.0/README.md ADDED
@@ -0,0 +1,71 @@
1
+ # gffkit
2
+
3
+ `gffkit` is a lightweight toolkit for region-aware GFF/GTF annotation integration.
4
+ It combines three utilities:
5
+
6
+ 1. `detect-bridge`: detect suspicious merged-gene artifacts caused by bridge transcripts.
7
+ 2. `complement`: complement/merge annotations, with optional region-swap mode.
8
+ 3. `add-utr`: reconstruct `five_prime_UTR` and `three_prime_UTR` features from exon/CDS coordinates.
9
+
10
+ ## Installation
11
+
12
+ ```bash
13
+ pip install gffkit
14
+ ```
15
+
16
+
17
+ ## Quick start
18
+
19
+ ### Full integration pipeline
20
+
21
+ ```bash
22
+ gffkit integrate \
23
+ --annotation-a EviAnn.gff3 \
24
+ --annotation-b ANNEVO.gff3 \
25
+ --outdir gffkit_out \
26
+ --prefix sample
27
+ ```
28
+
29
+ Outputs:
30
+
31
+ - `gffkit_out/sample.suspicious.tsv`
32
+ - `gffkit_out/sample.merged.gff3`
33
+ - `gffkit_out/sample.final.withUTR.gff3`
34
+
35
+ ### Step-by-step usage
36
+
37
+ ```bash
38
+ # 1. Detect suspicious merged genes in Annotation A
39
+ gffkit detect-bridge -i EviAnn.gff3 -o suspicious.tsv
40
+
41
+ # 2. Use A as the global reference, but switch to B in suspicious regions
42
+ gffkit complement \
43
+ --ref EviAnn.gff3 \
44
+ --add ANNEVO.gff3 \
45
+ --swap_region_tsv suspicious.tsv \
46
+ --swap_region_flank 100 \
47
+ --output merged.gff3
48
+
49
+ # 3. Add UTR features
50
+ gffkit add-utr -i merged.gff3 -o final.annotation.withUTR.gff3
51
+ ```
52
+
53
+ ## Command overview
54
+
55
+ ```bash
56
+ gffkit --help
57
+ gffkit detect-bridge --help
58
+ gffkit complement --help
59
+ gffkit add-utr --help
60
+ gffkit integrate --help
61
+ ```
62
+
63
+ ## Annotation integration strategy
64
+
65
+ - Annotation A, for example EviAnn/RNA-seq-supported GFF, is used as the global primary reference.
66
+ - Annotation B, for example ANNEVO/deep-learning GFF, is used as the local primary reference only in suspicious merged-gene regions.
67
+ - UTR features are reconstructed after merging using an exon-minus-CDS strategy.
68
+
69
+ ## License
70
+
71
+ MIT License.
@@ -0,0 +1,46 @@
1
+ [build-system]
2
+ requires = ["setuptools>=68", "wheel"]
3
+ build-backend = "setuptools.build_meta"
4
+
5
+ [project]
6
+ name = "gffkit"
7
+ version = "0.1.0"
8
+ description = "Region-aware GFF annotation integration toolkit"
9
+ readme = "README.md"
10
+ requires-python = ">=3.8"
11
+ license = {text = "MIT"}
12
+ authors = [
13
+ {name = "Qunjie Zhang"}
14
+ ]
15
+ keywords = ["GFF3", "GTF", "genome annotation", "bioinformatics", "UTR", "gene annotation"]
16
+ classifiers = [
17
+ "Development Status :: 3 - Alpha",
18
+ "Intended Audience :: Science/Research",
19
+ "Topic :: Scientific/Engineering :: Bio-Informatics",
20
+ "License :: OSI Approved :: MIT License",
21
+ "Programming Language :: Python :: 3",
22
+ "Programming Language :: Python :: 3.8",
23
+ "Programming Language :: Python :: 3.9",
24
+ "Programming Language :: Python :: 3.10",
25
+ "Programming Language :: Python :: 3.11",
26
+ "Programming Language :: Python :: 3.12",
27
+ "Operating System :: OS Independent",
28
+ ]
29
+ dependencies = []
30
+
31
+ [project.urls]
32
+ Homepage = "https://github.com/qunjie-zhang/gffkit"
33
+ Repository = "https://github.com/qunjie-zhang/gffkit"
34
+ Issues = "https://github.com/qunjie-zhang/gffkit/issues"
35
+
36
+ [project.scripts]
37
+ gffkit = "gffkit.main:main"
38
+ gffkit-detect-bridge = "gffkit.detect_bridge_merged_genes:main"
39
+ gffkit-complement = "gffkit.complement_annotations:main"
40
+ gffkit-add-utr = "gffkit.add_utr:main"
41
+
42
+ [tool.setuptools]
43
+ package-dir = {"" = "src"}
44
+
45
+ [tool.setuptools.packages.find]
46
+ where = ["src"]
gffkit-0.1.0/setup.cfg ADDED
@@ -0,0 +1,4 @@
1
+ [egg_info]
2
+ tag_build =
3
+ tag_date = 0
4
+
@@ -0,0 +1,3 @@
1
+ """gffkit: region-aware GFF annotation integration utilities."""
2
+
3
+ __version__ = "0.1.0"
@@ -0,0 +1,4 @@
1
+ from .main import main
2
+
3
+ if __name__ == "__main__":
4
+ raise SystemExit(main())