agridatasets 0.1.0__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- agridatasets-0.1.0/CHANGELOG.md +13 -0
- agridatasets-0.1.0/LICENSE +21 -0
- agridatasets-0.1.0/MANIFEST.in +24 -0
- agridatasets-0.1.0/PKG-INFO +146 -0
- agridatasets-0.1.0/README.md +75 -0
- agridatasets-0.1.0/agridatasets/__init__.py +17 -0
- agridatasets-0.1.0/agridatasets/core.py +40 -0
- agridatasets-0.1.0/agridatasets/data/alfalfa_soil.csv +13 -0
- agridatasets-0.1.0/agridatasets/data/apple_canker.csv +37 -0
- agridatasets-0.1.0/agridatasets/data/apple_uniformity.csv +199 -0
- agridatasets-0.1.0/agridatasets/data/avocado_us_sale.csv +811 -0
- agridatasets-0.1.0/agridatasets/data/bamboo_growth.csv +596 -0
- agridatasets-0.1.0/agridatasets/data/biological_control.csv +16 -0
- agridatasets-0.1.0/agridatasets/data/bird_grazing.csv +63 -0
- agridatasets-0.1.0/agridatasets/data/black_duck_survival.csv +51 -0
- agridatasets-0.1.0/agridatasets/data/blackgrass_herbicide.csv +136 -0
- agridatasets-0.1.0/agridatasets/data/broiler_growth.csv +60 -0
- agridatasets-0.1.0/agridatasets/data/budworm_pyrethroid.csv +13 -0
- agridatasets-0.1.0/agridatasets/data/carrot_fly_infestation.csv +97 -0
- agridatasets-0.1.0/agridatasets/data/carrot_insecticide.csv +37 -0
- agridatasets-0.1.0/agridatasets/data/cattle_butterfat.csv +101 -0
- agridatasets-0.1.0/agridatasets/data/cauliflower_growth.csv +15 -0
- agridatasets-0.1.0/agridatasets/data/cork_tree_direction.csv +113 -0
- agridatasets-0.1.0/agridatasets/data/corn_hybrid_density.csv +25 -0
- agridatasets-0.1.0/agridatasets/data/cotton_pesticide.csv +26 -0
- agridatasets-0.1.0/agridatasets/data/cowpea_maize_yield.csv +73 -0
- agridatasets-0.1.0/agridatasets/data/cows_insemination.csv +11 -0
- agridatasets-0.1.0/agridatasets/data/earthworm_crop_soils.csv +13 -0
- agridatasets-0.1.0/agridatasets/data/earthworm_population.csv +47 -0
- agridatasets-0.1.0/agridatasets/data/eelworm_fumigation.csv +49 -0
- agridatasets-0.1.0/agridatasets/data/egg_weight_daily.csv +241 -0
- agridatasets-0.1.0/agridatasets/data/eucalyptus_progenies.csv +73 -0
- agridatasets-0.1.0/agridatasets/data/fish_feeding.csv +34 -0
- agridatasets-0.1.0/agridatasets/data/fungicide_latin_square.csv +26 -0
- agridatasets-0.1.0/agridatasets/data/grape_uniformity.csv +156 -0
- agridatasets-0.1.0/agridatasets/data/guinea_pig_sleep.csv +31 -0
- agridatasets-0.1.0/agridatasets/data/hawaii_plant_size.csv +59 -0
- agridatasets-0.1.0/agridatasets/data/hawaii_tree_growth.csv +64 -0
- agridatasets-0.1.0/agridatasets/data/idn_rice_farms.csv +1027 -0
- agridatasets-0.1.0/agridatasets/data/kiwi_crop_design.csv +13 -0
- agridatasets-0.1.0/agridatasets/data/ladybird_fungus_spread.csv +73 -0
- agridatasets-0.1.0/agridatasets/data/lamb_births.csv +37 -0
- agridatasets-0.1.0/agridatasets/data/nitrofen_toxicity.csv +51 -0
- agridatasets-0.1.0/agridatasets/data/orange_rootstocks.csv +28 -0
- agridatasets-0.1.0/agridatasets/data/peach_uniformity.csv +145 -0
- agridatasets-0.1.0/agridatasets/data/pig_weight_gain.csv +31 -0
- agridatasets-0.1.0/agridatasets/data/plant_growth_regulator.csv +25 -0
- agridatasets-0.1.0/agridatasets/data/pollen_removal.csv +48 -0
- agridatasets-0.1.0/agridatasets/data/potato_scab_sulfur.csv +33 -0
- agridatasets-0.1.0/agridatasets/data/rabbit_body_mass.csv +142 -0
- agridatasets-0.1.0/agridatasets/data/red_wine_quality.csv +1600 -0
- agridatasets-0.1.0/agridatasets/data/rice_wheat_production.csv +107 -0
- agridatasets-0.1.0/agridatasets/data/river_deforestation.csv +57 -0
- agridatasets-0.1.0/agridatasets/data/seed_germination.csv +65 -0
- agridatasets-0.1.0/agridatasets/data/soil_munsell_colors.csv +483 -0
- agridatasets-0.1.0/agridatasets/data/soil_munsell_minerals.csv +21 -0
- agridatasets-0.1.0/agridatasets/data/soybean_cultivars.csv +41 -0
- agridatasets-0.1.0/agridatasets/data/strawberry_cross_disease.csv +145 -0
- agridatasets-0.1.0/agridatasets/data/strawberry_yield.csv +33 -0
- agridatasets-0.1.0/agridatasets/data/timber_genetics.csv +225 -0
- agridatasets-0.1.0/agridatasets/data/tomato_uniformity.csv +181 -0
- agridatasets-0.1.0/agridatasets/data/toxin_lethal_dose.csv +7 -0
- agridatasets-0.1.0/agridatasets/data/turnip_density.csv +61 -0
- agridatasets-0.1.0/agridatasets/data/us_state_soils.csv +53 -0
- agridatasets-0.1.0/agridatasets/data/wheat_bunt.csv +401 -0
- agridatasets-0.1.0/agridatasets/data/wheat_splitsplit.csv +161 -0
- agridatasets-0.1.0/agridatasets/data/willow_cutting_yield.csv +26 -0
- agridatasets-0.1.0/agridatasets/datasets.py +547 -0
- agridatasets-0.1.0/agridatasets.egg-info/PKG-INFO +146 -0
- agridatasets-0.1.0/agridatasets.egg-info/SOURCES.txt +79 -0
- agridatasets-0.1.0/agridatasets.egg-info/dependency_links.txt +1 -0
- agridatasets-0.1.0/agridatasets.egg-info/not-zip-safe +1 -0
- agridatasets-0.1.0/agridatasets.egg-info/requires.txt +12 -0
- agridatasets-0.1.0/agridatasets.egg-info/top_level.txt +2 -0
- agridatasets-0.1.0/docs/examples.md +53 -0
- agridatasets-0.1.0/docs/index.md +122 -0
- agridatasets-0.1.0/examples/basic_usage.py +41 -0
- agridatasets-0.1.0/pyproject.toml +84 -0
- agridatasets-0.1.0/setup.cfg +114 -0
- agridatasets-0.1.0/setup.py +94 -0
|
@@ -0,0 +1,13 @@
|
|
|
1
|
+
# Changelog
|
|
2
|
+
|
|
3
|
+
All notable changes to `agridatasets` will be documented in this file.
|
|
4
|
+
|
|
5
|
+
The format is based on [Keep a Changelog](https://keepachangelog.com/en/1.0.0/),
|
|
6
|
+
and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0.html).
|
|
7
|
+
|
|
8
|
+
## [0.1.0] - 2026-06-07
|
|
9
|
+
|
|
10
|
+
### Added
|
|
11
|
+
- Initial release of `agridatasets`
|
|
12
|
+
- Access to a curated collection of agricultural, agronomic, and livestock datasets for data analysis, statistical modeling, and machine learning research in Python.
|
|
13
|
+
- Basic documentation and usage examples
|
|
@@ -0,0 +1,21 @@
|
|
|
1
|
+
MIT License
|
|
2
|
+
|
|
3
|
+
Copyright (c) 2026 Renzo Caceres Rossi
|
|
4
|
+
|
|
5
|
+
Permission is hereby granted, free of charge, to any person obtaining a copy
|
|
6
|
+
of this software and associated documentation files (the "Software"), to deal
|
|
7
|
+
in the Software without restriction, including without limitation the rights
|
|
8
|
+
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
|
|
9
|
+
copies of the Software, and to permit persons to whom the Software is
|
|
10
|
+
furnished to do so, subject to the following conditions:
|
|
11
|
+
|
|
12
|
+
The above copyright notice and this permission notice shall be included in all
|
|
13
|
+
copies or substantial portions of the Software.
|
|
14
|
+
|
|
15
|
+
THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
|
16
|
+
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
|
17
|
+
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
|
|
18
|
+
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
|
19
|
+
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
|
|
20
|
+
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
|
|
21
|
+
SOFTWARE.
|
|
@@ -0,0 +1,24 @@
|
|
|
1
|
+
# Main Documentation
|
|
2
|
+
include README.md
|
|
3
|
+
include LICENSE
|
|
4
|
+
include CHANGELOG.md
|
|
5
|
+
|
|
6
|
+
# Setup / build config
|
|
7
|
+
include pyproject.toml
|
|
8
|
+
include setup.cfg
|
|
9
|
+
|
|
10
|
+
# Datasets (inside the Python package)
|
|
11
|
+
recursive-include agridatasets/data *.csv
|
|
12
|
+
|
|
13
|
+
# Additional documentation
|
|
14
|
+
recursive-include docs *.md
|
|
15
|
+
|
|
16
|
+
# Examples
|
|
17
|
+
recursive-include examples *.py
|
|
18
|
+
|
|
19
|
+
# Do not include
|
|
20
|
+
prune tests
|
|
21
|
+
prune __pycache__
|
|
22
|
+
global-exclude __pycache__/*
|
|
23
|
+
global-exclude *.py[cod]
|
|
24
|
+
global-exclude .DS_Store
|
|
@@ -0,0 +1,146 @@
|
|
|
1
|
+
Metadata-Version: 2.4
|
|
2
|
+
Name: agridatasets
|
|
3
|
+
Version: 0.1.0
|
|
4
|
+
Summary: A curated collection of agricultural, agronomic, and livestock datasets for data analysis, statistical modeling, and machine learning research. Includes crop yield trials, soil Munsell mineral classifications, field uniformity experiments, forestry genetics, plant disease infestations, pesticide efficacy, biological pest controls, dairy cattle and broiler chicken development tracking, and more from curated R packages on CRAN.
|
|
5
|
+
Home-page: https://github.com/lightbluetitan/agridatasets-py
|
|
6
|
+
Author: Renzo Caceres Rossi
|
|
7
|
+
Author-email: Renzo Caceres Rossi <arenzocaceresrossi@gmail.com>
|
|
8
|
+
Maintainer-email: Renzo Caceres Rossi <arenzocaceresrossi@gmail.com>
|
|
9
|
+
License: MIT License
|
|
10
|
+
|
|
11
|
+
Copyright (c) 2026 Renzo Caceres Rossi
|
|
12
|
+
|
|
13
|
+
Permission is hereby granted, free of charge, to any person obtaining a copy
|
|
14
|
+
of this software and associated documentation files (the "Software"), to deal
|
|
15
|
+
in the Software without restriction, including without limitation the rights
|
|
16
|
+
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
|
|
17
|
+
copies of the Software, and to permit persons to whom the Software is
|
|
18
|
+
furnished to do so, subject to the following conditions:
|
|
19
|
+
|
|
20
|
+
The above copyright notice and this permission notice shall be included in all
|
|
21
|
+
copies or substantial portions of the Software.
|
|
22
|
+
|
|
23
|
+
THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
|
24
|
+
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
|
25
|
+
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
|
|
26
|
+
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
|
27
|
+
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
|
|
28
|
+
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
|
|
29
|
+
SOFTWARE.
|
|
30
|
+
|
|
31
|
+
Project-URL: Bug Tracker, https://github.com/lightbluetitan/agridatasets-py/issues
|
|
32
|
+
Project-URL: Documentation, https://github.com/lightbluetitan/agridatasets-py
|
|
33
|
+
Project-URL: Source Code, https://github.com/lightbluetitan/agridatasets-py
|
|
34
|
+
Keywords: agriculture,agronomy,datasets,crop yield,soil science,forestry,horticulture,plant pathology,entomology,livestock,animal science,pesticides,uniform trials,split plot,latin square,experimental design,munsell color,data science,statistics,research,open science,open data,agricultural statistics
|
|
35
|
+
Classifier: Development Status :: 4 - Beta
|
|
36
|
+
Classifier: Intended Audience :: Developers
|
|
37
|
+
Classifier: Intended Audience :: Education
|
|
38
|
+
Classifier: Intended Audience :: Science/Research
|
|
39
|
+
Classifier: Topic :: Scientific/Engineering :: Information Analysis
|
|
40
|
+
Classifier: Topic :: Scientific/Engineering :: Mathematics
|
|
41
|
+
Classifier: Topic :: Software Development :: Libraries :: Python Modules
|
|
42
|
+
Classifier: Topic :: Scientific/Engineering :: Artificial Intelligence
|
|
43
|
+
Classifier: License :: OSI Approved :: MIT License
|
|
44
|
+
Classifier: Programming Language :: Python :: 3
|
|
45
|
+
Classifier: Programming Language :: Python :: 3.8
|
|
46
|
+
Classifier: Programming Language :: Python :: 3.9
|
|
47
|
+
Classifier: Programming Language :: Python :: 3.10
|
|
48
|
+
Classifier: Programming Language :: Python :: 3.11
|
|
49
|
+
Classifier: Programming Language :: Python :: 3.12
|
|
50
|
+
Classifier: Programming Language :: Python :: 3.13
|
|
51
|
+
Classifier: Programming Language :: Python :: 3 :: Only
|
|
52
|
+
Classifier: Operating System :: OS Independent
|
|
53
|
+
Classifier: Natural Language :: English
|
|
54
|
+
Requires-Python: >=3.8
|
|
55
|
+
Description-Content-Type: text/markdown
|
|
56
|
+
License-File: LICENSE
|
|
57
|
+
Requires-Dist: pandas<3.0,>=1.5
|
|
58
|
+
Provides-Extra: dev
|
|
59
|
+
Requires-Dist: pytest>=7.0; extra == "dev"
|
|
60
|
+
Requires-Dist: pytest-cov; extra == "dev"
|
|
61
|
+
Requires-Dist: black; extra == "dev"
|
|
62
|
+
Requires-Dist: flake8; extra == "dev"
|
|
63
|
+
Requires-Dist: mypy; extra == "dev"
|
|
64
|
+
Provides-Extra: docs
|
|
65
|
+
Requires-Dist: mkdocs; extra == "docs"
|
|
66
|
+
Requires-Dist: mkdocs-material; extra == "docs"
|
|
67
|
+
Dynamic: author
|
|
68
|
+
Dynamic: home-page
|
|
69
|
+
Dynamic: license-file
|
|
70
|
+
Dynamic: requires-python
|
|
71
|
+
|
|
72
|
+
# agridatasets
|
|
73
|
+
|
|
74
|
+
[License: MIT](https://opensource.org/licenses/MIT)
|
|
75
|
+
[Python 3.8+](https://www.python.org/downloads/)
|
|
76
|
+
|
|
77
|
+
The `agridatasets` package provides a curated collection of agricultural, agronomic, and livestock
|
|
78
|
+
datasets for data analysis, statistical modeling, and machine learning research. Includes crop yield
|
|
79
|
+
trials, soil Munsell mineral classifications, field uniformity experiments, forestry genetics, plant
|
|
80
|
+
disease infestations, pesticide efficacy, biological pest controls, dairy cattle and broiler chicken
|
|
81
|
+
development tracking, and more from curated R packages on CRAN.
|
|
82
|
+
|
|
83
|
+
## Installation
|
|
84
|
+
You can install the `agridatasets` package from PyPI:
|
|
85
|
+
```bash
|
|
86
|
+
pip install agridatasets
|
|
87
|
+
```
|
|
88
|
+
|
|
89
|
+
## Usage
|
|
90
|
+
```python
|
|
91
|
+
|
|
92
|
+
import agridatasets as agd
|
|
93
|
+
|
|
94
|
+
# List all available datasets
|
|
95
|
+
|
|
96
|
+
datasets = agd.list_datasets()
|
|
97
|
+
print(datasets)
|
|
98
|
+
|
|
99
|
+
# Load a specific dataset
|
|
100
|
+
|
|
101
|
+
df = agd.load_dataset('bamboo_growth')
|
|
102
|
+
print(df.head())
|
|
103
|
+
|
|
104
|
+
# Describe dataset
|
|
105
|
+
|
|
106
|
+
df_01 = agd.describe('cows_insemination')
|
|
107
|
+
print(df_01)
|
|
108
|
+
|
|
109
|
+
```
|
|
110
|
+
|
|
111
|
+
## 📊 Some Available Datasets
|
|
112
|
+
|
|
113
|
+
| Dataset | Description |
|
|
114
|
+
|---------|-------------|
|
|
115
|
+
| `bamboo_growth` | Bamboo growth observations across different geographic locations and transects. |
|
|
116
|
+
| `cows_insemination` | Cow insemination and conception records across time intervals. |
|
|
117
|
+
| `earthworm_population` | Seasonal earthworm population data, including density and biomass measurements. |
|
|
118
|
+
| `earthworm_crop_soils` | Earthworm density and biomass data from cultivated soils under different crops. |
|
|
119
|
+
| `rabbit_body_mass` | Rabbit body weight and hind foot length measurements. |
|
|
120
|
+
|
|
121
|
+
> Run `agridatasets.list_datasets()` or `agd.list_datasets()` (using `agd` as alias) to see the full list of available datasets.
|
|
122
|
+
|
|
123
|
+
## Disclaimer
|
|
124
|
+
|
|
125
|
+
The datasets included in `agridatasets` are provided strictly for educational,
|
|
126
|
+
research, and informational purposes. All datasets originate from curated R packages
|
|
127
|
+
available on CRAN and retain their original licenses and attributions.
|
|
128
|
+
|
|
129
|
+
The author of `agridatasets` makes no warranties, express or implied, regarding
|
|
130
|
+
the accuracy, completeness, or suitability of any dataset for a particular purpose.
|
|
131
|
+
Users are solely responsible for ensuring that their use of these datasets complies
|
|
132
|
+
with applicable laws, regulations, and ethical guidelines.
|
|
133
|
+
|
|
134
|
+
Any findings, conclusions, or decisions derived from the use of these datasets
|
|
135
|
+
are the sole responsibility of the user. The author shall not be held liable for
|
|
136
|
+
any direct, indirect, incidental, or consequential damages arising from the use
|
|
137
|
+
or misuse of the datasets included in this library.
|
|
138
|
+
|
|
139
|
+
For agronomic advice, crop management, or any agriculture-related decision-making purposes,
|
|
140
|
+
always consult a qualified agricultural professional or agronomist.
|
|
141
|
+
|
|
142
|
+
|
|
143
|
+
## License
|
|
144
|
+
|
|
145
|
+
The `agridatasets` library is released under the **MIT License**, which allows free use,
|
|
146
|
+
modification, and distribution. See the [LICENSE](LICENSE) file for details.
|
|
@@ -0,0 +1,75 @@
|
|
|
1
|
+
# agridatasets
|
|
2
|
+
|
|
3
|
+
[License: MIT](https://opensource.org/licenses/MIT)
|
|
4
|
+
[Python 3.8+](https://www.python.org/downloads/)
|
|
5
|
+
|
|
6
|
+
The `agridatasets` package provides a curated collection of agricultural, agronomic, and livestock
|
|
7
|
+
datasets for data analysis, statistical modeling, and machine learning research. Includes crop yield
|
|
8
|
+
trials, soil Munsell mineral classifications, field uniformity experiments, forestry genetics, plant
|
|
9
|
+
disease infestations, pesticide efficacy, biological pest controls, dairy cattle and broiler chicken
|
|
10
|
+
development tracking, and more from curated R packages on CRAN.
|
|
11
|
+
|
|
12
|
+
## Installation
|
|
13
|
+
You can install the `agridatasets` package from PyPI:
|
|
14
|
+
```bash
|
|
15
|
+
pip install agridatasets
|
|
16
|
+
```
|
|
17
|
+
|
|
18
|
+
## Usage
|
|
19
|
+
```python
|
|
20
|
+
|
|
21
|
+
import agridatasets as agd
|
|
22
|
+
|
|
23
|
+
# List all available datasets
|
|
24
|
+
|
|
25
|
+
datasets = agd.list_datasets()
|
|
26
|
+
print(datasets)
|
|
27
|
+
|
|
28
|
+
# Load a specific dataset
|
|
29
|
+
|
|
30
|
+
df = agd.load_dataset('bamboo_growth')
|
|
31
|
+
print(df.head())
|
|
32
|
+
|
|
33
|
+
# Describe dataset
|
|
34
|
+
|
|
35
|
+
df_01 = agd.describe('cows_insemination')
|
|
36
|
+
print(df_01)
|
|
37
|
+
|
|
38
|
+
```
|
|
39
|
+
|
|
40
|
+
## 📊 Some Available Datasets
|
|
41
|
+
|
|
42
|
+
| Dataset | Description |
|
|
43
|
+
|---------|-------------|
|
|
44
|
+
| `bamboo_growth` | Bamboo growth observations across different geographic locations and transects. |
|
|
45
|
+
| `cows_insemination` | Cow insemination and conception records across time intervals. |
|
|
46
|
+
| `earthworm_population` | Seasonal earthworm population data, including density and biomass measurements. |
|
|
47
|
+
| `earthworm_crop_soils` | Earthworm density and biomass data from cultivated soils under different crops. |
|
|
48
|
+
| `rabbit_body_mass` | Rabbit body weight and hind foot length measurements. |
|
|
49
|
+
|
|
50
|
+
> Run `agridatasets.list_datasets()` or `agd.list_datasets()` (using `agd` as alias) to see the full list of available datasets.
|
|
51
|
+
|
|
52
|
+
## Disclaimer
|
|
53
|
+
|
|
54
|
+
The datasets included in `agridatasets` are provided strictly for educational,
|
|
55
|
+
research, and informational purposes. All datasets originate from curated R packages
|
|
56
|
+
available on CRAN and retain their original licenses and attributions.
|
|
57
|
+
|
|
58
|
+
The author of `agridatasets` makes no warranties, express or implied, regarding
|
|
59
|
+
the accuracy, completeness, or suitability of any dataset for a particular purpose.
|
|
60
|
+
Users are solely responsible for ensuring that their use of these datasets complies
|
|
61
|
+
with applicable laws, regulations, and ethical guidelines.
|
|
62
|
+
|
|
63
|
+
Any findings, conclusions, or decisions derived from the use of these datasets
|
|
64
|
+
are the sole responsibility of the user. The author shall not be held liable for
|
|
65
|
+
any direct, indirect, incidental, or consequential damages arising from the use
|
|
66
|
+
or misuse of the datasets included in this library.
|
|
67
|
+
|
|
68
|
+
For agronomic advice, crop management, or any agriculture-related decision-making purposes,
|
|
69
|
+
always consult a qualified agricultural professional or agronomist.
|
|
70
|
+
|
|
71
|
+
|
|
72
|
+
## License
|
|
73
|
+
|
|
74
|
+
The `agridatasets` library is released under the **MIT License**, which allows free use,
|
|
75
|
+
modification, and distribution. See the [LICENSE](LICENSE) file for details.
|
|
@@ -0,0 +1,17 @@
|
|
|
1
|
+
"""
|
|
2
|
+
agridatasets
|
|
3
|
+
A Python package providing agricultural, agronomic, and livestock datasets in CSV format from curated R dataset packages.
|
|
4
|
+
"""
|
|
5
|
+
|
|
6
|
+
__version__ = "0.1.0"
|
|
7
|
+
|
|
8
|
+
from .core import load_dataset, list_datasets, describe
|
|
9
|
+
from .datasets import DATASETS
|
|
10
|
+
|
|
11
|
+
__all__ = [
|
|
12
|
+
"load_dataset",
|
|
13
|
+
"list_datasets",
|
|
14
|
+
"describe",
|
|
15
|
+
"DATASETS",
|
|
16
|
+
"__version__",
|
|
17
|
+
]
|
|
@@ -0,0 +1,40 @@
|
|
|
1
|
+
from pathlib import Path
|
|
2
|
+
import pandas as pd
|
|
3
|
+
from .datasets import DATASETS
|
|
4
|
+
|
|
5
|
+
_DATA_PATH = Path(__file__).parent / "data"
|
|
6
|
+
|
|
7
|
+
|
|
8
|
+
def list_datasets():
    """
    Return the names registered in DATASETS as an alphabetically sorted list.
    """
    names = list(DATASETS)
    names.sort()
    return names
|
|
13
|
+
|
|
14
|
+
|
|
15
|
+
def describe(name):
    """
    Look up the DATASETS entry registered under ``name`` and return it.

    Raises ValueError when ``name`` is not a key of DATASETS; the message
    lists every available dataset name.
    """
    if name in DATASETS:
        return DATASETS[name]

    available = ", ".join(list_datasets())
    raise ValueError(
        f"Dataset '{name}' not found. Available datasets: {available}"
    )
|
|
25
|
+
|
|
26
|
+
|
|
27
|
+
def load_dataset(name):
    """
    Read the CSV file registered under ``name`` into a pandas DataFrame.

    The file name comes from the "Filename" field of the DATASETS entry and
    is resolved relative to the package's data directory (_DATA_PATH).

    Raises ValueError when ``name`` is not a key of DATASETS, and
    FileNotFoundError when the registered file does not exist on disk.
    """
    if name not in DATASETS:
        available = ", ".join(list_datasets())
        raise ValueError(
            f"Dataset '{name}' not found. Available datasets: {available}"
        )

    csv_name = DATASETS[name]["Filename"]
    csv_path = _DATA_PATH / csv_name
    if csv_path.exists():
        # low_memory=False makes pandas infer column dtypes from the whole
        # file instead of chunk by chunk.
        return pd.read_csv(csv_path, low_memory=False)

    raise FileNotFoundError(f"Dataset file not found: {csv_name}")
|
|
@@ -0,0 +1,13 @@
|
|
|
1
|
+
code,s3_a,s2_a,s1_a,s1_b,s2_b,s3_b,wts
|
|
2
|
+
SoilTe,NA,NA,NA,NA,NA,NA,NA
|
|
3
|
+
CFragm,55.0,35.0,15.0,NA,NA,NA,NA
|
|
4
|
+
SoilDpt,20.0,50.0,75.0,NA,NA,NA,NA
|
|
5
|
+
CaCO3,35.0,25.0,15.0,NA,NA,NA,NA
|
|
6
|
+
Gyps,20.0,10.0,4.0,NA,NA,NA,NA
|
|
7
|
+
CECc,16.0,16.0,16.0,NA,NA,NA,NA
|
|
8
|
+
BS,19.9,20.0,35.0,NA,NA,NA,NA
|
|
9
|
+
SumBCs,2.0,3.5,5.0,NA,NA,NA,NA
|
|
10
|
+
pHH2O,5.2,5.5,6.0,8,8.2,8.5,NA
|
|
11
|
+
OC,0.7,0.8,1.2,NA,NA,NA,NA
|
|
12
|
+
ECedS,12.0,9.0,5.0,NA,NA,NA,NA
|
|
13
|
+
ESP,50.0,35.0,20.0,NA,NA,NA,NA
|
|
@@ -0,0 +1,37 @@
|
|
|
1
|
+
inoculum,gen,block,y,n
|
|
2
|
+
200,Jonagold,B1,1,5
|
|
3
|
+
200,Jonagold,B2,2,5
|
|
4
|
+
200,Jonagold,B3,1,5
|
|
5
|
+
200,Jonagold,B4,0,5
|
|
6
|
+
200,Golden,B1,1,5
|
|
7
|
+
200,Golden,B2,0,5
|
|
8
|
+
200,Golden,B3,0,5
|
|
9
|
+
200,Golden,B4,0,5
|
|
10
|
+
200,Jonathan,B1,2,5
|
|
11
|
+
200,Jonathan,B2,2,5
|
|
12
|
+
200,Jonathan,B3,2,5
|
|
13
|
+
200,Jonathan,B4,0,5
|
|
14
|
+
1000,Jonagold,B1,0,5
|
|
15
|
+
1000,Jonagold,B2,2,5
|
|
16
|
+
1000,Jonagold,B3,2,5
|
|
17
|
+
1000,Jonagold,B4,4,5
|
|
18
|
+
1000,Golden,B1,0,5
|
|
19
|
+
1000,Golden,B2,0,5
|
|
20
|
+
1000,Golden,B3,2,5
|
|
21
|
+
1000,Golden,B4,0,5
|
|
22
|
+
1000,Jonathan,B1,4,5
|
|
23
|
+
1000,Jonathan,B2,4,5
|
|
24
|
+
1000,Jonathan,B3,4,5
|
|
25
|
+
1000,Jonathan,B4,0,5
|
|
26
|
+
5000,Jonagold,B1,5,5
|
|
27
|
+
5000,Jonagold,B2,5,5
|
|
28
|
+
5000,Jonagold,B3,4,5
|
|
29
|
+
5000,Jonagold,B4,5,5
|
|
30
|
+
5000,Golden,B1,5,5
|
|
31
|
+
5000,Golden,B2,4,5
|
|
32
|
+
5000,Golden,B3,3,5
|
|
33
|
+
5000,Golden,B4,5,5
|
|
34
|
+
5000,Jonathan,B1,5,5
|
|
35
|
+
5000,Jonathan,B2,0,5
|
|
36
|
+
5000,Jonathan,B3,3,5
|
|
37
|
+
5000,Jonathan,B4,5,5
|
|
@@ -0,0 +1,199 @@
|
|
|
1
|
+
row,col,yield
|
|
2
|
+
1,1,235
|
|
3
|
+
2,1,348
|
|
4
|
+
3,1,NA
|
|
5
|
+
4,1,306
|
|
6
|
+
5,1,345
|
|
7
|
+
6,1,275
|
|
8
|
+
7,1,296
|
|
9
|
+
8,1,273
|
|
10
|
+
9,1,315
|
|
11
|
+
10,1,283
|
|
12
|
+
11,1,322
|
|
13
|
+
12,1,339
|
|
14
|
+
13,1,340
|
|
15
|
+
14,1,332
|
|
16
|
+
15,1,414
|
|
17
|
+
16,1,157
|
|
18
|
+
17,1,447
|
|
19
|
+
18,1,482
|
|
20
|
+
1,2,273
|
|
21
|
+
2,2,351
|
|
22
|
+
3,2,322
|
|
23
|
+
4,2,267
|
|
24
|
+
5,2,276
|
|
25
|
+
6,2,256
|
|
26
|
+
7,2,248
|
|
27
|
+
8,2,268
|
|
28
|
+
9,2,291
|
|
29
|
+
10,2,223
|
|
30
|
+
11,2,243
|
|
31
|
+
12,2,323
|
|
32
|
+
13,2,257
|
|
33
|
+
14,2,315
|
|
34
|
+
15,2,320
|
|
35
|
+
16,2,267
|
|
36
|
+
17,2,359
|
|
37
|
+
18,2,289
|
|
38
|
+
1,3,281
|
|
39
|
+
2,3,212
|
|
40
|
+
3,3,274
|
|
41
|
+
4,3,288
|
|
42
|
+
5,3,323
|
|
43
|
+
6,3,330
|
|
44
|
+
7,3,201
|
|
45
|
+
8,3,179
|
|
46
|
+
9,3,230
|
|
47
|
+
10,3,260
|
|
48
|
+
11,3,214
|
|
49
|
+
12,3,308
|
|
50
|
+
13,3,NA
|
|
51
|
+
14,3,NA
|
|
52
|
+
15,3,337
|
|
53
|
+
16,3,257
|
|
54
|
+
17,3,341
|
|
55
|
+
18,3,210
|
|
56
|
+
1,4,240
|
|
57
|
+
2,4,331
|
|
58
|
+
3,4,224
|
|
59
|
+
4,4,229
|
|
60
|
+
5,4,130
|
|
61
|
+
6,4,230
|
|
62
|
+
7,4,227
|
|
63
|
+
8,4,270
|
|
64
|
+
9,4,258
|
|
65
|
+
10,4,250
|
|
66
|
+
11,4,263
|
|
67
|
+
12,4,253
|
|
68
|
+
13,4,197
|
|
69
|
+
14,4,NA
|
|
70
|
+
15,4,317
|
|
71
|
+
16,4,244
|
|
72
|
+
17,4,233
|
|
73
|
+
18,4,248
|
|
74
|
+
1,5,272
|
|
75
|
+
2,5,288
|
|
76
|
+
3,5,287
|
|
77
|
+
4,5,232
|
|
78
|
+
5,5,216
|
|
79
|
+
6,5,227
|
|
80
|
+
7,5,205
|
|
81
|
+
8,5,213
|
|
82
|
+
9,5,240
|
|
83
|
+
10,5,216
|
|
84
|
+
11,5,224
|
|
85
|
+
12,5,286
|
|
86
|
+
13,5,237
|
|
87
|
+
14,5,313
|
|
88
|
+
15,5,336
|
|
89
|
+
16,5,187
|
|
90
|
+
17,5,258
|
|
91
|
+
18,5,221
|
|
92
|
+
1,6,288
|
|
93
|
+
2,6,270
|
|
94
|
+
3,6,242
|
|
95
|
+
4,6,202
|
|
96
|
+
5,6,248
|
|
97
|
+
6,6,239
|
|
98
|
+
7,6,135
|
|
99
|
+
8,6,239
|
|
100
|
+
9,6,182
|
|
101
|
+
10,6,276
|
|
102
|
+
11,6,295
|
|
103
|
+
12,6,267
|
|
104
|
+
13,6,217
|
|
105
|
+
14,6,NA
|
|
106
|
+
15,6,279
|
|
107
|
+
16,6,167
|
|
108
|
+
17,6,193
|
|
109
|
+
18,6,335
|
|
110
|
+
1,7,299
|
|
111
|
+
2,7,212
|
|
112
|
+
3,7,238
|
|
113
|
+
4,7,187
|
|
114
|
+
5,7,258
|
|
115
|
+
6,7,189
|
|
116
|
+
7,7,173
|
|
117
|
+
8,7,118
|
|
118
|
+
9,7,250
|
|
119
|
+
10,7,183
|
|
120
|
+
11,7,300
|
|
121
|
+
12,7,259
|
|
122
|
+
13,7,212
|
|
123
|
+
14,7,218
|
|
124
|
+
15,7,309
|
|
125
|
+
16,7,159
|
|
126
|
+
17,7,215
|
|
127
|
+
18,7,234
|
|
128
|
+
1,8,255
|
|
129
|
+
2,8,276
|
|
130
|
+
3,8,195
|
|
131
|
+
4,8,217
|
|
132
|
+
5,8,191
|
|
133
|
+
6,8,200
|
|
134
|
+
7,8,236
|
|
135
|
+
8,8,187
|
|
136
|
+
9,8,191
|
|
137
|
+
10,8,212
|
|
138
|
+
11,8,307
|
|
139
|
+
12,8,310
|
|
140
|
+
13,8,NA
|
|
141
|
+
14,8,NA
|
|
142
|
+
15,8,241
|
|
143
|
+
16,8,194
|
|
144
|
+
17,8,242
|
|
145
|
+
18,8,139
|
|
146
|
+
1,9,264
|
|
147
|
+
2,9,231
|
|
148
|
+
3,9,207
|
|
149
|
+
4,9,174
|
|
150
|
+
5,9,145
|
|
151
|
+
6,9,230
|
|
152
|
+
7,9,240
|
|
153
|
+
8,9,214
|
|
154
|
+
9,9,183
|
|
155
|
+
10,9,245
|
|
156
|
+
11,9,NA
|
|
157
|
+
12,9,278
|
|
158
|
+
13,9,285
|
|
159
|
+
14,9,219
|
|
160
|
+
15,9,366
|
|
161
|
+
16,9,207
|
|
162
|
+
17,9,290
|
|
163
|
+
18,9,192
|
|
164
|
+
1,10,225
|
|
165
|
+
2,10,NA
|
|
166
|
+
3,10,226
|
|
167
|
+
4,10,186
|
|
168
|
+
5,10,252
|
|
169
|
+
6,10,255
|
|
170
|
+
7,10,166
|
|
171
|
+
8,10,220
|
|
172
|
+
9,10,153
|
|
173
|
+
10,10,239
|
|
174
|
+
11,10,279
|
|
175
|
+
12,10,234
|
|
176
|
+
13,10,292
|
|
177
|
+
14,10,NA
|
|
178
|
+
15,10,NA
|
|
179
|
+
16,10,222
|
|
180
|
+
17,10,311
|
|
181
|
+
18,10,311
|
|
182
|
+
1,11,279
|
|
183
|
+
2,11,247
|
|
184
|
+
3,11,152
|
|
185
|
+
4,11,197
|
|
186
|
+
5,11,215
|
|
187
|
+
6,11,276
|
|
188
|
+
7,11,182
|
|
189
|
+
8,11,200
|
|
190
|
+
9,11,188
|
|
191
|
+
10,11,245
|
|
192
|
+
11,11,201
|
|
193
|
+
12,11,242
|
|
194
|
+
13,11,221
|
|
195
|
+
14,11,246
|
|
196
|
+
15,11,262
|
|
197
|
+
16,11,271
|
|
198
|
+
17,11,227
|
|
199
|
+
18,11,203
|