anemoi-utils 0.4.23__tar.gz → 0.4.24__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of anemoi-utils might be problematic. Click here for more details.
- {anemoi_utils-0.4.23 → anemoi_utils-0.4.24}/.github/CODEOWNERS +0 -1
- anemoi_utils-0.4.24/.github/pull_request_template.md +13 -0
- {anemoi_utils-0.4.23 → anemoi_utils-0.4.24}/.github/workflows/downstream-ci-hpc.yml +1 -1
- {anemoi_utils-0.4.23 → anemoi_utils-0.4.24}/.github/workflows/pr-conventional-commit.yml +1 -1
- {anemoi_utils-0.4.23 → anemoi_utils-0.4.24}/.github/workflows/pr-label-conventional-commits.yml +1 -1
- {anemoi_utils-0.4.23 → anemoi_utils-0.4.24}/.github/workflows/pr-label-file-based.yml +1 -1
- {anemoi_utils-0.4.23 → anemoi_utils-0.4.24}/.github/workflows/pr-label-public.yml +1 -1
- {anemoi_utils-0.4.23 → anemoi_utils-0.4.24}/.github/workflows/python-pull-request.yml +1 -1
- {anemoi_utils-0.4.23 → anemoi_utils-0.4.24}/.github/workflows/readthedocs-pr-update.yml +1 -1
- {anemoi_utils-0.4.23 → anemoi_utils-0.4.24}/.gitignore +7 -1
- {anemoi_utils-0.4.23 → anemoi_utils-0.4.24}/.pre-commit-config.yaml +3 -2
- {anemoi_utils-0.4.23 → anemoi_utils-0.4.24}/.release-please-config.json +6 -1
- anemoi_utils-0.4.24/.release-please-manifest.json +3 -0
- {anemoi_utils-0.4.23 → anemoi_utils-0.4.24}/CHANGELOG.md +8 -0
- {anemoi_utils-0.4.23 → anemoi_utils-0.4.24}/PKG-INFO +1 -1
- {anemoi_utils-0.4.23 → anemoi_utils-0.4.24}/src/anemoi/utils/_version.py +2 -2
- {anemoi_utils-0.4.23 → anemoi_utils-0.4.24}/src/anemoi/utils/remote/s3.py +107 -26
- {anemoi_utils-0.4.23 → anemoi_utils-0.4.24}/src/anemoi_utils.egg-info/PKG-INFO +1 -1
- {anemoi_utils-0.4.23 → anemoi_utils-0.4.24}/src/anemoi_utils.egg-info/SOURCES.txt +0 -1
- anemoi_utils-0.4.23/.github/pull_request_template.md +0 -46
- anemoi_utils-0.4.23/.github/release.yml +0 -23
- anemoi_utils-0.4.23/.release-please-manifest.json +0 -3
- {anemoi_utils-0.4.23 → anemoi_utils-0.4.24}/.gitattributes +0 -0
- {anemoi_utils-0.4.23 → anemoi_utils-0.4.24}/.github/ci-hpc-config.yml +0 -0
- {anemoi_utils-0.4.23 → anemoi_utils-0.4.24}/.github/dependabot.yml +0 -0
- {anemoi_utils-0.4.23 → anemoi_utils-0.4.24}/.github/labeler.yml +0 -0
- {anemoi_utils-0.4.23 → anemoi_utils-0.4.24}/.github/workflows/python-publish.yml +0 -0
- {anemoi_utils-0.4.23 → anemoi_utils-0.4.24}/.github/workflows/release-please.yml +0 -0
- {anemoi_utils-0.4.23 → anemoi_utils-0.4.24}/.readthedocs.yaml +0 -0
- {anemoi_utils-0.4.23 → anemoi_utils-0.4.24}/CONTRIBUTORS.md +0 -0
- {anemoi_utils-0.4.23 → anemoi_utils-0.4.24}/LICENSE +0 -0
- {anemoi_utils-0.4.23 → anemoi_utils-0.4.24}/README.md +0 -0
- {anemoi_utils-0.4.23 → anemoi_utils-0.4.24}/docs/Makefile +0 -0
- {anemoi_utils-0.4.23 → anemoi_utils-0.4.24}/docs/_static/logo.png +0 -0
- {anemoi_utils-0.4.23 → anemoi_utils-0.4.24}/docs/_static/style.css +0 -0
- {anemoi_utils-0.4.23 → anemoi_utils-0.4.24}/docs/_templates/.gitkeep +0 -0
- {anemoi_utils-0.4.23 → anemoi_utils-0.4.24}/docs/_templates/apidoc/package.rst.jinja +0 -0
- {anemoi_utils-0.4.23 → anemoi_utils-0.4.24}/docs/conf.py +0 -0
- {anemoi_utils-0.4.23 → anemoi_utils-0.4.24}/docs/index.rst +0 -0
- {anemoi_utils-0.4.23 → anemoi_utils-0.4.24}/docs/installing.rst +0 -0
- {anemoi_utils-0.4.23 → anemoi_utils-0.4.24}/docs/modules/checkpoints.rst +0 -0
- {anemoi_utils-0.4.23 → anemoi_utils-0.4.24}/docs/modules/config.rst +0 -0
- {anemoi_utils-0.4.23 → anemoi_utils-0.4.24}/docs/modules/dates.rst +0 -0
- {anemoi_utils-0.4.23 → anemoi_utils-0.4.24}/docs/modules/grib.rst +0 -0
- {anemoi_utils-0.4.23 → anemoi_utils-0.4.24}/docs/modules/humanize.rst +0 -0
- {anemoi_utils-0.4.23 → anemoi_utils-0.4.24}/docs/modules/provenance.rst +0 -0
- {anemoi_utils-0.4.23 → anemoi_utils-0.4.24}/docs/modules/s3.rst +0 -0
- {anemoi_utils-0.4.23 → anemoi_utils-0.4.24}/docs/modules/testing.rst +0 -0
- {anemoi_utils-0.4.23 → anemoi_utils-0.4.24}/docs/modules/text.rst +0 -0
- {anemoi_utils-0.4.23 → anemoi_utils-0.4.24}/docs/scripts/api_build.sh +0 -0
- {anemoi_utils-0.4.23 → anemoi_utils-0.4.24}/pyproject.toml +0 -0
- {anemoi_utils-0.4.23 → anemoi_utils-0.4.24}/setup.cfg +0 -0
- {anemoi_utils-0.4.23 → anemoi_utils-0.4.24}/src/anemoi/utils/__init__.py +0 -0
- {anemoi_utils-0.4.23 → anemoi_utils-0.4.24}/src/anemoi/utils/__main__.py +0 -0
- {anemoi_utils-0.4.23 → anemoi_utils-0.4.24}/src/anemoi/utils/caching.py +0 -0
- {anemoi_utils-0.4.23 → anemoi_utils-0.4.24}/src/anemoi/utils/checkpoints.py +0 -0
- {anemoi_utils-0.4.23 → anemoi_utils-0.4.24}/src/anemoi/utils/cli.py +0 -0
- {anemoi_utils-0.4.23 → anemoi_utils-0.4.24}/src/anemoi/utils/commands/__init__.py +0 -0
- {anemoi_utils-0.4.23 → anemoi_utils-0.4.24}/src/anemoi/utils/commands/config.py +0 -0
- {anemoi_utils-0.4.23 → anemoi_utils-0.4.24}/src/anemoi/utils/commands/requests.py +0 -0
- {anemoi_utils-0.4.23 → anemoi_utils-0.4.24}/src/anemoi/utils/compatibility.py +0 -0
- {anemoi_utils-0.4.23 → anemoi_utils-0.4.24}/src/anemoi/utils/config.py +0 -0
- {anemoi_utils-0.4.23 → anemoi_utils-0.4.24}/src/anemoi/utils/dates.py +0 -0
- {anemoi_utils-0.4.23 → anemoi_utils-0.4.24}/src/anemoi/utils/devtools.py +0 -0
- {anemoi_utils-0.4.23 → anemoi_utils-0.4.24}/src/anemoi/utils/grib.py +0 -0
- {anemoi_utils-0.4.23 → anemoi_utils-0.4.24}/src/anemoi/utils/grids.py +0 -0
- {anemoi_utils-0.4.23 → anemoi_utils-0.4.24}/src/anemoi/utils/hindcasts.py +0 -0
- {anemoi_utils-0.4.23 → anemoi_utils-0.4.24}/src/anemoi/utils/humanize.py +0 -0
- {anemoi_utils-0.4.23 → anemoi_utils-0.4.24}/src/anemoi/utils/logs.py +0 -0
- {anemoi_utils-0.4.23 → anemoi_utils-0.4.24}/src/anemoi/utils/mars/__init__.py +0 -0
- {anemoi_utils-0.4.23 → anemoi_utils-0.4.24}/src/anemoi/utils/mars/mars.yaml +0 -0
- {anemoi_utils-0.4.23 → anemoi_utils-0.4.24}/src/anemoi/utils/mars/requests.py +0 -0
- {anemoi_utils-0.4.23 → anemoi_utils-0.4.24}/src/anemoi/utils/provenance.py +0 -0
- {anemoi_utils-0.4.23 → anemoi_utils-0.4.24}/src/anemoi/utils/registry.py +0 -0
- {anemoi_utils-0.4.23 → anemoi_utils-0.4.24}/src/anemoi/utils/remote/__init__.py +0 -0
- {anemoi_utils-0.4.23 → anemoi_utils-0.4.24}/src/anemoi/utils/remote/ssh.py +0 -0
- {anemoi_utils-0.4.23 → anemoi_utils-0.4.24}/src/anemoi/utils/rules.py +0 -0
- {anemoi_utils-0.4.23 → anemoi_utils-0.4.24}/src/anemoi/utils/s3.py +0 -0
- {anemoi_utils-0.4.23 → anemoi_utils-0.4.24}/src/anemoi/utils/sanitise.py +0 -0
- {anemoi_utils-0.4.23 → anemoi_utils-0.4.24}/src/anemoi/utils/sanitize.py +0 -0
- {anemoi_utils-0.4.23 → anemoi_utils-0.4.24}/src/anemoi/utils/schemas/__init__.py +0 -0
- {anemoi_utils-0.4.23 → anemoi_utils-0.4.24}/src/anemoi/utils/schemas/errors.py +0 -0
- {anemoi_utils-0.4.23 → anemoi_utils-0.4.24}/src/anemoi/utils/testing.py +0 -0
- {anemoi_utils-0.4.23 → anemoi_utils-0.4.24}/src/anemoi/utils/text.py +0 -0
- {anemoi_utils-0.4.23 → anemoi_utils-0.4.24}/src/anemoi/utils/timer.py +0 -0
- {anemoi_utils-0.4.23 → anemoi_utils-0.4.24}/src/anemoi_utils.egg-info/dependency_links.txt +0 -0
- {anemoi_utils-0.4.23 → anemoi_utils-0.4.24}/src/anemoi_utils.egg-info/entry_points.txt +0 -0
- {anemoi_utils-0.4.23 → anemoi_utils-0.4.24}/src/anemoi_utils.egg-info/requires.txt +0 -0
- {anemoi_utils-0.4.23 → anemoi_utils-0.4.24}/src/anemoi_utils.egg-info/top_level.txt +0 -0
- {anemoi_utils-0.4.23 → anemoi_utils-0.4.24}/tests/test-transfer-data/directory/b/c/x +0 -0
- {anemoi_utils-0.4.23 → anemoi_utils-0.4.24}/tests/test-transfer-data/directory/b/y +0 -0
- {anemoi_utils-0.4.23 → anemoi_utils-0.4.24}/tests/test-transfer-data/directory/exotic filename ;^/"'[=.,#]()/303/252/303/274/303/247/303/262/342/234/205.txt" +0 -0
- {anemoi_utils-0.4.23 → anemoi_utils-0.4.24}/tests/test-transfer-data/directory/z +0 -0
- {anemoi_utils-0.4.23 → anemoi_utils-0.4.24}/tests/test-transfer-data/file +0 -0
- {anemoi_utils-0.4.23 → anemoi_utils-0.4.24}/tests/test_caching.py +0 -0
- {anemoi_utils-0.4.23 → anemoi_utils-0.4.24}/tests/test_compatibility.py +0 -0
- {anemoi_utils-0.4.23 → anemoi_utils-0.4.24}/tests/test_dates.py +0 -0
- {anemoi_utils-0.4.23 → anemoi_utils-0.4.24}/tests/test_frequency.py +0 -0
- {anemoi_utils-0.4.23 → anemoi_utils-0.4.24}/tests/test_grids.py +0 -0
- {anemoi_utils-0.4.23 → anemoi_utils-0.4.24}/tests/test_provenance.py +0 -0
- {anemoi_utils-0.4.23 → anemoi_utils-0.4.24}/tests/test_remote.py +0 -0
- {anemoi_utils-0.4.23 → anemoi_utils-0.4.24}/tests/test_sanetise.py +0 -0
- {anemoi_utils-0.4.23 → anemoi_utils-0.4.24}/tests/test_utils.py +0 -0
|
@@ -0,0 +1,13 @@
|
|
|
1
|
+
## Description
|
|
2
|
+
<!-- What issue or task does this change relate to? -->
|
|
3
|
+
|
|
4
|
+
## What problem does this change solve?
|
|
5
|
+
<!-- Describe if it's a bugfix, new feature, doc update, or breaking change -->
|
|
6
|
+
|
|
7
|
+
## What issue or task does this change relate to?
|
|
8
|
+
<!-- link to Issue Number -->
|
|
9
|
+
|
|
10
|
+
## Additional notes ##
|
|
11
|
+
<!-- Include any additional information, caveats, or considerations that the reviewer should be aware of. -->
|
|
12
|
+
|
|
13
|
+
***As a contributor to the Anemoi framework, please ensure that your changes include unit tests, updates to any affected dependencies and documentation, and have been tested in a parallel setting (i.e., with multiple GPUs). As a reviewer, you are also responsible for verifying these aspects and requesting changes if they are not adequately addressed. For guidelines about those please refer to https://anemoi.readthedocs.io/en/latest/***
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
# This workflow triggers tests on dependent packages.
|
|
2
2
|
# The dependency tree itself is defined in ecmwf/downstream-ci/
|
|
3
|
-
name: Test downstream dependent packages
|
|
3
|
+
name: Test downstream dependent packages
|
|
4
4
|
|
|
5
5
|
on:
|
|
6
6
|
# Trigger the workflow on push to main or develop, except tag creation
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
# This workflow assigns labels to a pull request based on the files changed in the PR.
|
|
2
2
|
# The labels are defined in the `.github/labels.yml` file.
|
|
3
|
-
name: "[
|
|
3
|
+
name: "[PR] Label File-based"
|
|
4
4
|
on:
|
|
5
5
|
pull_request_target:
|
|
6
6
|
types: [opened, synchronize]
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
# This workflow adds a link to the experimental documentation build to the PR.
|
|
2
2
|
# This does NOT trigger a build of the documentation, this is handled through webhooks.
|
|
3
|
-
name: Read the Docs
|
|
3
|
+
name: "[PR] Read the Docs Preview"
|
|
4
4
|
on:
|
|
5
5
|
pull_request_target:
|
|
6
6
|
types:
|
|
@@ -94,6 +94,11 @@ dmypy.json
|
|
|
94
94
|
*.csv
|
|
95
95
|
*.xlsx
|
|
96
96
|
*.xls
|
|
97
|
+
*.json
|
|
98
|
+
*.txt
|
|
99
|
+
*.zip
|
|
100
|
+
*.db
|
|
101
|
+
*.tgz
|
|
97
102
|
|
|
98
103
|
# ML artifacts
|
|
99
104
|
wandb/
|
|
@@ -120,7 +125,8 @@ tmp/
|
|
|
120
125
|
temp/
|
|
121
126
|
logs/
|
|
122
127
|
_dev/
|
|
123
|
-
|
|
128
|
+
_api/
|
|
129
|
+
./outputs
|
|
124
130
|
*tmp_data/
|
|
125
131
|
|
|
126
132
|
# Project specific
|
|
@@ -39,8 +39,9 @@ repos:
|
|
|
39
39
|
- -l 120
|
|
40
40
|
- --force-single-line-imports
|
|
41
41
|
- --profile black
|
|
42
|
+
- --project anemoi
|
|
42
43
|
- repo: https://github.com/astral-sh/ruff-pre-commit
|
|
43
|
-
rev: v0.11.
|
|
44
|
+
rev: v0.11.12
|
|
44
45
|
hooks:
|
|
45
46
|
- id: ruff
|
|
46
47
|
args:
|
|
@@ -64,7 +65,7 @@ repos:
|
|
|
64
65
|
- id: docconvert
|
|
65
66
|
args: ["numpy"]
|
|
66
67
|
- repo: https://github.com/tox-dev/pyproject-fmt
|
|
67
|
-
rev: "v2.
|
|
68
|
+
rev: "v2.6.0"
|
|
68
69
|
hooks:
|
|
69
70
|
- id: pyproject-fmt
|
|
70
71
|
- repo: https://github.com/jshwi/docsig # Check docstrings against function sig
|
|
@@ -10,11 +10,16 @@
|
|
|
10
10
|
"draft-pull-request": true,
|
|
11
11
|
"pull-request-title-pattern": "chore${scope}: Release${component} ${version}",
|
|
12
12
|
"pull-request-header": ":robot: Automated Release PR\n\nThis PR was created by `release-please` to prepare the next release. Once merged:\n\n1. A new version tag will be created\n2. A GitHub release will be published\n3. The changelog will be updated\n\nChanges to be included in the next release:",
|
|
13
|
-
"pull-request-footer": "> [!IMPORTANT]\n> :warning: Merging this PR will:\n> - Create a new release\n> - Trigger deployment pipelines\n> - Update package versions\n\n **Before merging:**\n - Ensure all tests pass\n - Review the changelog carefully\n - Get required approvals\n\n [Release-please documentation](https://github.com/googleapis/release-please)",
|
|
13
|
+
"pull-request-footer": "> [!IMPORTANT]\n> Please do not change the PR title, manifest file, or any other automatically generated content in this PR unless you understand the implications. Changes here can break the release process.\n> :warning: Merging this PR will:\n> - Create a new release\n> - Trigger deployment pipelines\n> - Update package versions\n\n **Before merging:**\n - Ensure all tests pass\n - Review the changelog carefully\n - Get required approvals\n\n [Release-please documentation](https://github.com/googleapis/release-please)",
|
|
14
14
|
"packages": {
|
|
15
15
|
".": {
|
|
16
16
|
"package-name": "anemoi-utils"
|
|
17
17
|
}
|
|
18
18
|
},
|
|
19
|
+
"plugins": [
|
|
20
|
+
{
|
|
21
|
+
"type": "sentence-case"
|
|
22
|
+
}
|
|
23
|
+
],
|
|
19
24
|
"$schema": "https://raw.githubusercontent.com/googleapis/release-please/main/schemas/config.json"
|
|
20
25
|
}
|
|
@@ -8,6 +8,14 @@ and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0
|
|
|
8
8
|
Please add your functional changes to the appropriate section in the PR.
|
|
9
9
|
Keep it human-readable, your future self will thank you!
|
|
10
10
|
|
|
11
|
+
## [0.4.24](https://github.com/ecmwf/anemoi-utils/compare/0.4.23...0.4.24) (2025-06-06)
|
|
12
|
+
|
|
13
|
+
|
|
14
|
+
### Features
|
|
15
|
+
|
|
16
|
+
* Add s3.object_exists() function ([#157](https://github.com/ecmwf/anemoi-utils/issues/157)) ([d898811](https://github.com/ecmwf/anemoi-utils/commit/d8988116320265dc6dfe467c57e0b6f29f76a2c1))
|
|
17
|
+
* Allow wildcard in config for matching s3 buckets to end points ([#160](https://github.com/ecmwf/anemoi-utils/issues/160)) ([ab20da7](https://github.com/ecmwf/anemoi-utils/commit/ab20da7e9497435a7183705b02dcbb7317d2700b))
|
|
18
|
+
|
|
11
19
|
## [0.4.23](https://github.com/ecmwf/anemoi-utils/compare/0.4.22...0.4.23) (2025-05-20)
|
|
12
20
|
|
|
13
21
|
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
Metadata-Version: 2.4
|
|
2
2
|
Name: anemoi-utils
|
|
3
|
-
Version: 0.4.23
|
|
3
|
+
Version: 0.4.24
|
|
4
4
|
Summary: A package to hold various functions to support training of ML models on ECMWF data.
|
|
5
5
|
Author-email: "European Centre for Medium-Range Weather Forecasts (ECMWF)" <software.support@ecmwf.int>
|
|
6
6
|
License: Apache License
|
|
@@ -24,6 +24,7 @@ the `~/.config/anemoi/settings.toml`
|
|
|
24
24
|
or `~/.config/anemoi/settings-secrets.toml` files.
|
|
25
25
|
"""
|
|
26
26
|
|
|
27
|
+
import fnmatch
|
|
27
28
|
import logging
|
|
28
29
|
import os
|
|
29
30
|
import threading
|
|
@@ -38,15 +39,15 @@ from ..humanize import bytes_to_human
|
|
|
38
39
|
from . import BaseDownload
|
|
39
40
|
from . import BaseUpload
|
|
40
41
|
|
|
41
|
-
|
|
42
|
-
|
|
42
|
+
LOG = logging.getLogger(__name__)
|
|
43
|
+
SECRETS = ["aws_access_key_id", "aws_secret_access_key"]
|
|
43
44
|
|
|
44
45
|
# s3_clients are not thread-safe, so we need to create a new client for each thread
|
|
45
46
|
|
|
46
47
|
thread_local = threading.local()
|
|
47
48
|
|
|
48
49
|
|
|
49
|
-
def s3_client(bucket: str, region: str = None) -> Any:
|
|
50
|
+
def s3_client(bucket: str, *, region: str = None, service: str = "s3") -> Any:
|
|
50
51
|
"""Get an S3 client for the specified bucket and region.
|
|
51
52
|
|
|
52
53
|
Parameters
|
|
@@ -55,6 +56,8 @@ def s3_client(bucket: str, region: str = None) -> Any:
|
|
|
55
56
|
The name of the S3 bucket.
|
|
56
57
|
region : str, optional
|
|
57
58
|
The AWS region of the S3 bucket.
|
|
59
|
+
service : str, optional
|
|
60
|
+
The AWS service to use, default is "s3".
|
|
58
61
|
|
|
59
62
|
Returns
|
|
60
63
|
-------
|
|
@@ -68,7 +71,7 @@ def s3_client(bucket: str, region: str = None) -> Any:
|
|
|
68
71
|
if not hasattr(thread_local, "s3_clients"):
|
|
69
72
|
thread_local.s3_clients = {}
|
|
70
73
|
|
|
71
|
-
key = f"{bucket}-{region}"
|
|
74
|
+
key = f"{bucket}-{region}-{service}"
|
|
72
75
|
|
|
73
76
|
if key in thread_local.s3_clients:
|
|
74
77
|
return thread_local.s3_clients[key]
|
|
@@ -96,17 +99,27 @@ def s3_client(bucket: str, region: str = None) -> Any:
|
|
|
96
99
|
# We may be accessing a different S3 compatible service
|
|
97
100
|
# Use anemoi.config to get the configuration
|
|
98
101
|
|
|
99
|
-
|
|
100
|
-
|
|
102
|
+
region = "unknown-region"
|
|
103
|
+
|
|
104
|
+
options = {"region_name": region}
|
|
105
|
+
config = load_config(secrets=SECRETS)
|
|
101
106
|
|
|
102
107
|
cfg = config.get("object-storage", {})
|
|
108
|
+
candidate = None
|
|
103
109
|
for k, v in cfg.items():
|
|
104
110
|
if isinstance(v, (str, int, float, bool)):
|
|
105
111
|
options[k] = v
|
|
106
112
|
|
|
107
|
-
|
|
108
|
-
|
|
109
|
-
|
|
113
|
+
if isinstance(v, dict):
|
|
114
|
+
if fnmatch.fnmatch(bucket, k):
|
|
115
|
+
if candidate is not None:
|
|
116
|
+
raise ValueError(f"Multiple object storage configurations match {bucket}: {candidate} and {k}")
|
|
117
|
+
candidate = k
|
|
118
|
+
|
|
119
|
+
if candidate is not None:
|
|
120
|
+
for k, v in cfg.get(candidate, {}).items():
|
|
121
|
+
if isinstance(v, (str, int, float, bool)):
|
|
122
|
+
options[k] = v
|
|
110
123
|
|
|
111
124
|
type = options.pop("type", "s3")
|
|
112
125
|
if type != "s3":
|
|
@@ -115,11 +128,27 @@ def s3_client(bucket: str, region: str = None) -> Any:
|
|
|
115
128
|
if "config" in options:
|
|
116
129
|
boto3_config.update(options["config"])
|
|
117
130
|
del options["config"]
|
|
118
|
-
from botocore.client import Config
|
|
119
131
|
|
|
120
132
|
options["config"] = Config(**boto3_config)
|
|
121
133
|
|
|
122
|
-
|
|
134
|
+
def _(options):
|
|
135
|
+
|
|
136
|
+
def __(k, v):
|
|
137
|
+
if k in SECRETS:
|
|
138
|
+
return "***"
|
|
139
|
+
return v
|
|
140
|
+
|
|
141
|
+
if isinstance(options, dict):
|
|
142
|
+
return {k: __(k, v) for k, v in options.items()}
|
|
143
|
+
|
|
144
|
+
if isinstance(options, list):
|
|
145
|
+
return [_(o) for o in options]
|
|
146
|
+
|
|
147
|
+
return options
|
|
148
|
+
|
|
149
|
+
LOG.info(f"Using S3 options: {_(options)}")
|
|
150
|
+
|
|
151
|
+
thread_local.s3_clients[key] = boto3.client(service, **options)
|
|
123
152
|
|
|
124
153
|
return thread_local.s3_clients[key]
|
|
125
154
|
|
|
@@ -215,7 +244,7 @@ class S3Upload(BaseUpload):
|
|
|
215
244
|
size = os.path.getsize(source)
|
|
216
245
|
|
|
217
246
|
if verbosity > 0:
|
|
218
|
-
|
|
247
|
+
LOG.info(f"{self.action} {source} to {target} ({bytes_to_human(size)})")
|
|
219
248
|
|
|
220
249
|
try:
|
|
221
250
|
results = s3.head_object(Bucket=bucket, Key=key)
|
|
@@ -227,7 +256,7 @@ class S3Upload(BaseUpload):
|
|
|
227
256
|
|
|
228
257
|
if remote_size is not None:
|
|
229
258
|
if remote_size != size:
|
|
230
|
-
|
|
259
|
+
LOG.warning(
|
|
231
260
|
f"{target} already exists, but with different size, re-uploading (remote={remote_size}, local={size})"
|
|
232
261
|
)
|
|
233
262
|
elif resume:
|
|
@@ -400,7 +429,7 @@ class S3Download(BaseDownload):
|
|
|
400
429
|
size = int(response["ContentLength"])
|
|
401
430
|
|
|
402
431
|
if verbosity > 0:
|
|
403
|
-
|
|
432
|
+
LOG.info(f"{self.action} {source} to {target} ({bytes_to_human(size)})")
|
|
404
433
|
|
|
405
434
|
if overwrite:
|
|
406
435
|
resume = False
|
|
@@ -409,7 +438,7 @@ class S3Download(BaseDownload):
|
|
|
409
438
|
if os.path.exists(target):
|
|
410
439
|
local_size = os.path.getsize(target)
|
|
411
440
|
if local_size != size:
|
|
412
|
-
|
|
441
|
+
LOG.warning(
|
|
413
442
|
f"{target} already with different size, re-downloading (remote={size}, local={local_size})"
|
|
414
443
|
)
|
|
415
444
|
else:
|
|
@@ -464,7 +493,7 @@ def _list_objects(target: str, batch: bool = False) -> Iterable:
|
|
|
464
493
|
yield from objects
|
|
465
494
|
|
|
466
495
|
|
|
467
|
-
def _delete_folder(target: str) -> None:
|
|
496
|
+
def delete_folder(target: str) -> None:
|
|
468
497
|
"""Delete a folder from S3.
|
|
469
498
|
|
|
470
499
|
Parameters
|
|
@@ -477,13 +506,13 @@ def _delete_folder(target: str) -> None:
|
|
|
477
506
|
|
|
478
507
|
total = 0
|
|
479
508
|
for batch in _list_objects(target, batch=True):
|
|
480
|
-
|
|
509
|
+
LOG.info(f"Deleting {len(batch):,} objects from {target}")
|
|
481
510
|
s3.delete_objects(Bucket=bucket, Delete={"Objects": [{"Key": o["Key"]} for o in batch]})
|
|
482
511
|
total += len(batch)
|
|
483
|
-
|
|
512
|
+
LOG.info(f"Deleted {len(batch):,} objects (total={total:,})")
|
|
484
513
|
|
|
485
514
|
|
|
486
|
-
def _delete_file(target: str) -> None:
|
|
515
|
+
def delete_file(target: str) -> None:
|
|
487
516
|
"""Delete a file from S3.
|
|
488
517
|
|
|
489
518
|
Parameters
|
|
@@ -505,12 +534,12 @@ def _delete_file(target: str) -> None:
|
|
|
505
534
|
exits = False
|
|
506
535
|
|
|
507
536
|
if not exits:
|
|
508
|
-
|
|
537
|
+
LOG.warning(f"{target} does not exist. Did you mean to delete a folder? Then add a trailing '/'")
|
|
509
538
|
return
|
|
510
539
|
|
|
511
|
-
|
|
540
|
+
LOG.info(f"Deleting {target}")
|
|
512
541
|
s3.delete_object(Bucket=bucket, Key=key)
|
|
513
|
-
|
|
542
|
+
LOG.info(f"{target} is deleted")
|
|
514
543
|
|
|
515
544
|
|
|
516
545
|
def delete(target: str) -> None:
|
|
@@ -525,9 +554,9 @@ def delete(target: str) -> None:
|
|
|
525
554
|
assert target.startswith("s3://")
|
|
526
555
|
|
|
527
556
|
if target.endswith("/"):
|
|
528
|
-
|
|
557
|
+
delete_folder(target)
|
|
529
558
|
else:
|
|
530
|
-
|
|
559
|
+
delete_file(target)
|
|
531
560
|
|
|
532
561
|
|
|
533
562
|
def list_folder(folder: str) -> Iterable:
|
|
@@ -581,7 +610,33 @@ def object_info(target: str) -> dict:
|
|
|
581
610
|
return s3.head_object(Bucket=bucket, Key=key)
|
|
582
611
|
except s3.exceptions.ClientError as e:
|
|
583
612
|
if e.response["Error"]["Code"] == "404":
|
|
584
|
-
raise
|
|
613
|
+
raise FileNotFoundError(f"{target} does not exist")
|
|
614
|
+
raise
|
|
615
|
+
|
|
616
|
+
|
|
617
|
+
def object_exists(target: str) -> bool:
|
|
618
|
+
"""Check if an object exists.
|
|
619
|
+
|
|
620
|
+
Parameters
|
|
621
|
+
----------
|
|
622
|
+
target : str
|
|
623
|
+
The URL of a file or a folder on S3. The URL should start with 's3://'.
|
|
624
|
+
|
|
625
|
+
Returns
|
|
626
|
+
-------
|
|
627
|
+
bool
|
|
628
|
+
True if the object exists, False otherwise.
|
|
629
|
+
"""
|
|
630
|
+
|
|
631
|
+
_, _, bucket, key = target.split("/", 3)
|
|
632
|
+
s3 = s3_client(bucket)
|
|
633
|
+
|
|
634
|
+
try:
|
|
635
|
+
s3.head_object(Bucket=bucket, Key=key)
|
|
636
|
+
return True
|
|
637
|
+
except s3.exceptions.ClientError as e:
|
|
638
|
+
if e.response["Error"]["Code"] == "404":
|
|
639
|
+
return False
|
|
585
640
|
raise
|
|
586
641
|
|
|
587
642
|
|
|
@@ -600,7 +655,7 @@ def object_acl(target: str) -> dict:
|
|
|
600
655
|
"""
|
|
601
656
|
|
|
602
657
|
_, _, bucket, key = target.split("/", 3)
|
|
603
|
-
s3 = s3_client()
|
|
658
|
+
s3 = s3_client(bucket)
|
|
604
659
|
|
|
605
660
|
return s3.get_object_acl(Bucket=bucket, Key=key)
|
|
606
661
|
|
|
@@ -643,3 +698,29 @@ def upload(source: str, target: str, *args, **kwargs) -> None:
|
|
|
643
698
|
|
|
644
699
|
assert target.startswith("s3://"), f"target {target} should start with 's3://'"
|
|
645
700
|
return transfer(source, target, *args, **kwargs)
|
|
701
|
+
|
|
702
|
+
|
|
703
|
+
def quotas(target: str) -> dict:
|
|
704
|
+
"""Get the quotas for an S3 bucket.
|
|
705
|
+
|
|
706
|
+
Parameters
|
|
707
|
+
----------
|
|
708
|
+
target : str
|
|
709
|
+
The URL of a file or a folder on S3. The URL should start with 's3://'.
|
|
710
|
+
|
|
711
|
+
Returns
|
|
712
|
+
-------
|
|
713
|
+
dict
|
|
714
|
+
A dictionary with the quotas for the bucket.
|
|
715
|
+
"""
|
|
716
|
+
from botocore.exceptions import ClientError
|
|
717
|
+
|
|
718
|
+
_, _, bucket, _ = target.split("/", 3)
|
|
719
|
+
s3 = s3_client(bucket, service="service-quotas")
|
|
720
|
+
|
|
721
|
+
try:
|
|
722
|
+
return s3.list_service_quotas(ServiceCode="ec2")
|
|
723
|
+
except ClientError as e:
|
|
724
|
+
if e.response["Error"]["Code"] == "404":
|
|
725
|
+
raise ValueError(f"{target} does not exist")
|
|
726
|
+
raise
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
Metadata-Version: 2.4
|
|
2
2
|
Name: anemoi-utils
|
|
3
|
-
Version: 0.4.23
|
|
3
|
+
Version: 0.4.24
|
|
4
4
|
Summary: A package to hold various functions to support training of ML models on ECMWF data.
|
|
5
5
|
Author-email: "European Centre for Medium-Range Weather Forecasts (ECMWF)" <software.support@ecmwf.int>
|
|
6
6
|
License: Apache License
|
|
@@ -14,7 +14,6 @@ pyproject.toml
|
|
|
14
14
|
.github/dependabot.yml
|
|
15
15
|
.github/labeler.yml
|
|
16
16
|
.github/pull_request_template.md
|
|
17
|
-
.github/release.yml
|
|
18
17
|
.github/workflows/downstream-ci-hpc.yml
|
|
19
18
|
.github/workflows/pr-conventional-commit.yml
|
|
20
19
|
.github/workflows/pr-label-conventional-commits.yml
|
|
@@ -1,46 +0,0 @@
|
|
|
1
|
-
## Description
|
|
2
|
-
|
|
3
|
-
<!-- Provide a brief summary of the changes introduced in this pull request. -->
|
|
4
|
-
|
|
5
|
-
## Type of Change
|
|
6
|
-
|
|
7
|
-
- [ ] Bug fix (non-breaking change which fixes an issue)
|
|
8
|
-
- [ ] New feature (non-breaking change which adds functionality)
|
|
9
|
-
- [ ] Breaking change (fix or feature that would cause existing functionality to not work as expected)
|
|
10
|
-
- [ ] Documentation update
|
|
11
|
-
|
|
12
|
-
## Issue Number
|
|
13
|
-
|
|
14
|
-
<!-- Link the Issue number this change addresses, ideally in one of the "magic format" such as Closes #XYZ -->
|
|
15
|
-
|
|
16
|
-
<!-- Alternatively, explain the motivation behind the changes and the context in which they are being made. -->
|
|
17
|
-
|
|
18
|
-
## Code Compatibility
|
|
19
|
-
|
|
20
|
-
- [ ] I have performed a self-review of my code
|
|
21
|
-
|
|
22
|
-
### Code Performance and Testing
|
|
23
|
-
|
|
24
|
-
- [ ] I have added tests that prove my fix is effective or that my feature works
|
|
25
|
-
- [ ] I ran the [complete Pytest test](https://anemoi.readthedocs.io/projects/training/en/latest/dev/testing.html) suite locally, and they pass
|
|
26
|
-
|
|
27
|
-
<!-- In case this affects the model sharding or other specific components please describe these here. -->
|
|
28
|
-
|
|
29
|
-
### Dependencies
|
|
30
|
-
|
|
31
|
-
- [ ] I have ensured that the code is still pip-installable after the changes and runs
|
|
32
|
-
- [ ] I have tested that new dependencies themselves are pip-installable.
|
|
33
|
-
|
|
34
|
-
<!-- List any new dependencies that are required for this change and the justification to add them. -->
|
|
35
|
-
|
|
36
|
-
### Documentation
|
|
37
|
-
|
|
38
|
-
- [ ] My code follows the style guidelines of this project
|
|
39
|
-
- [ ] I have updated the documentation and docstrings to reflect the changes
|
|
40
|
-
- [ ] I have added comments to my code, particularly in hard-to-understand areas
|
|
41
|
-
|
|
42
|
-
<!-- Describe any major updates to the documentation -->
|
|
43
|
-
|
|
44
|
-
## Additional Notes
|
|
45
|
-
|
|
46
|
-
<!-- Include any additional information, caveats, or considerations that the reviewer should be aware of. -->
|
|
@@ -1,23 +0,0 @@
|
|
|
1
|
-
# .github/release.yml
|
|
2
|
-
# https://docs.github.com/en/repositories/releasing-projects-on-github/automatically-generated-release-notes
|
|
3
|
-
|
|
4
|
-
changelog:
|
|
5
|
-
exclude:
|
|
6
|
-
labels:
|
|
7
|
-
- ignore-for-release
|
|
8
|
-
- no-changelog
|
|
9
|
-
authors:
|
|
10
|
-
- pre-commit-ci
|
|
11
|
-
categories:
|
|
12
|
-
- title: Breaking Changes 🛠
|
|
13
|
-
labels:
|
|
14
|
-
- "breaking change"
|
|
15
|
-
- title: Exciting New Features 🎉
|
|
16
|
-
labels:
|
|
17
|
-
- enhancement
|
|
18
|
-
- title: Config Changes 📑
|
|
19
|
-
labels:
|
|
20
|
-
- config
|
|
21
|
-
- title: Other Changes 🔗
|
|
22
|
-
labels:
|
|
23
|
-
- "*"
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|