triggerflow 0.3.4__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- trigger_dataset/__init__.py +0 -0
- trigger_dataset/core.py +88 -0
- trigger_loader/__init__.py +0 -0
- trigger_loader/cluster_manager.py +107 -0
- trigger_loader/loader.py +154 -0
- trigger_loader/processor.py +212 -0
- triggerflow/__init__.py +0 -0
- triggerflow/cli.py +122 -0
- triggerflow/core.py +617 -0
- triggerflow/interfaces/__init__.py +0 -0
- triggerflow/interfaces/uGT.py +187 -0
- triggerflow/mlflow_wrapper.py +270 -0
- triggerflow/starter/.gitignore +143 -0
- triggerflow/starter/README.md +0 -0
- triggerflow/starter/cookiecutter.json +5 -0
- triggerflow/starter/prompts.yml +9 -0
- triggerflow/starter/{{ cookiecutter.repo_name }}/.dvcignore +3 -0
- triggerflow/starter/{{ cookiecutter.repo_name }}/.gitignore +143 -0
- triggerflow/starter/{{ cookiecutter.repo_name }}/.gitlab-ci.yml +56 -0
- triggerflow/starter/{{ cookiecutter.repo_name }}/README.md +29 -0
- triggerflow/starter/{{ cookiecutter.repo_name }}/conf/README.md +26 -0
- triggerflow/starter/{{ cookiecutter.repo_name }}/conf/base/catalog.yml +84 -0
- triggerflow/starter/{{ cookiecutter.repo_name }}/conf/base/parameters.yml +0 -0
- triggerflow/starter/{{ cookiecutter.repo_name }}/conf/base/parameters_compile.yml +14 -0
- triggerflow/starter/{{ cookiecutter.repo_name }}/conf/base/parameters_data_processing.yml +8 -0
- triggerflow/starter/{{ cookiecutter.repo_name }}/conf/base/parameters_load_data.yml +5 -0
- triggerflow/starter/{{ cookiecutter.repo_name }}/conf/base/parameters_model_training.yml +9 -0
- triggerflow/starter/{{ cookiecutter.repo_name }}/conf/base/parameters_model_validation.yml +5 -0
- triggerflow/starter/{{ cookiecutter.repo_name }}/conf/local/catalog.yml +90 -0
- triggerflow/starter/{{ cookiecutter.repo_name }}/conf/local/parameters.yml +0 -0
- triggerflow/starter/{{ cookiecutter.repo_name }}/conf/local/parameters_compile.yml +14 -0
- triggerflow/starter/{{ cookiecutter.repo_name }}/conf/local/parameters_data_processing.yml +8 -0
- triggerflow/starter/{{ cookiecutter.repo_name }}/conf/local/parameters_load_data.yml +5 -0
- triggerflow/starter/{{ cookiecutter.repo_name }}/conf/local/parameters_model_training.yml +9 -0
- triggerflow/starter/{{ cookiecutter.repo_name }}/conf/local/parameters_model_validation.yml +5 -0
- triggerflow/starter/{{ cookiecutter.repo_name }}/conf/logging.yml +43 -0
- triggerflow/starter/{{ cookiecutter.repo_name }}/data/01_raw/.gitkeep +0 -0
- triggerflow/starter/{{ cookiecutter.repo_name }}/data/01_raw/condor_config.json +11 -0
- triggerflow/starter/{{ cookiecutter.repo_name }}/data/01_raw/cuda_config.json +4 -0
- triggerflow/starter/{{ cookiecutter.repo_name }}/data/01_raw/samples.json +24 -0
- triggerflow/starter/{{ cookiecutter.repo_name }}/data/01_raw/settings.json +8 -0
- triggerflow/starter/{{ cookiecutter.repo_name }}/data/01_raw/test.root +0 -0
- triggerflow/starter/{{ cookiecutter.repo_name }}/data/02_loaded/.gitkeep +0 -0
- triggerflow/starter/{{ cookiecutter.repo_name }}/data/03_preprocessed/.gitkeep +0 -0
- triggerflow/starter/{{ cookiecutter.repo_name }}/data/04_models/.gitkeep +0 -0
- triggerflow/starter/{{ cookiecutter.repo_name }}/data/05_validation/.gitkeep +0 -0
- triggerflow/starter/{{ cookiecutter.repo_name }}/data/06_compile/.gitkeep +0 -0
- triggerflow/starter/{{ cookiecutter.repo_name }}/data/07_reporting/.gitkeep +0 -0
- triggerflow/starter/{{ cookiecutter.repo_name }}/dvc.yaml +7 -0
- triggerflow/starter/{{ cookiecutter.repo_name }}/environment.yml +23 -0
- triggerflow/starter/{{ cookiecutter.repo_name }}/pyproject.toml +50 -0
- triggerflow/starter/{{ cookiecutter.repo_name }}/src/{{ cookiecutter.python_package }}/__init__.py +3 -0
- triggerflow/starter/{{ cookiecutter.repo_name }}/src/{{ cookiecutter.python_package }}/__main__.py +25 -0
- triggerflow/starter/{{ cookiecutter.repo_name }}/src/{{ cookiecutter.python_package }}/datasets/any_object.py +20 -0
- triggerflow/starter/{{ cookiecutter.repo_name }}/src/{{ cookiecutter.python_package }}/datasets/base_dataset.py +137 -0
- triggerflow/starter/{{ cookiecutter.repo_name }}/src/{{ cookiecutter.python_package }}/datasets/base_loader.py +101 -0
- triggerflow/starter/{{ cookiecutter.repo_name }}/src/{{ cookiecutter.python_package }}/datasets/meta_dataset.py +49 -0
- triggerflow/starter/{{ cookiecutter.repo_name }}/src/{{ cookiecutter.python_package }}/datasets/{{ cookiecutter.python_package }}_dataset.py +35 -0
- triggerflow/starter/{{ cookiecutter.repo_name }}/src/{{ cookiecutter.python_package }}/datasets/{{ cookiecutter.python_package }}_loader.py +32 -0
- triggerflow/starter/{{ cookiecutter.repo_name }}/src/{{ cookiecutter.python_package }}/models/__init__.py +0 -0
- triggerflow/starter/{{ cookiecutter.repo_name }}/src/{{ cookiecutter.python_package }}/models/base_model.py +155 -0
- triggerflow/starter/{{ cookiecutter.repo_name }}/src/{{ cookiecutter.python_package }}/models/{{ cookiecutter.python_package }}_model.py +16 -0
- triggerflow/starter/{{ cookiecutter.repo_name }}/src/{{ cookiecutter.python_package }}/pipeline_registry.py +17 -0
- triggerflow/starter/{{ cookiecutter.repo_name }}/src/{{ cookiecutter.python_package }}/pipelines/compile/__init__.py +10 -0
- triggerflow/starter/{{ cookiecutter.repo_name }}/src/{{ cookiecutter.python_package }}/pipelines/compile/nodes.py +70 -0
- triggerflow/starter/{{ cookiecutter.repo_name }}/src/{{ cookiecutter.python_package }}/pipelines/compile/pipeline.py +20 -0
- triggerflow/starter/{{ cookiecutter.repo_name }}/src/{{ cookiecutter.python_package }}/pipelines/data_processing/__init__.py +10 -0
- triggerflow/starter/{{ cookiecutter.repo_name }}/src/{{ cookiecutter.python_package }}/pipelines/data_processing/nodes.py +41 -0
- triggerflow/starter/{{ cookiecutter.repo_name }}/src/{{ cookiecutter.python_package }}/pipelines/data_processing/pipeline.py +28 -0
- triggerflow/starter/{{ cookiecutter.repo_name }}/src/{{ cookiecutter.python_package }}/pipelines/load_data/__init__.py +10 -0
- triggerflow/starter/{{ cookiecutter.repo_name }}/src/{{ cookiecutter.python_package }}/pipelines/load_data/nodes.py +13 -0
- triggerflow/starter/{{ cookiecutter.repo_name }}/src/{{ cookiecutter.python_package }}/pipelines/load_data/pipeline.py +20 -0
- triggerflow/starter/{{ cookiecutter.repo_name }}/src/{{ cookiecutter.python_package }}/pipelines/model_training/__init__.py +10 -0
- triggerflow/starter/{{ cookiecutter.repo_name }}/src/{{ cookiecutter.python_package }}/pipelines/model_training/nodes.py +48 -0
- triggerflow/starter/{{ cookiecutter.repo_name }}/src/{{ cookiecutter.python_package }}/pipelines/model_training/pipeline.py +24 -0
- triggerflow/starter/{{ cookiecutter.repo_name }}/src/{{ cookiecutter.python_package }}/pipelines/model_validation/__init__.py +10 -0
- triggerflow/starter/{{ cookiecutter.repo_name }}/src/{{ cookiecutter.python_package }}/pipelines/model_validation/nodes.py +31 -0
- triggerflow/starter/{{ cookiecutter.repo_name }}/src/{{ cookiecutter.python_package }}/pipelines/model_validation/pipeline.py +24 -0
- triggerflow/starter/{{ cookiecutter.repo_name }}/src/{{ cookiecutter.python_package }}/settings.py +46 -0
- triggerflow/starter/{{ cookiecutter.repo_name }}/src/{{ cookiecutter.python_package }}/utils/__init__.py +0 -0
- triggerflow/starter/{{ cookiecutter.repo_name }}/src/{{ cookiecutter.python_package }}/utils/metric.py +4 -0
- triggerflow/starter/{{ cookiecutter.repo_name }}/src/{{ cookiecutter.python_package }}/utils/plotting.py +598 -0
- triggerflow/starter/{{ cookiecutter.repo_name }}/tests/__init__.py +0 -0
- triggerflow/starter/{{ cookiecutter.repo_name }}/tests/pipelines/__init__.py +0 -0
- triggerflow/starter/{{ cookiecutter.repo_name }}/tests/pipelines/compile/__init__.py +0 -0
- triggerflow/starter/{{ cookiecutter.repo_name }}/tests/pipelines/compile/test_pipeline.py +9 -0
- triggerflow/starter/{{ cookiecutter.repo_name }}/tests/pipelines/data_processing/__init__.py +0 -0
- triggerflow/starter/{{ cookiecutter.repo_name }}/tests/pipelines/data_processing/test_pipeline.py +9 -0
- triggerflow/starter/{{ cookiecutter.repo_name }}/tests/pipelines/load_data/__init__.py +0 -0
- triggerflow/starter/{{ cookiecutter.repo_name }}/tests/pipelines/load_data/test_pipeline.py +9 -0
- triggerflow/starter/{{ cookiecutter.repo_name }}/tests/pipelines/model_training/__init__.py +0 -0
- triggerflow/starter/{{ cookiecutter.repo_name }}/tests/pipelines/model_training/test_pipeline.py +9 -0
- triggerflow/starter/{{ cookiecutter.repo_name }}/tests/pipelines/model_validation/__init__.py +0 -0
- triggerflow/starter/{{ cookiecutter.repo_name }}/tests/pipelines/model_validation/test_pipeline.py +9 -0
- triggerflow/starter/{{ cookiecutter.repo_name }}/tests/test_run.py +27 -0
- triggerflow/templates/build_ugt.tcl +46 -0
- triggerflow/templates/data_types.h +524 -0
- triggerflow/templates/makefile +28 -0
- triggerflow/templates/makefile_version +15 -0
- triggerflow/templates/model-gt.cpp +104 -0
- triggerflow/templates/model_template.cpp +63 -0
- triggerflow/templates/scales.h +20 -0
- triggerflow-0.3.4.dist-info/METADATA +206 -0
- triggerflow-0.3.4.dist-info/RECORD +107 -0
- triggerflow-0.3.4.dist-info/WHEEL +5 -0
- triggerflow-0.3.4.dist-info/entry_points.txt +2 -0
- triggerflow-0.3.4.dist-info/top_level.txt +3 -0
|
@@ -0,0 +1,143 @@
|
|
|
1
|
+
# Byte-compiled / optimized / DLL files
|
|
2
|
+
__pycache__/
|
|
3
|
+
*.py[cod]
|
|
4
|
+
*$py.class
|
|
5
|
+
|
|
6
|
+
# C extensions
|
|
7
|
+
*.so
|
|
8
|
+
|
|
9
|
+
# Distribution / packaging
|
|
10
|
+
.Python
|
|
11
|
+
build/
|
|
12
|
+
develop-eggs/
|
|
13
|
+
dist/
|
|
14
|
+
downloads/
|
|
15
|
+
eggs/
|
|
16
|
+
.eggs/
|
|
17
|
+
lib/
|
|
18
|
+
lib64/
|
|
19
|
+
parts/
|
|
20
|
+
sdist/
|
|
21
|
+
var/
|
|
22
|
+
wheels/
|
|
23
|
+
share/python-wheels/
|
|
24
|
+
*.egg-info/
|
|
25
|
+
.installed.cfg
|
|
26
|
+
*.egg
|
|
27
|
+
MANIFEST
|
|
28
|
+
|
|
29
|
+
# PyInstaller
|
|
30
|
+
# Usually these files are written by a python script from a template
|
|
31
|
+
# before PyInstaller builds the exe, so as to inject date/other infos into it.
|
|
32
|
+
*.manifest
|
|
33
|
+
*.spec
|
|
34
|
+
|
|
35
|
+
# Installer logs
|
|
36
|
+
pip-log.txt
|
|
37
|
+
pip-delete-this-directory.txt
|
|
38
|
+
|
|
39
|
+
# Unit test / coverage reports
|
|
40
|
+
htmlcov/
|
|
41
|
+
.tox/
|
|
42
|
+
.nox/
|
|
43
|
+
.coverage
|
|
44
|
+
.coverage.*
|
|
45
|
+
.cache
|
|
46
|
+
nosetests.xml
|
|
47
|
+
coverage.xml
|
|
48
|
+
*.cover
|
|
49
|
+
*.py,cover
|
|
50
|
+
.hypothesis/
|
|
51
|
+
.pytest_cache/
|
|
52
|
+
cover/
|
|
53
|
+
|
|
54
|
+
# Translations
|
|
55
|
+
*.mo
|
|
56
|
+
*.pot
|
|
57
|
+
|
|
58
|
+
# Django stuff:
|
|
59
|
+
*.log
|
|
60
|
+
local_settings.py
|
|
61
|
+
db.sqlite3
|
|
62
|
+
db.sqlite3-journal
|
|
63
|
+
|
|
64
|
+
# Flask stuff:
|
|
65
|
+
instance/
|
|
66
|
+
.webassets-cache
|
|
67
|
+
|
|
68
|
+
# Scrapy stuff:
|
|
69
|
+
.scrapy
|
|
70
|
+
|
|
71
|
+
# Sphinx documentation
|
|
72
|
+
docs/_build/
|
|
73
|
+
|
|
74
|
+
# PyBuilder
|
|
75
|
+
.pybuilder/
|
|
76
|
+
target/
|
|
77
|
+
|
|
78
|
+
# Jupyter Notebook
|
|
79
|
+
.ipynb_checkpoints
|
|
80
|
+
|
|
81
|
+
# pyenv
|
|
82
|
+
# For a library or package, you might want to ignore these files since the code is
|
|
83
|
+
# intended to run in multiple environments; otherwise, check them in:
|
|
84
|
+
# .python-version
|
|
85
|
+
|
|
86
|
+
# pipenv
|
|
87
|
+
# According to pypa/pipenv#598, it is recommended to include Pipfile.lock in version control.
|
|
88
|
+
# However, in case of collaboration, if having platform-specific dependencies or dependencies
|
|
89
|
+
# having no cross-platform support, pipenv may install dependencies that don't work, or not
|
|
90
|
+
# install all needed dependencies.
|
|
91
|
+
#Pipfile.lock
|
|
92
|
+
|
|
93
|
+
# PEP 582; used by e.g. github.com/David-OConnor/pyflow
|
|
94
|
+
__pypackages__/
|
|
95
|
+
|
|
96
|
+
# Celery stuff
|
|
97
|
+
celerybeat-schedule
|
|
98
|
+
celerybeat.pid
|
|
99
|
+
|
|
100
|
+
# SageMath parsed files
|
|
101
|
+
*.sage.py
|
|
102
|
+
|
|
103
|
+
# Environments
|
|
104
|
+
.env
|
|
105
|
+
.venv
|
|
106
|
+
env/
|
|
107
|
+
venv/
|
|
108
|
+
ENV/
|
|
109
|
+
env.bak/
|
|
110
|
+
venv.bak/
|
|
111
|
+
|
|
112
|
+
# Spyder project settings
|
|
113
|
+
.spyderproject
|
|
114
|
+
.spyproject
|
|
115
|
+
|
|
116
|
+
# Rope project settings
|
|
117
|
+
.ropeproject
|
|
118
|
+
|
|
119
|
+
# mkdocs documentation
|
|
120
|
+
/site
|
|
121
|
+
|
|
122
|
+
# mypy
|
|
123
|
+
.mypy_cache/
|
|
124
|
+
.dmypy.json
|
|
125
|
+
dmypy.json
|
|
126
|
+
|
|
127
|
+
# Pyre type checker
|
|
128
|
+
.pyre/
|
|
129
|
+
|
|
130
|
+
# pytype static type analyzer
|
|
131
|
+
.pytype/
|
|
132
|
+
|
|
133
|
+
# Cython debug symbols
|
|
134
|
+
cython_debug/
|
|
135
|
+
|
|
136
|
+
.vscode/
|
|
137
|
+
info.log
|
|
138
|
+
|
|
139
|
+
# IntelliJ
|
|
140
|
+
.idea/
|
|
141
|
+
*.iml
|
|
142
|
+
out/
|
|
143
|
+
.idea_modules/
|
|
@@ -0,0 +1,56 @@
|
|
|
1
|
+
image: continuumio/miniconda3
|
|
2
|
+
|
|
3
|
+
stages:
|
|
4
|
+
- load
|
|
5
|
+
- preprocess
|
|
6
|
+
- train
|
|
7
|
+
- validate
|
|
8
|
+
- compile
|
|
9
|
+
|
|
10
|
+
variables:
|
|
11
|
+
KEDRO_ENV: "base" # TODO: add production env
|
|
12
|
+
|
|
13
|
+
before_script:
|
|
14
|
+
- eval "$(conda shell.bash hook)"
|
|
15
|
+
- conda env create --file=environment.yml
|
|
16
|
+
- conda activate triggerflow
|
|
17
|
+
|
|
18
|
+
load_data:
|
|
19
|
+
stage: load
|
|
20
|
+
script:
|
|
21
|
+
- kedro run --pipeline=load_data
|
|
22
|
+
artifacts:
|
|
23
|
+
paths:
|
|
24
|
+
- data/02_loaded/
|
|
25
|
+
|
|
26
|
+
preprocess_data:
|
|
27
|
+
stage: preprocess
|
|
28
|
+
script:
|
|
29
|
+
- kedro run --pipeline=data_processing
|
|
30
|
+
artifacts:
|
|
31
|
+
paths:
|
|
32
|
+
- data/03_preprocessed/
|
|
33
|
+
|
|
34
|
+
train_model:
|
|
35
|
+
stage: train
|
|
36
|
+
script:
|
|
37
|
+
- kedro run --pipeline=model_training
|
|
38
|
+
artifacts:
|
|
39
|
+
paths:
|
|
40
|
+
- data/04_models/
|
|
41
|
+
|
|
42
|
+
validate_model:
|
|
43
|
+
stage: validate
|
|
44
|
+
script:
|
|
45
|
+
- kedro run --pipeline=model_validation
|
|
46
|
+
artifacts:
|
|
47
|
+
paths:
|
|
48
|
+
- data/05_validation/
|
|
49
|
+
|
|
50
|
+
compile:
|
|
51
|
+
stage: compile
|
|
52
|
+
script:
|
|
53
|
+
- kedro run --pipeline=compile
|
|
54
|
+
artifacts:
|
|
55
|
+
paths:
|
|
56
|
+
- data/06_compile/
|
|
@@ -0,0 +1,29 @@
|
|
|
1
|
+
# {{ cookiecutter.project_name }}
|
|
2
|
+
|
|
3
|
+
- conda env create --file=environment.yml
|
|
4
|
+
- conda activate {{ cookiecutter.project_name }}
|
|
5
|
+
|
|
6
|
+
## Data versioning
|
|
7
|
+
When a dataset changes, track the new version with DVC (TODO: add this to the pipeline to compare the hash):
|
|
8
|
+
- dvc add data/01_raw/companies.csv
|
|
9
|
+
- git add data/01_raw/companies.csv.dvc
|
|
10
|
+
- git commit -m "Track dataset changes with DVC"
|
|
11
|
+
|
|
12
|
+
## Run CI locally
|
|
13
|
+
- brew install gitlab-ci-local
|
|
14
|
+
- gitlab-ci-local --list
|
|
15
|
+
- gitlab-ci-local
|
|
16
|
+
|
|
17
|
+
## ToDos:
|
|
18
|
+
- move functionality of uhh_mlatl1 to pipeline
|
|
19
|
+
- if case in base dataloader for classification or not
|
|
20
|
+
- add model evaluation steps
|
|
21
|
+
- automation of dvc in CI pipeline
|
|
22
|
+
- move {{ cookiecutter.project_name }} meta data json to dvc
|
|
23
|
+
- add linting and type checking
|
|
24
|
+
- write tests
|
|
25
|
+
- write out reporting / logging / plots etc.
|
|
26
|
+
- track plots with dvc?
|
|
27
|
+
- cross check pipeline afterwards with {{ cookiecutter.project_name }} team
|
|
28
|
+
- make starter pipeline as template
|
|
29
|
+
- add {{ cookiecutter.project_name }} model
|
|
@@ -0,0 +1,26 @@
|
|
|
1
|
+
# What is this for?
|
|
2
|
+
|
|
3
|
+
This folder should be used to store configuration files used by Kedro or by separate tools.
|
|
4
|
+
|
|
5
|
+
This file can be used to provide users with instructions for how to reproduce local configuration with their own credentials. You can edit the file however you like, but you may wish to retain the information below and add your own content to the [Instructions](#instructions) section.
|
|
6
|
+
|
|
7
|
+
## Local configuration
|
|
8
|
+
|
|
9
|
+
The `local` folder should be used for configuration that is either user-specific (e.g. IDE configuration) or protected (e.g. security keys).
|
|
10
|
+
|
|
11
|
+
> *Note:* Please do not check in any local configuration to version control.
|
|
12
|
+
|
|
13
|
+
## Base configuration
|
|
14
|
+
|
|
15
|
+
The `base` folder is for shared configuration, such as non-sensitive and project-related configuration that may be shared across team members.
|
|
16
|
+
|
|
17
|
+
WARNING: Please do not put access credentials in the base configuration folder.
|
|
18
|
+
|
|
19
|
+
## Instructions
|
|
20
|
+
|
|
21
|
+
|
|
22
|
+
|
|
23
|
+
|
|
24
|
+
## Need help?
|
|
25
|
+
|
|
26
|
+
[Find out more about configuration from the Kedro documentation](https://docs.kedro.org/en/stable/kedro_project_setup/configuration.html).
|
|
@@ -0,0 +1,84 @@
|
|
|
1
|
+
{{ cookiecutter.python_package }}_meta_data:
|
|
2
|
+
filepath: data/01_raw/samples.json
|
|
3
|
+
sample_key: samples
|
|
4
|
+
type: {{ cookiecutter.python_package }}.datasets.meta_dataset.MetaDataset
|
|
5
|
+
|
|
6
|
+
{{ cookiecutter.python_package }}_meta_data_loaded:
|
|
7
|
+
filepath: data/02_loaded/{{ cookiecutter.python_package }}_meta_data.json
|
|
8
|
+
sample_key: samples
|
|
9
|
+
type: {{ cookiecutter.python_package }}.datasets.meta_dataset.MetaDataset
|
|
10
|
+
|
|
11
|
+
{{ cookiecutter.python_package }}_data:
|
|
12
|
+
sample_info: data/01_raw/samples.json
|
|
13
|
+
sample_key: samples
|
|
14
|
+
type: {{ cookiecutter.python_package }}.datasets.{{ cookiecutter.python_package }}_dataset.{{ cookiecutter.project_name }}Dataset
|
|
15
|
+
|
|
16
|
+
{{ cookiecutter.python_package }}_data_loaded:
|
|
17
|
+
filepath: data/02_loaded/{{ cookiecutter.python_package }}_data.csv
|
|
18
|
+
save_args:
|
|
19
|
+
index: False
|
|
20
|
+
sep: ','
|
|
21
|
+
type: pandas.CSVDataset
|
|
22
|
+
|
|
23
|
+
processed_{{ cookiecutter.python_package }}_X_train:
|
|
24
|
+
filepath: data/03_preprocessed/processed_{{ cookiecutter.python_package }}_X_train.csv
|
|
25
|
+
save_args:
|
|
26
|
+
index: False
|
|
27
|
+
sep: ','
|
|
28
|
+
type: pandas.CSVDataset
|
|
29
|
+
|
|
30
|
+
processed_{{ cookiecutter.python_package }}_X_test:
|
|
31
|
+
filepath: data/03_preprocessed/processed_{{ cookiecutter.python_package }}_X_test.csv
|
|
32
|
+
save_args:
|
|
33
|
+
index: False
|
|
34
|
+
sep: ','
|
|
35
|
+
type: pandas.CSVDataset
|
|
36
|
+
|
|
37
|
+
processed_{{ cookiecutter.python_package }}_y_train:
|
|
38
|
+
filepath: data/03_preprocessed/processed_{{ cookiecutter.python_package }}_y_train.csv
|
|
39
|
+
save_args:
|
|
40
|
+
index: False
|
|
41
|
+
sep: ','
|
|
42
|
+
type: pandas.CSVDataset
|
|
43
|
+
|
|
44
|
+
processed_{{ cookiecutter.python_package }}_y_test:
|
|
45
|
+
filepath: data/03_preprocessed/processed_{{ cookiecutter.python_package }}_y_test.csv
|
|
46
|
+
save_args:
|
|
47
|
+
index: False
|
|
48
|
+
sep: ','
|
|
49
|
+
type: pandas.CSVDataset
|
|
50
|
+
|
|
51
|
+
event_ids_train:
|
|
52
|
+
filepath: data/03_preprocessed/event_ids_train.csv
|
|
53
|
+
save_args:
|
|
54
|
+
index: False
|
|
55
|
+
sep: ','
|
|
56
|
+
type: pandas.CSVDataset
|
|
57
|
+
|
|
58
|
+
event_ids_test:
|
|
59
|
+
filepath: data/03_preprocessed/event_ids_test.csv
|
|
60
|
+
save_args:
|
|
61
|
+
index: False
|
|
62
|
+
sep: ','
|
|
63
|
+
type: pandas.CSVDataset
|
|
64
|
+
|
|
65
|
+
scaler:
|
|
66
|
+
filepath: data/03_preprocessed/scaler.pkl
|
|
67
|
+
type: pickle.PickleDataset
|
|
68
|
+
|
|
69
|
+
train_model:
|
|
70
|
+
filepath: data/04_models/trained_model.pkl
|
|
71
|
+
type: pickle.PickleDataset
|
|
72
|
+
|
|
73
|
+
training_history:
|
|
74
|
+
type: matplotlib.MatplotlibDataset
|
|
75
|
+
filepath: data/07_reporting/training_history.png
|
|
76
|
+
save_args:
|
|
77
|
+
format: png
|
|
78
|
+
|
|
79
|
+
model_pred:
|
|
80
|
+
filepath: data/05_validation/model_pred.pkl
|
|
81
|
+
save_args:
|
|
82
|
+
index: False
|
|
83
|
+
sep: ','
|
|
84
|
+
type: pandas.CSVDataset
|
|
File without changes
|
|
@@ -0,0 +1,14 @@
|
|
|
1
|
+
# This is a boilerplate parameters config generated for pipeline 'compile'
|
|
2
|
+
# using Kedro 1.0.0
|
|
3
|
+
#
|
|
4
|
+
# Documentation for this file format can be found in "Parameters"
|
|
5
|
+
# Link: https://docs.kedro.org/en/1.0.0/configuration/parameters.html
|
|
6
|
+
|
|
7
|
+
|
|
8
|
+
compile:
|
|
9
|
+
name: "munet"
|
|
10
|
+
ml_backend: "Keras"
|
|
11
|
+
compiler: "hls4ml"
|
|
12
|
+
mlflow_url: "https://mlflow-deploy-mflow.app.cern.ch"
|
|
13
|
+
compiler_config:
|
|
14
|
+
test: 123
|
|
@@ -0,0 +1,8 @@
|
|
|
1
|
+
# This is a boilerplate parameters config generated for pipeline 'data_processing'
|
|
2
|
+
# using Kedro 1.0.0
|
|
3
|
+
#
|
|
4
|
+
# Documentation for this file format can be found in "Parameters"
|
|
5
|
+
# Link: https://docs.kedro.org/en/1.0.0/configuration/parameters.html
|
|
6
|
+
|
|
7
|
+
random_state: 42
|
|
8
|
+
test_size: 0.5
|
|
@@ -0,0 +1,9 @@
|
|
|
1
|
+
# This is a boilerplate parameters config generated for pipeline 'model_training'
|
|
2
|
+
# using Kedro 1.0.0
|
|
3
|
+
#
|
|
4
|
+
# Documentation for this file format can be found in "Parameters"
|
|
5
|
+
# Link: https://docs.kedro.org/en/1.0.0/configuration/parameters.html
|
|
6
|
+
|
|
7
|
+
{{ cookiecutter.python_package }}_model:
|
|
8
|
+
hps:
|
|
9
|
+
name: "{{ cookiecutter.python_package }}"
|
|
@@ -0,0 +1,90 @@
|
|
|
1
|
+
{{ cookiecutter.python_package }}_meta_data:
|
|
2
|
+
filepath: data/01_raw/samples.json
|
|
3
|
+
sample_key: samples
|
|
4
|
+
type: {{ cookiecutter.python_package }}.datasets.meta_dataset.MetaDataset
|
|
5
|
+
|
|
6
|
+
{{ cookiecutter.python_package }}_data:
|
|
7
|
+
sample_info: data/01_raw/samples.json
|
|
8
|
+
sample_key: samples
|
|
9
|
+
type: {{ cookiecutter.python_package }}.datasets.{{ cookiecutter.python_package }}_dataset.{{ cookiecutter.project_name }}Dataset
|
|
10
|
+
|
|
11
|
+
{{ cookiecutter.python_package }}_meta_data_loaded:
|
|
12
|
+
filepath: data/02_loaded/{{ cookiecutter.python_package }}_meta_data.json
|
|
13
|
+
sample_key: samples
|
|
14
|
+
type: {{ cookiecutter.python_package }}.datasets.meta_dataset.MetaDataset
|
|
15
|
+
|
|
16
|
+
{{ cookiecutter.python_package }}_loader:
|
|
17
|
+
sample_json: data/01_raw/samples.json
|
|
18
|
+
settings: data/01_raw/settings.json
|
|
19
|
+
config: data/01_raw/condor_config.json
|
|
20
|
+
type: {{ cookiecutter.python_package }}.datasets.{{ cookiecutter.python_package }}_loader.{{ cookiecutter.project_name }}Loader
|
|
21
|
+
|
|
22
|
+
{{ cookiecutter.python_package }}_data_loaded:
|
|
23
|
+
filepath: data/02_loaded/{{ cookiecutter.python_package }}_data.csv
|
|
24
|
+
save_args:
|
|
25
|
+
index: False
|
|
26
|
+
sep: ','
|
|
27
|
+
type: pandas.CSVDataset
|
|
28
|
+
|
|
29
|
+
processed_{{ cookiecutter.python_package }}_X_train:
|
|
30
|
+
filepath: data/03_preprocessed/processed_{{ cookiecutter.python_package }}_X_train.csv
|
|
31
|
+
save_args:
|
|
32
|
+
index: False
|
|
33
|
+
sep: ','
|
|
34
|
+
type: pandas.CSVDataset
|
|
35
|
+
|
|
36
|
+
processed_{{ cookiecutter.python_package }}_X_test:
|
|
37
|
+
filepath: data/03_preprocessed/processed_{{ cookiecutter.python_package }}_X_test.csv
|
|
38
|
+
save_args:
|
|
39
|
+
index: False
|
|
40
|
+
sep: ','
|
|
41
|
+
type: pandas.CSVDataset
|
|
42
|
+
|
|
43
|
+
processed_{{ cookiecutter.python_package }}_y_train:
|
|
44
|
+
filepath: data/03_preprocessed/processed_{{ cookiecutter.python_package }}_y_train.csv
|
|
45
|
+
save_args:
|
|
46
|
+
index: False
|
|
47
|
+
sep: ','
|
|
48
|
+
type: pandas.CSVDataset
|
|
49
|
+
|
|
50
|
+
processed_{{ cookiecutter.python_package }}_y_test:
|
|
51
|
+
filepath: data/03_preprocessed/processed_{{ cookiecutter.python_package }}_y_test.csv
|
|
52
|
+
save_args:
|
|
53
|
+
index: False
|
|
54
|
+
sep: ','
|
|
55
|
+
type: pandas.CSVDataset
|
|
56
|
+
|
|
57
|
+
event_ids_train:
|
|
58
|
+
filepath: data/03_preprocessed/event_ids_train.csv
|
|
59
|
+
save_args:
|
|
60
|
+
index: False
|
|
61
|
+
sep: ','
|
|
62
|
+
type: pandas.CSVDataset
|
|
63
|
+
|
|
64
|
+
event_ids_test:
|
|
65
|
+
filepath: data/03_preprocessed/event_ids_test.csv
|
|
66
|
+
save_args:
|
|
67
|
+
index: False
|
|
68
|
+
sep: ','
|
|
69
|
+
type: pandas.CSVDataset
|
|
70
|
+
|
|
71
|
+
scaler:
|
|
72
|
+
filepath: data/03_preprocessed/scaler.pkl
|
|
73
|
+
type: pickle.PickleDataset
|
|
74
|
+
|
|
75
|
+
train_model:
|
|
76
|
+
filepath: data/04_models/trained_model.pkl
|
|
77
|
+
type: pickle.PickleDataset
|
|
78
|
+
|
|
79
|
+
training_history:
|
|
80
|
+
type: matplotlib.MatplotlibDataset
|
|
81
|
+
filepath: data/07_reporting/training_history.png
|
|
82
|
+
save_args:
|
|
83
|
+
format: png
|
|
84
|
+
|
|
85
|
+
model_pred:
|
|
86
|
+
filepath: data/05_validation/model_pred.pkl
|
|
87
|
+
save_args:
|
|
88
|
+
index: False
|
|
89
|
+
sep: ','
|
|
90
|
+
type: pandas.CSVDataset
|
|
File without changes
|
|
@@ -0,0 +1,14 @@
|
|
|
1
|
+
# This is a boilerplate parameters config generated for pipeline 'compile'
|
|
2
|
+
# using Kedro 0.19.14.
|
|
3
|
+
#
|
|
4
|
+
# Documentation for this file format can be found in "Parameters"
|
|
5
|
+
# Link: https://docs.kedro.org/en/0.19.14/configuration/parameters.html
|
|
6
|
+
|
|
7
|
+
|
|
8
|
+
compile:
|
|
9
|
+
name: "munet"
|
|
10
|
+
ml_backend: "Keras"
|
|
11
|
+
compiler: "hls4ml"
|
|
12
|
+
mlflow_url: "https://mlflow-deploy-mflow.app.cern.ch"
|
|
13
|
+
compiler_config:
|
|
14
|
+
test: 123
|
|
@@ -0,0 +1,8 @@
|
|
|
1
|
+
# This is a boilerplate parameters config generated for pipeline 'data_processing'
|
|
2
|
+
# using Kedro 0.19.14.
|
|
3
|
+
#
|
|
4
|
+
# Documentation for this file format can be found in "Parameters"
|
|
5
|
+
# Link: https://docs.kedro.org/en/0.19.14/configuration/parameters.html
|
|
6
|
+
|
|
7
|
+
random_state: 42
|
|
8
|
+
test_size: 0.5
|
|
@@ -0,0 +1,9 @@
|
|
|
1
|
+
# This is a boilerplate parameters config generated for pipeline 'model_training'
|
|
2
|
+
# using Kedro 1.0.0
|
|
3
|
+
#
|
|
4
|
+
# Documentation for this file format can be found in "Parameters"
|
|
5
|
+
# Link: https://docs.kedro.org/en/1.0.0/configuration/parameters.html
|
|
6
|
+
|
|
7
|
+
{{ cookiecutter.python_package }}_model:
|
|
8
|
+
hps:
|
|
9
|
+
name: "{{ cookiecutter.python_package }}"
|
|
@@ -0,0 +1,43 @@
|
|
|
1
|
+
# To enable this custom logging configuration, set KEDRO_LOGGING_CONFIG to the path of this file.
|
|
2
|
+
# More information available at https://docs.kedro.org/en/stable/logging/logging.html
|
|
3
|
+
version: 1
|
|
4
|
+
|
|
5
|
+
disable_existing_loggers: False
|
|
6
|
+
|
|
7
|
+
formatters:
|
|
8
|
+
simple:
|
|
9
|
+
format: "%(asctime)s - %(name)s - %(levelname)s - %(message)s"
|
|
10
|
+
|
|
11
|
+
handlers:
|
|
12
|
+
console:
|
|
13
|
+
class: logging.StreamHandler
|
|
14
|
+
level: INFO
|
|
15
|
+
formatter: simple
|
|
16
|
+
stream: ext://sys.stdout
|
|
17
|
+
|
|
18
|
+
info_file_handler:
|
|
19
|
+
class: logging.handlers.RotatingFileHandler
|
|
20
|
+
level: INFO
|
|
21
|
+
formatter: simple
|
|
22
|
+
filename: info.log
|
|
23
|
+
maxBytes: 10485760 # 10MB
|
|
24
|
+
backupCount: 20
|
|
25
|
+
encoding: utf8
|
|
26
|
+
delay: True
|
|
27
|
+
|
|
28
|
+
rich:
|
|
29
|
+
class: kedro.logging.RichHandler
|
|
30
|
+
rich_tracebacks: True
|
|
31
|
+
# Advanced options for customisation.
|
|
32
|
+
# See https://docs.kedro.org/en/stable/logging/logging.html#project-side-logging-configuration
|
|
33
|
+
# tracebacks_show_locals: False
|
|
34
|
+
|
|
35
|
+
loggers:
|
|
36
|
+
kedro:
|
|
37
|
+
level: INFO
|
|
38
|
+
|
|
39
|
+
{{ cookiecutter.python_package }}:
|
|
40
|
+
level: INFO
|
|
41
|
+
|
|
42
|
+
root:
|
|
43
|
+
handlers: [rich, info_file_handler]
|
|
File without changes
|
|
@@ -0,0 +1,24 @@
|
|
|
1
|
+
{
|
|
2
|
+
"samples" : {
|
|
3
|
+
"signal" : {
|
|
4
|
+
"files":"data/01_raw/test.root",
|
|
5
|
+
"file_pattern":["test.root"],
|
|
6
|
+
"DAS" : "Blabla",
|
|
7
|
+
"type" : "123",
|
|
8
|
+
"data" : false,
|
|
9
|
+
"era" : "phase1",
|
|
10
|
+
"run" : "run3",
|
|
11
|
+
"is_signal": true
|
|
12
|
+
},
|
|
13
|
+
"background" : {
|
|
14
|
+
"files":"data/01_raw/test.root",
|
|
15
|
+
"file_pattern":["test.root"],
|
|
16
|
+
"DAS" : "Blabla",
|
|
17
|
+
"type" : "123",
|
|
18
|
+
"data" : false,
|
|
19
|
+
"era" : "phase1",
|
|
20
|
+
"run" : "run3",
|
|
21
|
+
"is_signal": false
|
|
22
|
+
}
|
|
23
|
+
}
|
|
24
|
+
}
|
|
Binary file
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|