phylogenie 2.0.11__tar.gz → 2.0.13__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (28)
  1. {phylogenie-2.0.11 → phylogenie-2.0.13}/PKG-INFO +1 -1
  2. {phylogenie-2.0.11 → phylogenie-2.0.13}/phylogenie/__init__.py +6 -0
  3. {phylogenie-2.0.11 → phylogenie-2.0.13}/phylogenie/generators/__init__.py +8 -0
  4. {phylogenie-2.0.11 → phylogenie-2.0.13}/phylogenie/generators/configs.py +7 -7
  5. {phylogenie-2.0.11 → phylogenie-2.0.13}/phylogenie/generators/dataset.py +11 -8
  6. {phylogenie-2.0.11 → phylogenie-2.0.13}/phylogenie/generators/factories.py +2 -2
  7. phylogenie-2.0.13/phylogenie/generators/typeguards.py +25 -0
  8. {phylogenie-2.0.11 → phylogenie-2.0.13}/pyproject.toml +1 -1
  9. phylogenie-2.0.11/phylogenie/generators/typeguards.py +0 -28
  10. {phylogenie-2.0.11 → phylogenie-2.0.13}/LICENSE.txt +0 -0
  11. {phylogenie-2.0.11 → phylogenie-2.0.13}/README.md +0 -0
  12. {phylogenie-2.0.11 → phylogenie-2.0.13}/phylogenie/generators/alisim.py +0 -0
  13. {phylogenie-2.0.11 → phylogenie-2.0.13}/phylogenie/generators/trees.py +0 -0
  14. {phylogenie-2.0.11 → phylogenie-2.0.13}/phylogenie/io.py +0 -0
  15. {phylogenie-2.0.11 → phylogenie-2.0.13}/phylogenie/main.py +0 -0
  16. {phylogenie-2.0.11 → phylogenie-2.0.13}/phylogenie/msa.py +0 -0
  17. {phylogenie-2.0.11 → phylogenie-2.0.13}/phylogenie/py.typed +0 -0
  18. {phylogenie-2.0.11 → phylogenie-2.0.13}/phylogenie/skyline/__init__.py +0 -0
  19. {phylogenie-2.0.11 → phylogenie-2.0.13}/phylogenie/skyline/matrix.py +0 -0
  20. {phylogenie-2.0.11 → phylogenie-2.0.13}/phylogenie/skyline/parameter.py +0 -0
  21. {phylogenie-2.0.11 → phylogenie-2.0.13}/phylogenie/skyline/vector.py +0 -0
  22. {phylogenie-2.0.11 → phylogenie-2.0.13}/phylogenie/tree.py +0 -0
  23. {phylogenie-2.0.11 → phylogenie-2.0.13}/phylogenie/treesimulator/__init__.py +0 -0
  24. {phylogenie-2.0.11 → phylogenie-2.0.13}/phylogenie/treesimulator/events.py +0 -0
  25. {phylogenie-2.0.11 → phylogenie-2.0.13}/phylogenie/treesimulator/gillespie.py +0 -0
  26. {phylogenie-2.0.11 → phylogenie-2.0.13}/phylogenie/treesimulator/model.py +0 -0
  27. {phylogenie-2.0.11 → phylogenie-2.0.13}/phylogenie/typeguards.py +0 -0
  28. {phylogenie-2.0.11 → phylogenie-2.0.13}/phylogenie/typings.py +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: phylogenie
3
- Version: 2.0.11
3
+ Version: 2.0.13
4
4
  Summary: Generate phylogenetic datasets with minimal setup effort
5
5
  Author: Gabriele Marino
6
6
  Author-email: gabmarino.8601@gmail.com
@@ -8,6 +8,9 @@ from phylogenie.generators import (
8
8
  DatasetGeneratorConfig,
9
9
  EpidemiologicalTreeDatasetGenerator,
10
10
  FBDTreeDatasetGenerator,
11
+ SkylineMatrixModel,
12
+ SkylineParameterModel,
13
+ SkylineVectorModel,
11
14
  TreeDatasetGeneratorConfig,
12
15
  )
13
16
  from phylogenie.io import load_fasta, load_newick
@@ -48,13 +51,16 @@ __all__ = [
48
51
  "FBDTreeDatasetGenerator",
49
52
  "SkylineMatrix",
50
53
  "SkylineMatrixCoercible",
54
+ "SkylineMatrixModel",
51
55
  "skyline_matrix",
52
56
  "SkylineParameter",
53
57
  "SkylineParameterLike",
58
+ "SkylineParameterModel",
54
59
  "skyline_parameter",
55
60
  "SkylineVector",
56
61
  "SkylineVectorCoercible",
57
62
  "SkylineVectorLike",
63
+ "SkylineVectorModel",
58
64
  "skyline_vector",
59
65
  "Tree",
60
66
  "TreeDatasetGeneratorConfig",
@@ -3,6 +3,11 @@ from typing import Annotated
3
3
  from pydantic import Field
4
4
 
5
5
  from phylogenie.generators.alisim import AliSimDatasetGenerator
6
+ from phylogenie.generators.configs import (
7
+ SkylineMatrixModel,
8
+ SkylineParameterModel,
9
+ SkylineVectorModel,
10
+ )
6
11
  from phylogenie.generators.dataset import DatasetGenerator
7
12
  from phylogenie.generators.trees import (
8
13
  BDEITreeDatasetGenerator,
@@ -29,4 +34,7 @@ __all__ = [
29
34
  "BDTreeDatasetGenerator",
30
35
  "BDEITreeDatasetGenerator",
31
36
  "BDSSTreeDatasetGenerator",
37
+ "SkylineMatrixModel",
38
+ "SkylineParameterModel",
39
+ "SkylineVectorModel",
32
40
  ]
@@ -10,9 +10,9 @@ class Distribution(BaseModel):
10
10
 
11
11
  Integer = str | int
12
12
  Scalar = str | pgt.Scalar
13
- ManyScalars = str | list[Scalar]
14
- OneOrManyScalars = Scalar | list[Scalar]
15
- OneOrMany2DScalars = Scalar | list[list[Scalar]]
13
+ ManyScalars = str | pgt.Many[Scalar]
14
+ OneOrManyScalars = Scalar | pgt.Many[Scalar]
15
+ OneOrMany2DScalars = Scalar | pgt.Many2D[Scalar]
16
16
 
17
17
 
18
18
  class StrictBaseModel(BaseModel):
@@ -25,15 +25,15 @@ class SkylineParameterModel(StrictBaseModel):
25
25
 
26
26
 
27
27
  class SkylineVectorModel(StrictBaseModel):
28
- value: str | list[OneOrManyScalars]
28
+ value: str | pgt.Many[OneOrManyScalars]
29
29
  change_times: ManyScalars
30
30
 
31
31
 
32
32
  class SkylineMatrixModel(StrictBaseModel):
33
- value: str | list[OneOrMany2DScalars]
33
+ value: str | pgt.Many[OneOrMany2DScalars]
34
34
  change_times: ManyScalars
35
35
 
36
36
 
37
37
  SkylineParameter = Scalar | SkylineParameterModel
38
- SkylineVector = str | pgt.Scalar | list[SkylineParameter] | SkylineVectorModel
39
- SkylineMatrix = str | pgt.Scalar | list[SkylineVector] | SkylineMatrixModel | None
38
+ SkylineVector = str | pgt.Scalar | pgt.Many[SkylineParameter] | SkylineVectorModel
39
+ SkylineMatrix = str | pgt.Scalar | pgt.Many[SkylineVector] | SkylineMatrixModel | None
@@ -41,21 +41,24 @@ class DatasetGenerator(ABC, cfg.StrictBaseModel):
41
41
  self._generate_one(filename=filename, rng=default_rng(seed), data=data)
42
42
 
43
43
  def _generate(self, rng: Generator, n_samples: int, output_dir: str) -> None:
44
+ if os.path.exists(output_dir):
45
+ print(f"Output directory {output_dir} already exists. Skipping.")
46
+ return
47
+
48
+ data_dir = (
49
+ output_dir
50
+ if self.context is None
51
+ else os.path.join(output_dir, DATA_DIRNAME)
52
+ )
53
+ os.makedirs(data_dir)
54
+
44
55
  data: list[dict[str, Any]] = [{} for _ in range(n_samples)]
45
56
  if self.context is not None:
46
- data_dir = os.path.join(output_dir, DATA_DIRNAME)
47
57
  for d, (k, v) in product(data, self.context.items()):
48
58
  args = v.model_extra if v.model_extra is not None else {}
49
59
  d[k] = np.array(getattr(rng, v.type)(**args)).tolist()
50
60
  df = pd.DataFrame([{"file_id": str(i), **d} for i, d in enumerate(data)])
51
61
  df.to_csv(os.path.join(output_dir, METADATA_FILENAME), index=False)
52
- else:
53
- data_dir = output_dir
54
-
55
- if os.path.exists(data_dir):
56
- print(f"Output directory {data_dir} already exists. Skipping.")
57
- return
58
- os.makedirs(data_dir)
59
62
 
60
63
  joblib.Parallel(n_jobs=self.n_jobs)(
61
64
  joblib.delayed(self.generate_one)(
@@ -100,7 +100,7 @@ def skyline_vector(
100
100
  )
101
101
  if isinstance(x, pgt.Scalar):
102
102
  return x
103
- if ctg.is_list_of_skyline_parameter_configs(x):
103
+ if ctg.is_many_skyline_parameter_configs(x):
104
104
  return [skyline_parameter(p, data) for p in x]
105
105
 
106
106
  assert isinstance(x, cfg.SkylineVectorModel)
@@ -161,7 +161,7 @@ def skyline_matrix(
161
161
  )
162
162
  if isinstance(x, pgt.Scalar):
163
163
  return x
164
- if ctg.is_list_of_skyline_vector_configs(x):
164
+ if ctg.is_many_skyline_vector_configs(x):
165
165
  return [skyline_vector(v, data) for v in x]
166
166
 
167
167
  assert isinstance(x, cfg.SkylineMatrixModel)
@@ -0,0 +1,25 @@
1
+ from typing import Any, TypeGuard
2
+
3
+ import phylogenie.generators.configs as cfg
4
+ import phylogenie.typeguards as tg
5
+ import phylogenie.typings as pgt
6
+
7
+
8
+ def is_many_scalar_configs(x: Any) -> TypeGuard[pgt.Many[cfg.Scalar]]:
9
+ return tg.is_many(x) and all(isinstance(v, cfg.Scalar) for v in x)
10
+
11
+
12
+ def is_many_skyline_parameter_configs(
13
+ x: Any,
14
+ ) -> TypeGuard[pgt.Many[cfg.SkylineParameter]]:
15
+ return tg.is_many(x) and all(isinstance(v, cfg.SkylineParameter) for v in x)
16
+
17
+
18
+ def is_skyline_vector_config(x: Any) -> TypeGuard[cfg.SkylineVector]:
19
+ return isinstance(
20
+ x, str | pgt.Scalar | cfg.SkylineVectorModel
21
+ ) or is_many_skyline_parameter_configs(x)
22
+
23
+
24
+ def is_many_skyline_vector_configs(x: Any) -> TypeGuard[pgt.Many[cfg.SkylineVector]]:
25
+ return tg.is_many(x) and all(is_skyline_vector_config(v) for v in x)
@@ -1,6 +1,6 @@
1
1
  [tool.poetry]
2
2
  name = "phylogenie"
3
- version = "2.0.11"
3
+ version = "2.0.13"
4
4
  description = "Generate phylogenetic datasets with minimal setup effort"
5
5
  authors = ["Gabriele Marino <gabmarino.8601@gmail.com>"]
6
6
  readme = "README.md"
@@ -1,28 +0,0 @@
1
- from typing import Any, TypeGuard
2
-
3
- import phylogenie.generators.configs as cfg
4
- import phylogenie.typings as pgt
5
-
6
-
7
- def is_list(x: Any) -> TypeGuard[list[Any]]:
8
- return isinstance(x, list)
9
-
10
-
11
- def is_list_of_scalar_configs(x: Any) -> TypeGuard[list[cfg.Scalar]]:
12
- return is_list(x) and all(isinstance(v, cfg.Scalar) for v in x)
13
-
14
-
15
- def is_list_of_skyline_parameter_configs(
16
- x: Any,
17
- ) -> TypeGuard[list[cfg.SkylineParameter]]:
18
- return is_list(x) and all(isinstance(v, cfg.SkylineParameter) for v in x)
19
-
20
-
21
- def is_skyline_vector_config(x: Any) -> TypeGuard[cfg.SkylineVector]:
22
- return isinstance(
23
- x, str | pgt.Scalar | cfg.SkylineVectorModel
24
- ) or is_list_of_skyline_parameter_configs(x)
25
-
26
-
27
- def is_list_of_skyline_vector_configs(x: Any) -> TypeGuard[list[cfg.SkylineVector]]:
28
- return is_list(x) and all(is_skyline_vector_config(v) for v in x)
File without changes
File without changes