domainiac 0.1.3__tar.gz → 0.1.5__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: domainiac
3
- Version: 0.1.3
3
+ Version: 0.1.5
4
4
  Summary: Package for working with Energinet data, but with specialized functions used for Enigma.
5
5
  Author: Team Enigma
6
6
  Author-email: gridop-enigma@energinet.dk
@@ -0,0 +1,79 @@
1
+ import datamazing.pandas as pdz
2
+ import pandas as pd
3
+ from typeguard import typechecked
4
+
5
+
6
+ class ResourceManager:
7
+ """
8
+ Manager which simplifies the process of handling resource schedules.
9
+ Scheduled resources are delivered in a 5 min resolution. If a coarser
10
+ resolution (a longer interval) is chosen,
11
+ the result will be the most conservative value in the time interval,
12
+ i.e. max of minimum capacity and min of maximum capacity.
13
+ If no resolution is given, the default is 5 min.
14
+ If resolution is less than 5 min, the resulting time series will
15
+ default to 5 min resolution.
16
+ """
17
+
18
+ def __init__(
19
+ self,
20
+ db: pdz.Database,
21
+ time_interval: pdz.TimeInterval,
22
+ resolution: pd.Timedelta = pd.Timedelta("PT5M"),
23
+ ) -> None:
24
+ self.db = db
25
+ self.time_interval = time_interval
26
+ self.resolution = resolution
27
+
28
+ @typechecked
29
+ def get_resource_schedules(self, resource_gsrn: str | list[str]) -> pd.DataFrame:
30
+ """Gets resource schedules for a given list of resource gsrns."""
31
+ df_resource_schedules = self.db.query(
32
+ table_name="scheduleResourcePowerPlan",
33
+ time_interval=self.time_interval,
34
+ filters={"resource_gsrn": resource_gsrn},
35
+ )
36
+
37
+ if df_resource_schedules.empty:
38
+ raise ValueError(f"No resource schedules found for gsrn {resource_gsrn}.")
39
+
40
+ df_resource_resampled = (
41
+ pdz.group(
42
+ df_resource_schedules,
43
+ by=[
44
+ "market_participant",
45
+ "created_time_utc",
46
+ "price_area",
47
+ "resource_gsrn",
48
+ ],
49
+ )
50
+ .resample(on="time_utc", resolution=self.resolution)
51
+ .agg(
52
+ {
53
+ "schedule_power_MW": "mean",
54
+ "schedule_capacity_min_MW": "max",
55
+ "schedule_capacity_max_MW": "min",
56
+ }
57
+ )
58
+ .dropna()
59
+ )
60
+ return df_resource_resampled
61
+
62
+ @typechecked
63
+ def get_latest_resource_schedules(
64
+ self,
65
+ resource_gsrn: str | list[str],
66
+ ) -> pd.DataFrame:
67
+ """Gets the latest resource schedules for a given list of resource gsrns."""
68
+
69
+ df_resource_schedules = self.get_resource_schedules(resource_gsrn=resource_gsrn)
70
+
71
+ df_latest_created_time = pdz.group(
72
+ df=df_resource_schedules, by=["resource_gsrn", "time_utc"]
73
+ ).agg({"created_time_utc": "max"})
74
+
75
+ df_resource_latest = df_latest_created_time.merge(
76
+ df_resource_schedules, on=list(df_latest_created_time.columns)
77
+ )
78
+
79
+ return df_resource_latest
@@ -1,6 +1,6 @@
1
1
  [tool.poetry]
2
2
  name = "domainiac"
3
- version = "0.1.3"
3
+ version = "0.1.5"
4
4
  description = "Package for working with Energinet data, but with specialized functions used for Enigma."
5
5
  authors = ["Team Enigma <gridop-enigma@energinet.dk>"]
6
6
  packages = [
@@ -1,65 +0,0 @@
1
- import datamazing.pandas as pdz
2
- import pandas as pd
3
- from typeguard import typechecked
4
-
5
-
6
- class ResourceManager:
7
- """
8
- Manager which simplifies the process of handling resource schedules.
9
- """
10
-
11
- def __init__(
12
- self,
13
- db: pdz.Database,
14
- time_interval: pdz.TimeInterval,
15
- ) -> None:
16
- self.db = db
17
- self.time_interval = time_interval
18
-
19
- @typechecked
20
- def get_resource_schedules(
21
- self,
22
- resource_gsrns: list,
23
- ) -> pd.DataFrame:
24
- """Gets resource schedules for a given list of resource gsrns."""
25
- df_resource_schedules = self.db.query(
26
- table_name="resourceSchedule",
27
- time_interval=self.time_interval,
28
- filters={"resource_gsrn": resource_gsrns},
29
- )
30
- df_resource_schedules = df_resource_schedules.filter(
31
- [
32
- "market_participant",
33
- "created_time_utc",
34
- "price_area",
35
- "resource_gsrn",
36
- "main_fuel_type",
37
- "is_sum_plan",
38
- "time_utc",
39
- "schedule_power_MW",
40
- "schedule_capacity_min_MW",
41
- "schedule_capacity_max_MW",
42
- ]
43
- )
44
- return df_resource_schedules
45
-
46
- @typechecked
47
- def get_latest_resource_plan(
48
- self,
49
- resource_gsrns: list,
50
- ) -> pd.DataFrame:
51
- """Gets the latest resource schedules for a given list of resource gsrns."""
52
-
53
- df_resource_schedules = self.get_resource_schedules(
54
- resource_gsrns=resource_gsrns
55
- )
56
-
57
- df_latest_created_time = pdz.group(
58
- df=df_resource_schedules, by=["resource_gsrn", "time_utc"]
59
- ).agg({"created_time_utc": max})
60
-
61
- df_resource_latest = df_latest_created_time.merge(
62
- df_resource_schedules, on=list(df_latest_created_time.columns)
63
- )
64
-
65
- return df_resource_latest