halib 0.2.32__py3-none-any.whl → 0.2.34__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -0,0 +1,234 @@
1
+ import os
2
+ import pandas as pd
3
+ from typing import List, Optional, Callable, Union
4
+ from rich.pretty import pprint
5
+ import plotly.express as px
6
+ from ..common.common import pprint_local_path
7
+
8
+
9
+ class PlotlyUtils:
10
+ @staticmethod
11
+ # Extract experiment IDs from complex naming convention
12
+ def exp_id_extractor(df: pd.DataFrame) -> pd.Series:
13
+ # MainPC__ds_UFireIndoor2__mt_temp_method_motion_block__9896ed2e67e7__20260202.133758
14
+ exp_names = df["Name"].to_list()
15
+ exp_ids = []
16
+ for name in exp_names:
17
+ parts = name.split("__")
18
+ exp_id = parts[-2] if len(parts) >= 2 else name
19
+ exp_ids.append(exp_id)
20
+ return pd.Series(exp_ids)
21
+
22
+ @staticmethod
23
+ def exp_id_formatter(exp_id: str) -> str:
24
+ if len(exp_id) <= 6:
25
+ return exp_id
26
+ return f"{exp_id[:6]}"
27
+
28
+ @staticmethod
29
+ def parallel_plot(
30
+ df_or_csv_file: Union[pd.DataFrame, str],
31
+ dimensions: List[str] = [],
32
+ exclude_dims: List[str] = [],
33
+ exp_col_or_func: Union[
34
+ str, Callable[[pd.DataFrame], pd.Series]
35
+ ] = exp_id_extractor,
36
+ exp_id_formatter: Optional[Callable[[str], str]] = exp_id_formatter,
37
+ color: Optional[str] = None,
38
+ csv_separator: str = ";",
39
+ plot_bar_height: int = 1200,
40
+ plot_width: int = 1500,
41
+ title: str = "Parallel Coordinates Plot",
42
+ template: str = "plotly_white",
43
+ outdir: str = ".",
44
+ outfile: str = "zresults_with_table.html",
45
+ ):
46
+ # 1. Unified Data Loading
47
+ if isinstance(df_or_csv_file, str):
48
+ df = pd.read_csv(df_or_csv_file, sep=csv_separator, encoding="utf-8")
49
+ else:
50
+ df = df_or_csv_file.copy()
51
+
52
+ # 2. Extract Experiment IDs
53
+ if callable(exp_col_or_func):
54
+ df["exp_id"] = exp_col_or_func(df)
55
+ elif isinstance(exp_col_or_func, str):
56
+ if exp_col_or_func not in df.columns:
57
+ raise ValueError(f"Column '{exp_col_or_func}' not found.")
58
+ df["exp_id"] = df[exp_col_or_func].copy()
59
+ exclude_dims.append(exp_col_or_func)
60
+ else:
61
+ raise ValueError("exp_col_or_func must be a column name or a callable.")
62
+
63
+ # 3. Setup Plot Dimensions
64
+ # Priority: explicit dimensions -> all columns minus exclusions
65
+ if not dimensions:
66
+ dimensions = [
67
+ c for c in df.columns if c not in exclude_dims and c != "exp_id"
68
+ ]
69
+
70
+ df["numeric_id"] = range(len(df))
71
+ # Ensure numeric_id is the first axis for the labels to work
72
+ final_plot_dims = ["numeric_id"] + [
73
+ d for d in dimensions if d != "numeric_id" and d in df.columns
74
+ ]
75
+
76
+ pprint(f"Generating plot: {title}")
77
+
78
+ # 4. Create and Configure Plotly Figure
79
+ fig = px.parallel_coordinates(
80
+ df,
81
+ dimensions=final_plot_dims,
82
+ color=color,
83
+ title=title,
84
+ template=template,
85
+ )
86
+
87
+ # Map string IDs to the numeric axis
88
+ fig.data[0].dimensions[0].tickvals = list(df["numeric_id"])
89
+ fig.data[0].dimensions[0].ticktext = (
90
+ [exp_id_formatter(i) for i in df["exp_id"]]
91
+ if exp_id_formatter
92
+ else df["exp_id"]
93
+ )
94
+ fig.data[0].dimensions[0].label = "Exp IDs"
95
+
96
+ fig.update_layout(
97
+ title={
98
+ "text": title,
99
+ "y": 0.98,
100
+ "x": 0.5,
101
+ "xanchor": "center",
102
+ "yanchor": "top",
103
+ },
104
+ width=plot_width,
105
+ height=plot_bar_height,
106
+ margin=dict(l=150, r=50, t=150, b=50),
107
+ )
108
+
109
+ # 5. Prepare Table Display
110
+ # Clean up columns: Move exp_id to front, drop internal numeric_id
111
+ cols = ["exp_id"] + [c for c in df.columns if c not in ["exp_id", "numeric_id"]]
112
+ df_display = df[cols].copy()
113
+ df_display.insert(0, "Selection", '<button class="select-btn">Select</button>')
114
+
115
+ chart_html = fig.to_html(full_html=False, include_plotlyjs="cdn")
116
+
117
+ # Create a display copy with a 'Select' button column
118
+ df_display = df.copy()
119
+ df_display_cols = df_display.columns.tolist()
120
+ # move 'exp_id' to the front for better visibility
121
+ if "exp_id" in df_display_cols:
122
+ df_display_cols.insert(
123
+ 0, df_display_cols.pop(df_display_cols.index("exp_id"))
124
+ )
125
+ df_display = df_display[df_display_cols]
126
+ # remove 'numeric_id' from display
127
+ if "numeric_id" in df_display.columns:
128
+ df_display = df_display.drop(columns=["numeric_id"])
129
+ df_display.insert(0, "Selection", '<button class="select-btn">Select</button>')
130
+
131
+ table_html = df_display.to_html(
132
+ classes="display nowrap", table_id="exp_table", index=False, escape=False
133
+ )
134
+
135
+ final_html = f"""
136
+ <!DOCTYPE html>
137
+ <html>
138
+ <head>
139
+ <title>Experiment Dashboard</title>
140
+ <link rel="stylesheet" type="text/css" href="https://cdn.datatables.net/1.11.5/css/jquery.dataTables.css">
141
+ <script type="text/javascript" charset="utf8" src="https://code.jquery.com/jquery-3.5.1.js"></script>
142
+ <script type="text/javascript" charset="utf8" src="https://cdn.datatables.net/1.11.5/js/jquery.dataTables.js"></script>
143
+ <style>
144
+ body {{ font-family: 'Segoe UI', Tahoma, Geneva, Verdana, sans-serif; margin: 20px; background-color: #f0f2f5; }}
145
+ .container {{ background: white; padding: 30px; border-radius: 12px; box-shadow: 0 4px 20px rgba(0,0,0,0.08); }}
146
+ #exp_table tbody tr:nth-child(even), #selected_table tbody tr:nth-child(even) {{ background-color: #f2f2f2; }}
147
+ #exp_table tbody tr:nth-child(odd), #selected_table tbody tr:nth-child(odd) {{ background-color: #ffffff; }}
148
+ #exp_table tbody tr:hover, #selected_table tbody tr:hover {{ background-color: #e0e0e0; }}
149
+ table.dataTable thead th {{ background-color: #333; color: white; padding: 12px; }}
150
+ h2 {{ color: #2c3e50; border-bottom: 2px solid #eee; padding-bottom: 10px; margin-top: 40px; }}
151
+ .select-btn {{ background-color: #28a745; color: white; border: none; padding: 5px 10px; cursor: pointer; border-radius: 4px; }}
152
+ .remove-btn {{ background-color: #dc3545; color: white; border: none; padding: 5px 10px; cursor: pointer; border-radius: 4px; }}
153
+ .clear-btn {{ background-color: #6c757d; color: white; border: none; padding: 10px 15px; cursor: pointer; border-radius: 4px; margin-bottom: 10px; }}
154
+ </style>
155
+ </head>
156
+ <body>
157
+ <div class="container">
158
+ {chart_html}
159
+
160
+ <h2>Selected Experiments</h2>
161
+ <button id="clear_all" class="clear-btn">Clear All</button>
162
+ <div style="overflow-x:auto; margin-bottom: 40px;">
163
+ <table id="selected_table" class="display nowrap">
164
+ <thead>{df_display.iloc[:0].to_html(index=False, escape=False).split("<thead>")[1].split("</thead>")[0]}</thead>
165
+ <tbody></tbody>
166
+ </table>
167
+ </div>
168
+
169
+ <hr>
170
+
171
+ <h2>Full Experiment Raw Data</h2>
172
+ <div style="overflow-x:auto;">
173
+ {table_html}
174
+ </div>
175
+ </div>
176
+
177
+ <script>
178
+ $(document).ready( function () {{
179
+ var mainTable = $('#exp_table').DataTable({{
180
+ "pageLength": 25,
181
+ "order": [[ 5, "desc" ]],
182
+ "stripeClasses": []
183
+ }});
184
+
185
+ var selectedTable = $('#selected_table').DataTable({{
186
+ "paging": false,
187
+ "searching": false,
188
+ "info": false,
189
+ "stripeClasses": []
190
+ }});
191
+
192
+ // Handle Select button
193
+ $('#exp_table tbody').on('click', '.select-btn', function () {{
194
+ var data = mainTable.row($(this).parents('tr')).data();
195
+ var rowNode = $(this).parents('tr');
196
+
197
+ // Change button to remove in the new table
198
+ var newData = [...data];
199
+ newData[0] = '<button class="remove-btn">Remove</button>';
200
+
201
+ // Check if already in selectedTable (optional but good)
202
+ var alreadyExists = false;
203
+ selectedTable.rows().every(function() {{
204
+ if(this.data()[1] === data[1]) {{ alreadyExists = true; }}
205
+ }});
206
+
207
+ if(!alreadyExists) {{
208
+ selectedTable.row.add(newData).draw();
209
+ }}
210
+ }});
211
+
212
+ // Handle Remove button
213
+ $('#selected_table tbody').on('click', '.remove-btn', function () {{
214
+ selectedTable.row($(this).parents('tr')).remove().draw();
215
+ }});
216
+
217
+ // Handle Clear All
218
+ $('#clear_all').on('click', function() {{
219
+ selectedTable.clear().draw();
220
+ }});
221
+ }});
222
+ </script>
223
+ </body>
224
+ </html>
225
+ """
226
+
227
+ final_html_path = os.path.join(outdir, outfile)
228
+ with open(final_html_path, "w") as f:
229
+ f.write(final_html)
230
+
231
+ pprint_local_path(
232
+ final_html_path, get_wins_path=True, tag="PlotlyUtils.parallel_plot"
233
+ )
234
+ return fig
@@ -0,0 +1,86 @@
1
+ import time
2
+ from slack_sdk import WebClient
3
+ from slack_sdk.errors import SlackApiError
4
+ from rich.pretty import pprint
5
+
6
+ """
7
+ Utilities for interacting with Slack for experiment notification via Wandb Logger.
8
+ """
9
+ class SlackUtils:
10
+ _instance = None
11
+
12
+ def __new__(cls, token=None):
13
+ """
14
+ Singleton __new__ method.
15
+ Ensures only one instance of SlackUtils exists.
16
+ """
17
+ if cls._instance is None:
18
+ if token is None:
19
+ raise ValueError(
20
+ "A Slack Token is required for the first initialization."
21
+ )
22
+
23
+ # Create the instance
24
+ cls._instance = super(SlackUtils, cls).__new__(cls)
25
+
26
+ # Initialize the WebClient only once
27
+ cls._instance.client = WebClient(token=token)
28
+ cls._instance.token = token
29
+
30
+ return cls._instance
31
+
32
+ def clear_channel(self, channel_id, sleep_interval=1.0):
33
+ """
34
+ Fetches and deletes all messages in a specified channel.
35
+ """
36
+ cursor = None
37
+ deleted_count = 0
38
+
39
+ pprint(f"--- Starting cleanup for Channel ID: {channel_id} ---")
40
+
41
+ while True:
42
+ try:
43
+ # Fetch history in batches of 100
44
+ response = self.client.conversations_history( # ty:ignore[unresolved-attribute]
45
+ channel=channel_id, cursor=cursor, limit=100
46
+ )
47
+
48
+ messages = response.get("messages", [])
49
+
50
+ if not messages:
51
+ pprint("No more messages found to delete.")
52
+ break
53
+
54
+ for msg in messages:
55
+ ts = msg.get("ts")
56
+
57
+ try:
58
+ # Attempt delete
59
+ self.client.chat_delete( # ty:ignore[unresolved-attribute]
60
+ channel=channel_id, ts=ts
61
+ )
62
+ pprint(f"Deleted: {ts}")
63
+ deleted_count += 1
64
+
65
+ # Rate limit protection (Tier 3 limit)
66
+ time.sleep(sleep_interval)
67
+
68
+ except SlackApiError as e:
69
+ error_code = e.response["error"]
70
+ if error_code == "cant_delete_message":
71
+ pprint(f"Skipped (Permission denied): {ts}")
72
+ elif error_code == "message_not_found":
73
+ pprint(f"Skipped (Already deleted): {ts}")
74
+ else:
75
+ pprint(f"Error deleting {ts}: {error_code}")
76
+ # Check for pagination
77
+ if response["has_more"]:
78
+ cursor = response["response_metadata"]["next_cursor"]
79
+ else:
80
+ break
81
+
82
+ except SlackApiError as e:
83
+ print(f"Critical API Error fetching history: {e.response['error']}")
84
+ break
85
+
86
+ print(f"--- Completed. Total messages deleted: {deleted_count} ---")
@@ -0,0 +1,140 @@
1
+ import glob
2
+ import wandb
3
+ import subprocess
4
+ from pathlib import Path
5
+ from typing import Optional, Literal
6
+
7
+ from tap import Tap
8
+ from tqdm import tqdm
9
+
10
+ from rich.console import Console
11
+ import yaml
12
+
13
+ wandb_console = Console()
14
+
15
+
16
+ # --- Argument Parser ---
17
+ class WandbArgs(Tap):
18
+ # --- Auth ---
19
+ api_key_yaml: Path = Path(
20
+ "E:/Dev/__halib/.env.yaml"
21
+ ) # Path to YAML file containing W&B API key
22
+
23
+ # --- Operations ---
24
+ op: Literal["sync", "delete"] = "delete" # Operation to perform
25
+
26
+ # --- Project & Filtering ---
27
+ project: str = "paper2_main" # W&B project name
28
+ pattern: Optional[str] = None # Run name pattern to match for deletion
29
+
30
+ # --- Paths ---
31
+ outdir: Path = Path("./zout/zruns") # Directory containing runs to sync
32
+
33
+ def configure(self):
34
+ self.add_argument("-prj", "--project")
35
+ self.add_argument("-pt", "--pattern")
36
+ self.add_argument("-o", "--outdir")
37
+ self.add_argument("-k", "--api_key_yaml")
38
+
39
+ def validate(self):
40
+ if self.op == "sync" and not self.outdir.exists():
41
+ raise ValueError(f"Output directory {self.outdir} does not exist.")
42
+ if self.op == "delete" and not self.project.strip():
43
+ raise ValueError("Project name must be a non-empty string.")
44
+
45
+
46
+ def login_wandb(api_key: Optional[str]):
47
+ """Handles authentication with Weights & Biases."""
48
+ try:
49
+ if api_key:
50
+ # Explicit login with key
51
+ wandb.login(key=api_key)
52
+ wandb_console.print(
53
+ "[green]Successfully logged into W&B using provided API key.[/green]"
54
+ )
55
+ else:
56
+ # Attempts to find key in environment variables or netrc file
57
+ if wandb.login():
58
+ wandb_console.print(
59
+ "[blue]Logged into W&B using existing credentials.[/blue]"
60
+ )
61
+ else:
62
+ wandb_console.print(
63
+ "[red]Authentication failed. Please provide an API key with -k.[/red]"
64
+ )
65
+ exit(1)
66
+ except Exception as e:
67
+ wandb_console.print(f"[bold red]Login Error:[/bold red] {e}")
68
+ exit(1)
69
+
70
+
71
+ # --- Logic Functions ---
72
+
73
+
74
+ def sync_runs(outdir: Path):
75
+ outdir_path = outdir.absolute()
76
+ sub_dirs = [d for d in outdir_path.iterdir() if d.is_dir()]
77
+
78
+ if not sub_dirs:
79
+ wandb_console.print(f"[red]No subdirectories found in {outdir_path}.[/red]")
80
+ return
81
+
82
+ wandb_console.rule(f"Syncing from {outdir_path}")
83
+
84
+ wandb_dirs = []
85
+ for exp_dir in sub_dirs:
86
+ wandb_dirs.extend(glob.glob(str(exp_dir / "wandb" / "*run-*")))
87
+
88
+ if not wandb_dirs:
89
+ wandb_console.print("No wandb runs found.")
90
+ return
91
+
92
+ for i, wandb_dir in enumerate(wandb_dirs):
93
+ wandb_console.print(f"[{i+1}/{len(wandb_dirs)}] Syncing: {wandb_dir}")
94
+
95
+ # Note: 'wandb sync' command uses the credentials from wandb.login()
96
+ process = subprocess.Popen(
97
+ ["wandb", "sync", wandb_dir],
98
+ stdout=subprocess.PIPE,
99
+ stderr=subprocess.STDOUT,
100
+ text=True,
101
+ )
102
+ for line in process.stdout: # ty:ignore[not-iterable]
103
+ if "ERROR" in line:
104
+ wandb_console.print(f"[red]{line.strip()}[/red]")
105
+ process.wait()
106
+
107
+
108
+ def delete_runs(project: str, pattern: Optional[str]):
109
+ api = wandb.Api()
110
+ runs = api.runs(project)
111
+
112
+ deleted = 0
113
+ for run in tqdm(runs, desc="Processing runs"):
114
+ if pattern is None or pattern in run.name:
115
+ run.delete()
116
+ deleted += 1
117
+ wandb_console.print(f"[green]Total runs deleted: {deleted}[/green]")
118
+
119
+
120
+ def main():
121
+ args = WandbArgs().parse_args()
122
+ cfg_dict = {}
123
+ with open(args.api_key_yaml, "r") as f:
124
+ cfg_dict = yaml.safe_load(f)
125
+ wandb_api_key = cfg_dict.get("WANDB_API_KEY")
126
+ assert (
127
+ wandb_api_key is not None
128
+ ), "W&B API key not found in the specified YAML file."
129
+ # 1. Login first
130
+ login_wandb(wandb_api_key)
131
+
132
+ # 2. Execute operation
133
+ if args.op == "sync":
134
+ sync_runs(args.outdir)
135
+ elif args.op == "delete":
136
+ delete_runs(args.project, args.pattern)
137
+
138
+
139
+ if __name__ == "__main__":
140
+ main()
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: halib
3
- Version: 0.2.32
3
+ Version: 0.2.34
4
4
  Summary: Small library for common tasks
5
5
  Author: Hoang Van Ha
6
6
  Author-email: hoangvanhauit@gmail.com
@@ -57,7 +57,12 @@ Dynamic: summary
57
57
 
58
58
  ## v0.2.x (Experiment & Core Updates)
59
59
 
60
- ### **v0.2.32**
60
+ ### **v0.2.34**
61
+
62
+ - ✨ **New Feature:**: introduce `utils.PlotlyUtils` with parallel coordinates plot and data table support
63
+
64
+ - 🚀 **Improvement:**: move `wandb_op.py` to `utils` and add `scripts` folder
65
+
61
66
 
62
67
  - ✨ **New Feature:**: add `common.common.log_func` as decorator to log function entry, exit, with execution time and arguments.
63
68
 
@@ -100,11 +100,14 @@ halib/utils/dict_op.py,sha256=wYE6Iw-_CnCWdMg9tpJ2Y2-e2ESkW9FxmdBkZkbUh80,299
100
100
  halib/utils/gpu_mon.py,sha256=vD41_ZnmPLKguuq9X44SB_vwd9JrblO4BDzHLXZhhFY,2233
101
101
  halib/utils/list.py,sha256=bbey9_0IaMXnHx1pudv3C3_WU9uFQEQ5qHPklSN-7o0,498
102
102
  halib/utils/listop.py,sha256=Vpa8_2fI0wySpB2-8sfTBkyi_A4FhoFVVvFiuvW8N64,339
103
+ halib/utils/plotly_op.py,sha256=RzN7dHzNzJUfSgzKh6Yh60xR709YQUw0IXEvui5EBvw,9799
103
104
  halib/utils/slack.py,sha256=2ugWE_eJ0s479ObACJbx7iEu3kjMPD4Rt2hEwuMpuNQ,3099
105
+ halib/utils/slack_op.py,sha256=2ugWE_eJ0s479ObACJbx7iEu3kjMPD4Rt2hEwuMpuNQ,3099
104
106
  halib/utils/tele_noti.py,sha256=-4WXZelCA4W9BroapkRyIdUu9cUVrcJJhegnMs_WpGU,5928
105
107
  halib/utils/video.py,sha256=zLoj5EHk4SmP9OnoHjO8mLbzPdtq6gQPzTQisOEDdO8,3261
106
- halib-0.2.32.dist-info/licenses/LICENSE.txt,sha256=qZssdna4aETiR8znYsShUjidu-U4jUT9Q-EWNlZ9yBQ,1100
107
- halib-0.2.32.dist-info/METADATA,sha256=nNZlX11Q-7O3QWNeUooBUbYCicmwJnJC-4ue44mVYA4,8183
108
- halib-0.2.32.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
109
- halib-0.2.32.dist-info/top_level.txt,sha256=7AD6PLaQTreE0Fn44mdZsoHBe_Zdd7GUmjsWPyQ7I-k,6
110
- halib-0.2.32.dist-info/RECORD,,
108
+ halib/utils/wandb_op.py,sha256=qqDdTMW4J07bzuJTTg2HoLAPs21nVEbwt2-Aa5ZKiVk,4336
109
+ halib-0.2.34.dist-info/licenses/LICENSE.txt,sha256=qZssdna4aETiR8znYsShUjidu-U4jUT9Q-EWNlZ9yBQ,1100
110
+ halib-0.2.34.dist-info/METADATA,sha256=C5Pu5me0s-Giwn_xdybYhRxCoMu0rR6cFzkIOdfuejw,8379
111
+ halib-0.2.34.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
112
+ halib-0.2.34.dist-info/top_level.txt,sha256=7AD6PLaQTreE0Fn44mdZsoHBe_Zdd7GUmjsWPyQ7I-k,6
113
+ halib-0.2.34.dist-info/RECORD,,
File without changes