windows-mcp 0.5.8__tar.gz → 0.6.0__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (45)
  1. windows_mcp-0.6.0/.github/FUNDING.yml +15 -0
  2. {windows_mcp-0.5.8 → windows_mcp-0.6.0}/.mcpbignore +3 -1
  3. {windows_mcp-0.5.8 → windows_mcp-0.6.0}/PKG-INFO +27 -21
  4. {windows_mcp-0.5.8 → windows_mcp-0.6.0}/README.md +24 -15
  5. {windows_mcp-0.5.8 → windows_mcp-0.6.0}/SECURITY.md +15 -15
  6. windows_mcp-0.6.0/assets/logo.png +0 -0
  7. {windows_mcp-0.5.8 → windows_mcp-0.6.0}/manifest.json +2 -2
  8. {windows_mcp-0.5.8 → windows_mcp-0.6.0}/pyproject.toml +3 -6
  9. {windows_mcp-0.5.8 → windows_mcp-0.6.0}/src/windows_mcp/__main__.py +299 -314
  10. {windows_mcp-0.5.8 → windows_mcp-0.6.0}/src/windows_mcp/analytics.py +0 -5
  11. {windows_mcp-0.5.8 → windows_mcp-0.6.0}/src/windows_mcp/desktop/service.py +638 -458
  12. {windows_mcp-0.5.8 → windows_mcp-0.6.0}/src/windows_mcp/desktop/views.py +7 -5
  13. windows_mcp-0.6.0/src/windows_mcp/tree/cache_utils.py +126 -0
  14. {windows_mcp-0.5.8 → windows_mcp-0.6.0}/src/windows_mcp/tree/config.py +25 -0
  15. windows_mcp-0.6.0/src/windows_mcp/tree/service.py +543 -0
  16. {windows_mcp-0.5.8 → windows_mcp-0.6.0}/src/windows_mcp/tree/views.py +142 -116
  17. {windows_mcp-0.5.8 → windows_mcp-0.6.0}/src/windows_mcp/uia/controls.py +11 -2
  18. {windows_mcp-0.5.8 → windows_mcp-0.6.0}/src/windows_mcp/uia/core.py +9 -0
  19. windows_mcp-0.6.0/src/windows_mcp/vdm/__init__.py +1 -0
  20. windows_mcp-0.6.0/src/windows_mcp/vdm/core.py +490 -0
  21. {windows_mcp-0.5.8 → windows_mcp-0.6.0}/src/windows_mcp/watchdog/event_handlers.py +13 -9
  22. {windows_mcp-0.5.8 → windows_mcp-0.6.0}/src/windows_mcp/watchdog/service.py +15 -4
  23. {windows_mcp-0.5.8 → windows_mcp-0.6.0}/uv.lock +8 -544
  24. windows_mcp-0.5.8/assets/demo1.mov +0 -0
  25. windows_mcp-0.5.8/assets/demo2.mov +0 -0
  26. windows_mcp-0.5.8/assets/logo.png +0 -0
  27. windows_mcp-0.5.8/src/windows_mcp/tree/service.py +0 -601
  28. {windows_mcp-0.5.8 → windows_mcp-0.6.0}/.gitignore +0 -0
  29. {windows_mcp-0.5.8 → windows_mcp-0.6.0}/.python-version +0 -0
  30. {windows_mcp-0.5.8 → windows_mcp-0.6.0}/CONTRIBUTING.md +0 -0
  31. {windows_mcp-0.5.8 → windows_mcp-0.6.0}/LICENSE.md +0 -0
  32. {windows_mcp-0.5.8 → windows_mcp-0.6.0}/assets/screenshots/screenshot_1.png +0 -0
  33. {windows_mcp-0.5.8 → windows_mcp-0.6.0}/assets/screenshots/screenshot_2.png +0 -0
  34. {windows_mcp-0.5.8 → windows_mcp-0.6.0}/assets/screenshots/screenshot_3.png +0 -0
  35. {windows_mcp-0.5.8 → windows_mcp-0.6.0}/server.json +0 -0
  36. {windows_mcp-0.5.8 → windows_mcp-0.6.0}/src/windows_mcp/__init__.py +0 -0
  37. {windows_mcp-0.5.8 → windows_mcp-0.6.0}/src/windows_mcp/desktop/__init__.py +0 -0
  38. {windows_mcp-0.5.8 → windows_mcp-0.6.0}/src/windows_mcp/desktop/config.py +0 -0
  39. {windows_mcp-0.5.8 → windows_mcp-0.6.0}/src/windows_mcp/tree/__init__.py +0 -0
  40. {windows_mcp-0.5.8 → windows_mcp-0.6.0}/src/windows_mcp/tree/utils.py +0 -0
  41. {windows_mcp-0.5.8 → windows_mcp-0.6.0}/src/windows_mcp/uia/__init__.py +0 -0
  42. {windows_mcp-0.5.8 → windows_mcp-0.6.0}/src/windows_mcp/uia/enums.py +0 -0
  43. {windows_mcp-0.5.8 → windows_mcp-0.6.0}/src/windows_mcp/uia/events.py +0 -0
  44. {windows_mcp-0.5.8 → windows_mcp-0.6.0}/src/windows_mcp/uia/patterns.py +0 -0
  45. {windows_mcp-0.5.8 → windows_mcp-0.6.0}/src/windows_mcp/watchdog/__init__.py +0 -0
@@ -0,0 +1,15 @@
1
+ # These are supported funding model platforms
2
+
3
+ github: # Replace with up to 4 GitHub Sponsors-enabled usernames e.g., [user1, user2]
4
+ patreon: # Replace with a single Patreon username
5
+ open_collective: # Replace with a single Open Collective username
6
+ ko_fi: # Replace with a single Ko-fi username
7
+ tidelift: # Replace with a single Tidelift platform-name/package-name e.g., npm/babel
8
+ community_bridge: # Replace with a single Community Bridge project-name e.g., cloud-foundry
9
+ liberapay: # Replace with a single Liberapay username
10
+ issuehunt: # Replace with a single IssueHunt username
11
+ lfx_crowdfunding: # Replace with a single LFX Crowdfunding project-name e.g., cloud-foundry
12
+ polar: # Replace with a single Polar username
13
+ buy_me_a_coffee: jeogeoalukf
14
+ thanks_dev: gh/jeomon
15
+ custom: # Replace with up to 4 custom sponsorship URLs e.g., ['link1', 'link2']
@@ -2,4 +2,6 @@
2
2
  __pycache__
3
3
  build
4
4
  dist
5
- notebook.ipynb
5
+ *.ipynb
6
+ .github
7
+ assets
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: windows-mcp
3
- Version: 0.5.8
3
+ Version: 0.6.0
4
4
  Summary: Lightweight MCP Server for interacting with Windows Operating System.
5
5
  Project-URL: homepage, https://github.com/CursorTouch
6
6
  Author-email: Jeomon George <jeogeoalukka@gmail.com>
@@ -29,20 +29,17 @@ License-File: LICENSE.md
29
29
  Keywords: ai,ai agent,desktop,mcp,windows
30
30
  Requires-Python: >=3.13
31
31
  Requires-Dist: click>=8.2.1
32
+ Requires-Dist: comtypes>=1.4.15
32
33
  Requires-Dist: fastmcp>=2.14.2
33
34
  Requires-Dist: fuzzywuzzy>=0.18.0
34
- Requires-Dist: humancursor>=1.1.5
35
- Requires-Dist: ipykernel>=6.30.0
36
35
  Requires-Dist: markdownify>=1.1.0
37
- Requires-Dist: pdfplumber>=0.11.7
38
36
  Requires-Dist: pillow>=11.2.1
39
37
  Requires-Dist: posthog>=7.4.0
40
38
  Requires-Dist: psutil>=7.0.0
41
39
  Requires-Dist: pyautogui>=0.9.54
42
- Requires-Dist: pygetwindow>=0.0.9
43
40
  Requires-Dist: python-dotenv>=1.1.0
44
41
  Requires-Dist: python-levenshtein>=0.27.1
45
- Requires-Dist: pywinauto>=0.6.9
42
+ Requires-Dist: pywin32>=311
46
43
  Requires-Dist: requests>=2.32.3
47
44
  Requires-Dist: tabulate>=0.9.0
48
45
  Requires-Dist: uuid7>=0.1.0
@@ -76,7 +73,8 @@ Description-Content-Type: text/markdown
76
73
  mcp-name: io.github.CursorTouch/Windows-MCP
77
74
 
78
75
  ## Updates
79
- - Windows-MCP is now available on [PyPI](https://pypi.org/project/windows-mcp/) (thus supports `uvx`)
76
+ - Windows-MCP reached 1M+ Users in [Claude Desktop Extensions](https://claude.ai/directory).
77
+ - Windows-MCP is now available on [PyPI](https://pypi.org/project/windows-mcp/) (thus supports `uvx windows-mcp`)
80
78
  - Windows-MCP is added to [MCP Registry](https://github.com/modelcontextprotocol/registry)
81
79
  - Try out 🪟[Windows-Use](https://github.com/CursorTouch/Windows-Use)!!, an agent built using Windows-MCP.
82
80
  - Windows-MCP is now featured as Desktop Extension in `Claude Desktop`.
@@ -112,13 +110,15 @@ mcp-name: io.github.CursorTouch/Windows-MCP
112
110
  Easily adapt or extend tools to suit your unique automation or AI integration needs.
113
111
 
114
112
  - **Real-Time Interaction**
115
- Typical latency between actions (e.g., from one mouse click to the next) ranges from **0.7 to 2.5 secs**, and may slightly vary based on the number of active applications and system load, also the inferencing speed of the llm.
113
+ Typical latency between actions (e.g., from one mouse click to the next) ranges from **0.4 to 1.2 secs**, and may vary slightly based on the number of active applications, the system load, and the inference speed of the LLM.
116
114
 
117
115
  - **DOM Mode for Browser Automation**
118
116
  Special `use_dom=True` mode for State-Tool that focuses exclusively on web page content, filtering out browser UI elements for cleaner, more efficient web automation.
119
117
 
120
118
  ## 🛠️Installation
121
119
 
120
+ **Note:** When you install this MCP server for the first time, it may take a minute or two to install the dependencies listed in `pyproject.toml`. On the first run the server may time out; if it does, ignore the error and restart it.
121
+
122
122
  ### Prerequisites
123
123
 
124
124
  - Python 3.13+
@@ -344,17 +344,17 @@ args=[
344
344
 
345
345
  MCP Client can access the following tools to interact with Windows:
346
346
 
347
- - `Click-Tool`: Click on the screen at the given coordinates.
348
- - `Type-Tool`: Type text on an element (optionally clears existing text).
349
- - `Scroll-Tool`: Scroll vertically or horizontally on the window or specific regions.
350
- - `Drag-Tool`: Drag from one point to another.
351
- - `Move-Tool`: Move mouse pointer.
352
- - `Shortcut-Tool`: Press keyboard shortcuts (`Ctrl+c`, `Alt+Tab`, etc).
353
- - `Wait-Tool`: Pause for a defined duration.
354
- - `State-Tool`: Combined snapshot of default language, browser, active apps and interactive, textual and scrollable elements along with screenshot of the desktop. Supports `use_dom=True` for browser content extraction (web page elements only) and `use_vision=True` for including screenshots.
355
- - `App-Tool`: To launch an application from the start menu, resize or move the window and switch between apps.
356
- - `Shell-Tool`: To execute PowerShell commands.
357
- - `Scrape-Tool`: To scrape the entire webpage for information.
347
+ - `Click`: Click on the screen at the given coordinates.
348
+ - `Type`: Type text on an element (optionally clears existing text).
349
+ - `Scroll`: Scroll vertically or horizontally on the window or specific regions.
350
+ - `Drag`: Drag from one point to another.
351
+ - `Move`: Move mouse pointer.
352
+ - `Shortcut`: Press keyboard shortcuts (`Ctrl+c`, `Alt+Tab`, etc).
353
+ - `Wait`: Pause for a defined duration.
354
+ - `Snapshot`: Combined snapshot of default language, browser, active apps and interactive, textual and scrollable elements along with screenshot of the desktop. Supports `use_dom=True` for browser content extraction (web page elements only) and `use_vision=True` for including screenshots.
355
+ - `App`: To launch an application from the start menu, resize or move the window and switch between apps.
356
+ - `Shell`: To execute PowerShell commands.
357
+ - `Scrape`: To scrape the entire webpage for information.
358
358
 
359
359
  ## 🤝 Connect with Us
360
360
  Stay updated and join our community:
@@ -367,9 +367,15 @@ Stay updated and join our community:
367
367
 
368
368
  [![Star History Chart](https://api.star-history.com/svg?repos=CursorTouch/Windows-MCP&type=Date)](https://www.star-history.com/#CursorTouch/Windows-MCP&Date)
369
369
 
370
- ## ⚠️Caution
370
+ ## 👥 Contributors
371
+
372
+ Thanks to all the amazing people who have contributed to Windows-MCP! 🎉
373
+
374
+ <a href="https://github.com/CursorTouch/Windows-MCP/graphs/contributors">
375
+ <img src="https://contrib.rocks/image?repo=CursorTouch/Windows-MCP" />
376
+ </a>
371
377
 
372
- This MCP interacts directly with your Windows operating system to perform actions. Use with caution and avoid deploying it in environments where such risks cannot be tolerated.
378
+ We appreciate every contribution, whether it's code, documentation, bug reports, or feature suggestions. Want to contribute? Check out our [Contributing Guidelines](CONTRIBUTING.md)!
373
379
 
374
380
  ## 🔒 Security
375
381
 
@@ -26,7 +26,8 @@
26
26
  mcp-name: io.github.CursorTouch/Windows-MCP
27
27
 
28
28
  ## Updates
29
- - Windows-MCP is now available on [PyPI](https://pypi.org/project/windows-mcp/) (thus supports `uvx`)
29
+ - Windows-MCP reached 1M+ Users in [Claude Desktop Extensions](https://claude.ai/directory).
30
+ - Windows-MCP is now available on [PyPI](https://pypi.org/project/windows-mcp/) (thus supports `uvx windows-mcp`)
30
31
  - Windows-MCP is added to [MCP Registry](https://github.com/modelcontextprotocol/registry)
31
32
  - Try out 🪟[Windows-Use](https://github.com/CursorTouch/Windows-Use)!!, an agent built using Windows-MCP.
32
33
  - Windows-MCP is now featured as Desktop Extension in `Claude Desktop`.
@@ -62,13 +63,15 @@ mcp-name: io.github.CursorTouch/Windows-MCP
62
63
  Easily adapt or extend tools to suit your unique automation or AI integration needs.
63
64
 
64
65
  - **Real-Time Interaction**
65
- Typical latency between actions (e.g., from one mouse click to the next) ranges from **0.7 to 2.5 secs**, and may slightly vary based on the number of active applications and system load, also the inferencing speed of the llm.
66
+ Typical latency between actions (e.g., from one mouse click to the next) ranges from **0.4 to 1.2 secs**, and may vary slightly based on the number of active applications, the system load, and the inference speed of the LLM.
66
67
 
67
68
  - **DOM Mode for Browser Automation**
68
69
  Special `use_dom=True` mode for State-Tool that focuses exclusively on web page content, filtering out browser UI elements for cleaner, more efficient web automation.
69
70
 
70
71
  ## 🛠️Installation
71
72
 
73
+ **Note:** When you install this MCP server for the first time, it may take a minute or two to install the dependencies listed in `pyproject.toml`. On the first run the server may time out; if it does, ignore the error and restart it.
74
+
72
75
  ### Prerequisites
73
76
 
74
77
  - Python 3.13+
@@ -294,17 +297,17 @@ args=[
294
297
 
295
298
  MCP Client can access the following tools to interact with Windows:
296
299
 
297
- - `Click-Tool`: Click on the screen at the given coordinates.
298
- - `Type-Tool`: Type text on an element (optionally clears existing text).
299
- - `Scroll-Tool`: Scroll vertically or horizontally on the window or specific regions.
300
- - `Drag-Tool`: Drag from one point to another.
301
- - `Move-Tool`: Move mouse pointer.
302
- - `Shortcut-Tool`: Press keyboard shortcuts (`Ctrl+c`, `Alt+Tab`, etc).
303
- - `Wait-Tool`: Pause for a defined duration.
304
- - `State-Tool`: Combined snapshot of default language, browser, active apps and interactive, textual and scrollable elements along with screenshot of the desktop. Supports `use_dom=True` for browser content extraction (web page elements only) and `use_vision=True` for including screenshots.
305
- - `App-Tool`: To launch an application from the start menu, resize or move the window and switch between apps.
306
- - `Shell-Tool`: To execute PowerShell commands.
307
- - `Scrape-Tool`: To scrape the entire webpage for information.
300
+ - `Click`: Click on the screen at the given coordinates.
301
+ - `Type`: Type text on an element (optionally clears existing text).
302
+ - `Scroll`: Scroll vertically or horizontally on the window or specific regions.
303
+ - `Drag`: Drag from one point to another.
304
+ - `Move`: Move mouse pointer.
305
+ - `Shortcut`: Press keyboard shortcuts (`Ctrl+c`, `Alt+Tab`, etc).
306
+ - `Wait`: Pause for a defined duration.
307
+ - `Snapshot`: Combined snapshot of default language, browser, active apps and interactive, textual and scrollable elements along with screenshot of the desktop. Supports `use_dom=True` for browser content extraction (web page elements only) and `use_vision=True` for including screenshots.
308
+ - `App`: To launch an application from the start menu, resize or move the window and switch between apps.
309
+ - `Shell`: To execute PowerShell commands.
310
+ - `Scrape`: To scrape the entire webpage for information.
308
311
 
309
312
  ## 🤝 Connect with Us
310
313
  Stay updated and join our community:
@@ -317,9 +320,15 @@ Stay updated and join our community:
317
320
 
318
321
  [![Star History Chart](https://api.star-history.com/svg?repos=CursorTouch/Windows-MCP&type=Date)](https://www.star-history.com/#CursorTouch/Windows-MCP&Date)
319
322
 
320
- ## ⚠️Caution
323
+ ## 👥 Contributors
324
+
325
+ Thanks to all the amazing people who have contributed to Windows-MCP! 🎉
326
+
327
+ <a href="https://github.com/CursorTouch/Windows-MCP/graphs/contributors">
328
+ <img src="https://contrib.rocks/image?repo=CursorTouch/Windows-MCP" />
329
+ </a>
321
330
 
322
- This MCP interacts directly with your Windows operating system to perform actions. Use with caution and avoid deploying it in environments where such risks cannot be tolerated.
331
+ We appreciate every contribution, whether it's code, documentation, bug reports, or feature suggestions. Want to contribute? Check out our [Contributing Guidelines](CONTRIBUTING.md)!
323
332
 
324
333
  ## 🔒 Security
325
334
 
@@ -74,7 +74,7 @@ If you must use Windows-MCP on a regular system:
74
74
  2. **Regular Backups**: Maintain frequent, verified backups of all important data
75
75
  3. **Network Isolation**: Disconnect from production networks or use firewall rules
76
76
  4. **Supervised Operation**: Always monitor the agent's actions in real-time
77
- 5. **Disable High-Risk Tools**: Remove or restrict access to PowerShell-Tool and other destructive tools
77
+ 5. **Disable High-Risk Tools**: Remove or restrict access to Shell and other destructive tools
78
78
  6. **Test First**: Thoroughly test workflows in a safe environment before production use
79
79
 
80
80
  ## Security Considerations
@@ -97,11 +97,11 @@ These tools can make permanent changes to your system:
97
97
 
98
98
  | Tool | Risk | Description |
99
99
  |------|------|-------------|
100
- | **Powershell-Tool** | Critical | Can execute arbitrary PowerShell commands, including system modifications, file deletions, and network operations |
101
- | **Click-Tool** | High | Can trigger destructive UI actions (delete confirmations, system dialogs) |
102
- | **Type-Tool** | High | Can overwrite text, potentially destroying data when `clear=True` |
103
- | **Drag-Tool** | High | Can move/reorganize files, potentially overwriting existing files |
104
- | **Shortcut-Tool** | High | Can execute destructive keyboard shortcuts (Ctrl+D delete, Alt+F4 close) |
100
+ | **Shell** | Critical | Can execute arbitrary PowerShell commands, including system modifications, file deletions, and network operations |
101
+ | **Click** | High | Can trigger destructive UI actions (delete confirmations, system dialogs) |
102
+ | **Type** | High | Can overwrite text, potentially destroying data when `clear=True` |
103
+ | **Drag** | High | Can move/reorganize files, potentially overwriting existing files |
104
+ | **Shortcut** | High | Can execute destructive keyboard shortcuts (Ctrl+D delete, Alt+F4 close) |
105
105
 
106
106
  #### **Medium-Risk Tools** (Modifying but Non-Destructive)
107
107
 
@@ -109,9 +109,9 @@ These tools modify system state but are generally safe:
109
109
 
110
110
  | Tool | Risk | Description |
111
111
  |------|------|-------------|
112
- | **App-Tool** | Medium | Launches/manages applications but doesn't modify data |
113
- | **Scroll-Tool** | Low | Only changes viewport position |
114
- | **Move-Tool** | Low | Only positions mouse cursor |
112
+ | **App** | Medium | Launches/manages applications but doesn't modify data |
113
+ | **Scroll** | Low | Only changes viewport position |
114
+ | **Move** | Low | Only positions mouse cursor |
115
115
 
116
116
  #### **Low-Risk Tools** (Read-Only)
117
117
 
@@ -119,9 +119,9 @@ These tools only read information without making changes:
119
119
 
120
120
  | Tool | Risk | Description |
121
121
  |------|------|-------------|
122
- | **State-Tool** | Safe | Only captures desktop state and screenshots |
123
- | **Wait-Tool** | Safe | Only pauses execution |
124
- | **Scrape-Tool** | Safe* | Fetches web content (*may expose browsing activity) |
122
+ | **Snapshot** | Safe | Only captures desktop state and screenshots |
123
+ | **Wait** | Safe | Only pauses execution |
124
+ | **Scrape** | Safe* | Fetches web content (*may expose browsing activity) |
125
125
 
126
126
  ## Best Practices
127
127
 
@@ -140,7 +140,7 @@ These tools only read information without making changes:
140
140
  ### 3. **Monitor Tool Usage**
141
141
 
142
142
  - Regularly review logs to understand what actions are being performed
143
- - Be especially vigilant with high-risk tools (Powershell-Tool, Click-Tool, etc.)
143
+ - Be especially vigilant with high-risk tools (Shell, Click, etc.)
144
144
  - Set up alerts for unexpected or suspicious activity
145
145
 
146
146
  ### 4. **Network Security**
@@ -152,8 +152,8 @@ These tools only read information without making changes:
152
152
 
153
153
  ### 5. **Data Protection**
154
154
 
155
- - Be aware that **State-Tool** captures screenshots that may contain sensitive information
156
- - **Scrape-Tool** may fetch content from untrusted websites
155
+ - Be aware that **Snapshot** captures screenshots that may contain sensitive information
156
+ - **Scrape** may fetch content from untrusted websites
157
157
  - Avoid using Windows-MCP in environments with highly sensitive data
158
158
  - Consider disabling screenshot functionality (`use_vision=False`) when handling confidential information
159
159
 
Binary file
@@ -1,9 +1,9 @@
1
1
  {
2
2
  "manifest_version": "0.2",
3
3
  "name": "Windows-MCP",
4
- "version": "0.5.8",
4
+ "version": "0.5.7",
5
5
  "description": "MCP Server that enables Claude to interact with Windows OS",
6
- "long_description": "Windows MCP is an open-source project that enables seamless integration between AI agents and the Windows operating system. Acting as an MCP server bridges the gap between LLMs and the Windows operating system, allowing agents to perform tasks such as **file navigation, application control, UI interaction, QA testing,** and more.\\n\\n## Key Features\\n\\n- **Seamless Windows Integration**: Interacts natively with Windows UI elements, opens apps, controls windows, simulates user input, and more.\\n- **Use Any LLM (Vision Optional)**: Unlike many automation tools, Windows MCP doesn't rely on any traditional computer vision techniques or specific fine-tuned models; it works with any LLMs, reducing complexity and setup time.\\n- **Rich Toolset for UI Automation**: Includes tools for basic keyboard, mouse operation and capturing window/UI state.\\n- **Lightweight & Open-Source**: Minimal dependencies and easy setup with full source code available under MIT license.\\n- **Customizable & Extendable**: Easily adapt or extend tools to suit your unique automation or AI integration needs.\\n- **Real-Time Interaction**: Typical latency between actions (e.g., from one mouse click to the next) ranges from **1.5 to 2.3 secs**, and may slightly vary based on the number of active applications and system load, also the inferencing speed of the llm.\\n\\n## Requirements\\n\\n### UV Package Manager\\nThis MCP server requires [UV](https://github.com/astral-sh/uv), a fast Python package manager. \\n\\n```bash\\npip install uv\\n```\\n\\nFor detailed installation instructions, see the [UV documentation](https://github.com/astral-sh/uv#installation).",
6
+ "long_description": "Windows MCP is an open-source project that enables seamless integration between AI agents and the Windows operating system. Acting as an MCP server, it bridges the gap between large language models (LLMs) and the Windows OS, allowing agents to perform tasks such as **file navigation, application control, UI interaction, QA testing, and more**.\n\n**KEY FEATURES**\n- **Seamless Windows Integration**: Interacts natively with Windows UI elements, opens applications, controls windows, simulates user input, and more.\n- **Use Any LLM (Vision Optional)**: Does not rely on traditional computer vision techniques or fine-tuned models. Works with any LLM, reducing complexity and setup time.\n- **Rich Toolset for UI Automation**: Includes tools for keyboard and mouse control, window management, and capturing window or UI state.\n- **Lightweight & Open-Source**: Minimal dependencies with full source code available under the MIT license.\n- **Customizable & Extendable**: Easily adapt or extend tools to suit custom automation workflows or AI integrations.\n- **Real-Time Interaction**: Typical latency between actions ranges from `0.4` to `1.2` seconds, depending on system load, active applications, and LLM inference speed.\n\n**MINIMUM REQUIREMENTS**\n- Python 3.13 or higher\n- UV Package Manager\nThis MCP server requires UV, a fast Python package manager.\nInstallation:\n`curl -LsSf https://astral.sh/uv/install.sh | sh`\nFor detailed installation instructions, [see the UV documentation](https://github.com/astral-sh/uv)",
7
7
  "author": {
8
8
  "name": "CursorTouch",
9
9
  "url": "https://cursortouch.com/"
@@ -1,6 +1,6 @@
1
1
  [project]
2
2
  name = "windows-mcp"
3
- version = "0.5.8"
3
+ version = "0.6.0"
4
4
  description = "Lightweight MCP Server for interacting with Windows Operating System."
5
5
  authors = [
6
6
  { name = "Jeomon George", email = "jeogeoalukka@gmail.com" }
@@ -12,20 +12,17 @@ keywords = ["windows", "mcp", "ai", "desktop","ai agent"]
12
12
  requires-python = ">=3.13"
13
13
  dependencies = [
14
14
  "click>=8.2.1",
15
+ "comtypes>=1.4.15",
15
16
  "fastmcp>=2.14.2",
16
17
  "fuzzywuzzy>=0.18.0",
17
- "humancursor>=1.1.5",
18
- "ipykernel>=6.30.0",
19
18
  "markdownify>=1.1.0",
20
- "pdfplumber>=0.11.7",
21
19
  "pillow>=11.2.1",
22
20
  "posthog>=7.4.0",
23
21
  "psutil>=7.0.0",
24
22
  "pyautogui>=0.9.54",
25
- "pygetwindow>=0.0.9",
26
23
  "python-dotenv>=1.1.0",
27
24
  "python-levenshtein>=0.27.1",
28
- "pywinauto>=0.6.9",
25
+ "pywin32>=311",
29
26
  "requests>=2.32.3",
30
27
  "tabulate>=0.9.0",
31
28
  "uuid7>=0.1.0",