orgo 0.0.13__tar.gz → 0.0.14__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {orgo-0.0.13 → orgo-0.0.14}/PKG-INFO +4 -1
- {orgo-0.0.13 → orgo-0.0.14}/README.md +3 -0
- {orgo-0.0.13 → orgo-0.0.14}/pyproject.toml +1 -1
- {orgo-0.0.13 → orgo-0.0.14}/src/orgo/__init__.py +1 -0
- {orgo-0.0.13 → orgo-0.0.14}/src/orgo/api/__init__.py +1 -0
- {orgo-0.0.13 → orgo-0.0.14}/src/orgo/api/client.py +8 -1
- {orgo-0.0.13 → orgo-0.0.14}/src/orgo/computer.py +33 -1
- {orgo-0.0.13 → orgo-0.0.14}/src/orgo/project.py +1 -0
- {orgo-0.0.13 → orgo-0.0.14}/src/orgo/prompt.py +1 -0
- {orgo-0.0.13 → orgo-0.0.14}/src/orgo/utils/__init__.py +1 -0
- {orgo-0.0.13 → orgo-0.0.14}/src/orgo/utils/auth.py +1 -0
- {orgo-0.0.13 → orgo-0.0.14}/src/orgo.egg-info/PKG-INFO +4 -1
- {orgo-0.0.13 → orgo-0.0.14}/src/orgo.egg-info/SOURCES.txt +0 -4
- orgo-0.0.13/src/orgo/adapters/__init__.py +0 -7
- orgo-0.0.13/src/orgo/adapters/anthropic.py +0 -64
- orgo-0.0.13/src/orgo/adapters/base.py +0 -14
- orgo-0.0.13/src/orgo/adapters/openai.py +0 -69
- {orgo-0.0.13 → orgo-0.0.14}/setup.cfg +0 -0
- {orgo-0.0.13 → orgo-0.0.14}/src/orgo.egg-info/dependency_links.txt +0 -0
- {orgo-0.0.13 → orgo-0.0.14}/src/orgo.egg-info/requires.txt +0 -0
- {orgo-0.0.13 → orgo-0.0.14}/src/orgo.egg-info/top_level.txt +0 -0
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
Metadata-Version: 2.4
|
|
2
2
|
Name: orgo
|
|
3
|
-
Version: 0.0.13
|
|
3
|
+
Version: 0.0.14
|
|
4
4
|
Summary: Computers for AI agents
|
|
5
5
|
Author: Orgo Team
|
|
6
6
|
License: MIT
|
|
@@ -35,6 +35,9 @@ computer.type("Hello world")
|
|
|
35
35
|
computer.key("Enter")
|
|
36
36
|
computer.screenshot() # Returns PIL Image
|
|
37
37
|
|
|
38
|
+
# Execute Python code
|
|
39
|
+
computer.exec("import pyautogui; pyautogui.click(512, 384)")
|
|
40
|
+
|
|
38
41
|
# Cleanup
|
|
39
42
|
computer.shutdown()
|
|
40
43
|
```
|
|
@@ -1,5 +1,5 @@
|
|
|
1
|
-
"""API client for Orgo service"""
|
|
2
1
|
# src/orgo/api/client.py
|
|
2
|
+
"""API client for Orgo service"""
|
|
3
3
|
|
|
4
4
|
import requests
|
|
5
5
|
from typing import Dict, Any, Optional
|
|
@@ -96,6 +96,13 @@ class ApiClient:
|
|
|
96
96
|
"command": command
|
|
97
97
|
})
|
|
98
98
|
|
|
99
|
+
def execute_python(self, project_id: str, code: str, timeout: int = 10) -> Dict[str, Any]:
|
|
100
|
+
"""Execute Python code on the computer"""
|
|
101
|
+
return self._request("POST", f"computers/{project_id}/exec", {
|
|
102
|
+
"code": code,
|
|
103
|
+
"timeout": timeout
|
|
104
|
+
})
|
|
105
|
+
|
|
99
106
|
def wait(self, project_id: str, seconds: float) -> Dict[str, Any]:
|
|
100
107
|
return self._request("POST", f"computers/{project_id}/wait", {
|
|
101
108
|
"seconds": seconds
|
|
@@ -1,3 +1,4 @@
|
|
|
1
|
+
# src/orgo/computer.py
|
|
1
2
|
"""Computer class for interacting with Orgo virtual environments"""
|
|
2
3
|
import os
|
|
3
4
|
import io
|
|
@@ -110,6 +111,37 @@ class Computer:
|
|
|
110
111
|
response = self.api.execute_bash(self.project_id, command)
|
|
111
112
|
return response.get("output", "")
|
|
112
113
|
|
|
114
|
+
def exec(self, code: str, timeout: int = 10) -> Dict[str, Any]:
|
|
115
|
+
"""
|
|
116
|
+
Execute Python code on the remote computer.
|
|
117
|
+
|
|
118
|
+
Args:
|
|
119
|
+
code: Python code to execute
|
|
120
|
+
timeout: Maximum execution time in seconds (default: 10, max: 300)
|
|
121
|
+
|
|
122
|
+
Returns:
|
|
123
|
+
Dict with keys:
|
|
124
|
+
- success: bool indicating if execution completed without errors
|
|
125
|
+
- output: str containing stdout output
|
|
126
|
+
- error: str containing error message if any
|
|
127
|
+
- error_type: str with exception type name if error occurred
|
|
128
|
+
- timeout: bool indicating if execution timed out
|
|
129
|
+
|
|
130
|
+
Example:
|
|
131
|
+
result = computer.exec('''
|
|
132
|
+
import os
|
|
133
|
+
print(f"Current directory: {os.getcwd()}")
|
|
134
|
+
print(f"Files: {os.listdir('.')}")
|
|
135
|
+
''')
|
|
136
|
+
|
|
137
|
+
if result['success']:
|
|
138
|
+
print(result['output'])
|
|
139
|
+
else:
|
|
140
|
+
print(f"Error: {result['error']}")
|
|
141
|
+
"""
|
|
142
|
+
response = self.api.execute_python(self.project_id, code, timeout)
|
|
143
|
+
return response
|
|
144
|
+
|
|
113
145
|
def wait(self, seconds: float) -> Dict[str, Any]:
|
|
114
146
|
"""Wait for specified number of seconds"""
|
|
115
147
|
return self.api.wait(self.project_id, seconds)
|
|
@@ -168,4 +200,4 @@ class Computer:
|
|
|
168
200
|
# Pass through the Orgo API client configuration
|
|
169
201
|
orgo_api_key=self.api_key,
|
|
170
202
|
orgo_base_url=self.base_api_url
|
|
171
|
-
)
|
|
203
|
+
)
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
Metadata-Version: 2.4
|
|
2
2
|
Name: orgo
|
|
3
|
-
Version: 0.0.13
|
|
3
|
+
Version: 0.0.14
|
|
4
4
|
Summary: Computers for AI agents
|
|
5
5
|
Author: Orgo Team
|
|
6
6
|
License: MIT
|
|
@@ -35,6 +35,9 @@ computer.type("Hello world")
|
|
|
35
35
|
computer.key("Enter")
|
|
36
36
|
computer.screenshot() # Returns PIL Image
|
|
37
37
|
|
|
38
|
+
# Execute Python code
|
|
39
|
+
computer.exec("import pyautogui; pyautogui.click(512, 384)")
|
|
40
|
+
|
|
38
41
|
# Cleanup
|
|
39
42
|
computer.shutdown()
|
|
40
43
|
```
|
|
@@ -9,10 +9,6 @@ src/orgo.egg-info/SOURCES.txt
|
|
|
9
9
|
src/orgo.egg-info/dependency_links.txt
|
|
10
10
|
src/orgo.egg-info/requires.txt
|
|
11
11
|
src/orgo.egg-info/top_level.txt
|
|
12
|
-
src/orgo/adapters/__init__.py
|
|
13
|
-
src/orgo/adapters/anthropic.py
|
|
14
|
-
src/orgo/adapters/base.py
|
|
15
|
-
src/orgo/adapters/openai.py
|
|
16
12
|
src/orgo/api/__init__.py
|
|
17
13
|
src/orgo/api/client.py
|
|
18
14
|
src/orgo/utils/__init__.py
|
|
@@ -1,64 +0,0 @@
|
|
|
1
|
-
"""Adapter for Anthropic's Claude"""
|
|
2
|
-
|
|
3
|
-
from typing import Dict, Any, Optional
|
|
4
|
-
from .base import BaseAdapter
|
|
5
|
-
|
|
6
|
-
class AnthropicAdapter(BaseAdapter):
|
|
7
|
-
def get_tool_definition(self) -> Dict[str, Any]:
|
|
8
|
-
return {
|
|
9
|
-
"name": "computer",
|
|
10
|
-
"description": "Controls a virtual computer to automate tasks",
|
|
11
|
-
"type": "function",
|
|
12
|
-
"parameters": {
|
|
13
|
-
"type": "object",
|
|
14
|
-
"properties": {
|
|
15
|
-
"action": {
|
|
16
|
-
"type": "string",
|
|
17
|
-
"enum": ["left_click", "right_click", "double_click", "type", "key", "scroll", "screenshot"],
|
|
18
|
-
"description": "The action to perform on the computer"
|
|
19
|
-
},
|
|
20
|
-
"coordinate": {
|
|
21
|
-
"type": "array",
|
|
22
|
-
"items": {"type": "number"},
|
|
23
|
-
"description": "The x,y coordinates for click actions",
|
|
24
|
-
"minItems": 2,
|
|
25
|
-
"maxItems": 2
|
|
26
|
-
},
|
|
27
|
-
"text": {
|
|
28
|
-
"type": "string",
|
|
29
|
-
"description": "The text to type or key to press"
|
|
30
|
-
},
|
|
31
|
-
"direction": {
|
|
32
|
-
"type": "string",
|
|
33
|
-
"enum": ["up", "down", "left", "right"],
|
|
34
|
-
"description": "The direction to scroll"
|
|
35
|
-
},
|
|
36
|
-
"amount": {
|
|
37
|
-
"type": "number",
|
|
38
|
-
"description": "The amount to scroll"
|
|
39
|
-
}
|
|
40
|
-
},
|
|
41
|
-
"required": ["action"],
|
|
42
|
-
"additionalProperties": False
|
|
43
|
-
}
|
|
44
|
-
}
|
|
45
|
-
|
|
46
|
-
def format_result(self, tool_id: str, output: Optional[str] = None, error: Optional[str] = None) -> Dict[str, Any]:
|
|
47
|
-
screenshot = self.computer.get_base64()
|
|
48
|
-
result = {
|
|
49
|
-
"type": "tool_result",
|
|
50
|
-
"id": tool_id,
|
|
51
|
-
"content": {
|
|
52
|
-
"type": "image",
|
|
53
|
-
"source": {
|
|
54
|
-
"type": "base64",
|
|
55
|
-
"media_type": "image/png",
|
|
56
|
-
"data": screenshot
|
|
57
|
-
}
|
|
58
|
-
}
|
|
59
|
-
}
|
|
60
|
-
|
|
61
|
-
if error:
|
|
62
|
-
result["error"] = error
|
|
63
|
-
|
|
64
|
-
return result
|
|
@@ -1,14 +0,0 @@
|
|
|
1
|
-
"""Base adapter for AI model integration"""
|
|
2
|
-
|
|
3
|
-
from typing import Dict, Any, Optional
|
|
4
|
-
from ..computer import Computer
|
|
5
|
-
|
|
6
|
-
class BaseAdapter:
|
|
7
|
-
def __init__(self, computer: Computer):
|
|
8
|
-
self.computer = computer
|
|
9
|
-
|
|
10
|
-
def get_tool_definition(self) -> Dict[str, Any]:
|
|
11
|
-
raise NotImplementedError("Subclasses must implement get_tool_definition()")
|
|
12
|
-
|
|
13
|
-
def format_result(self, tool_id: str, output: Optional[str] = None, error: Optional[str] = None) -> Dict[str, Any]:
|
|
14
|
-
raise NotImplementedError("Subclasses must implement format_result()")
|
|
@@ -1,69 +0,0 @@
|
|
|
1
|
-
"""Adapter for OpenAI models"""
|
|
2
|
-
|
|
3
|
-
from typing import Dict, Any, Optional
|
|
4
|
-
from .base import BaseAdapter
|
|
5
|
-
|
|
6
|
-
class OpenAIAdapter(BaseAdapter):
|
|
7
|
-
def get_tool_definition(self) -> Dict[str, Any]:
|
|
8
|
-
return {
|
|
9
|
-
"type": "function",
|
|
10
|
-
"function": {
|
|
11
|
-
"name": "computer",
|
|
12
|
-
"description": "Controls a virtual computer to automate tasks",
|
|
13
|
-
"parameters": {
|
|
14
|
-
"type": "object",
|
|
15
|
-
"properties": {
|
|
16
|
-
"action": {
|
|
17
|
-
"type": "string",
|
|
18
|
-
"enum": ["click", "right_click", "double_click", "type", "key", "scroll", "screenshot"],
|
|
19
|
-
"description": "The action to perform on the computer"
|
|
20
|
-
},
|
|
21
|
-
"x": {
|
|
22
|
-
"type": "number",
|
|
23
|
-
"description": "The x coordinate for click actions"
|
|
24
|
-
},
|
|
25
|
-
"y": {
|
|
26
|
-
"type": "number",
|
|
27
|
-
"description": "The y coordinate for click actions"
|
|
28
|
-
},
|
|
29
|
-
"text": {
|
|
30
|
-
"type": "string",
|
|
31
|
-
"description": "The text to type or key to press"
|
|
32
|
-
},
|
|
33
|
-
"direction": {
|
|
34
|
-
"type": "string",
|
|
35
|
-
"enum": ["up", "down", "left", "right"],
|
|
36
|
-
"description": "The direction to scroll"
|
|
37
|
-
},
|
|
38
|
-
"amount": {
|
|
39
|
-
"type": "number",
|
|
40
|
-
"description": "The amount to scroll"
|
|
41
|
-
}
|
|
42
|
-
},
|
|
43
|
-
"required": ["action"],
|
|
44
|
-
"additionalProperties": False
|
|
45
|
-
}
|
|
46
|
-
}
|
|
47
|
-
}
|
|
48
|
-
|
|
49
|
-
def format_result(self, tool_id: str, output: Optional[str] = None, error: Optional[str] = None) -> Dict[str, Any]:
|
|
50
|
-
screenshot = self.computer.get_base64()
|
|
51
|
-
result = {
|
|
52
|
-
"tool_call_id": tool_id,
|
|
53
|
-
"content": [
|
|
54
|
-
{
|
|
55
|
-
"type": "image_url",
|
|
56
|
-
"image_url": {
|
|
57
|
-
"url": f"data:image/png;base64,{screenshot}"
|
|
58
|
-
}
|
|
59
|
-
}
|
|
60
|
-
]
|
|
61
|
-
}
|
|
62
|
-
|
|
63
|
-
if error:
|
|
64
|
-
result["content"].insert(0, {
|
|
65
|
-
"type": "text",
|
|
66
|
-
"text": f"Error: {error}"
|
|
67
|
-
})
|
|
68
|
-
|
|
69
|
-
return result
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|