vision-agent 0.2.189__tar.gz → 0.2.190__tar.gz
Sign up to get free protection for your applications and to get access to all the features.
- {vision_agent-0.2.189 → vision_agent-0.2.190}/PKG-INFO +1 -1
- {vision_agent-0.2.189 → vision_agent-0.2.190}/pyproject.toml +1 -1
- {vision_agent-0.2.189 → vision_agent-0.2.190}/vision_agent/tools/__init__.py +1 -0
- {vision_agent-0.2.189 → vision_agent-0.2.190}/vision_agent/tools/tools.py +42 -0
- {vision_agent-0.2.189 → vision_agent-0.2.190}/LICENSE +0 -0
- {vision_agent-0.2.189 → vision_agent-0.2.190}/README.md +0 -0
- {vision_agent-0.2.189 → vision_agent-0.2.190}/vision_agent/__init__.py +0 -0
- {vision_agent-0.2.189 → vision_agent-0.2.190}/vision_agent/agent/__init__.py +0 -0
- {vision_agent-0.2.189 → vision_agent-0.2.190}/vision_agent/agent/agent.py +0 -0
- {vision_agent-0.2.189 → vision_agent-0.2.190}/vision_agent/agent/agent_utils.py +0 -0
- {vision_agent-0.2.189 → vision_agent-0.2.190}/vision_agent/agent/vision_agent.py +0 -0
- {vision_agent-0.2.189 → vision_agent-0.2.190}/vision_agent/agent/vision_agent_coder.py +0 -0
- {vision_agent-0.2.189 → vision_agent-0.2.190}/vision_agent/agent/vision_agent_coder_prompts.py +0 -0
- {vision_agent-0.2.189 → vision_agent-0.2.190}/vision_agent/agent/vision_agent_planner.py +0 -0
- {vision_agent-0.2.189 → vision_agent-0.2.190}/vision_agent/agent/vision_agent_planner_prompts.py +0 -0
- {vision_agent-0.2.189 → vision_agent-0.2.190}/vision_agent/agent/vision_agent_prompts.py +0 -0
- {vision_agent-0.2.189 → vision_agent-0.2.190}/vision_agent/clients/__init__.py +0 -0
- {vision_agent-0.2.189 → vision_agent-0.2.190}/vision_agent/clients/http.py +0 -0
- {vision_agent-0.2.189 → vision_agent-0.2.190}/vision_agent/clients/landing_public_api.py +0 -0
- {vision_agent-0.2.189 → vision_agent-0.2.190}/vision_agent/fonts/__init__.py +0 -0
- {vision_agent-0.2.189 → vision_agent-0.2.190}/vision_agent/fonts/default_font_ch_en.ttf +0 -0
- {vision_agent-0.2.189 → vision_agent-0.2.190}/vision_agent/lmm/__init__.py +0 -0
- {vision_agent-0.2.189 → vision_agent-0.2.190}/vision_agent/lmm/lmm.py +0 -0
- {vision_agent-0.2.189 → vision_agent-0.2.190}/vision_agent/lmm/types.py +0 -0
- {vision_agent-0.2.189 → vision_agent-0.2.190}/vision_agent/tools/meta_tools.py +0 -0
- {vision_agent-0.2.189 → vision_agent-0.2.190}/vision_agent/tools/prompts.py +0 -0
- {vision_agent-0.2.189 → vision_agent-0.2.190}/vision_agent/tools/tool_utils.py +0 -0
- {vision_agent-0.2.189 → vision_agent-0.2.190}/vision_agent/tools/tools_types.py +0 -0
- {vision_agent-0.2.189 → vision_agent-0.2.190}/vision_agent/utils/__init__.py +0 -0
- {vision_agent-0.2.189 → vision_agent-0.2.190}/vision_agent/utils/exceptions.py +0 -0
- {vision_agent-0.2.189 → vision_agent-0.2.190}/vision_agent/utils/execute.py +0 -0
- {vision_agent-0.2.189 → vision_agent-0.2.190}/vision_agent/utils/image_utils.py +0 -0
- {vision_agent-0.2.189 → vision_agent-0.2.190}/vision_agent/utils/sim.py +0 -0
- {vision_agent-0.2.189 → vision_agent-0.2.190}/vision_agent/utils/type_defs.py +0 -0
- {vision_agent-0.2.189 → vision_agent-0.2.190}/vision_agent/utils/video.py +0 -0
@@ -1845,6 +1845,48 @@ def flux_image_inpainting(
|
|
1845
1845
|
return output_image
|
1846
1846
|
|
1847
1847
|
|
1848
|
+
def siglip_classification(image: np.ndarray, labels: List[str]) -> Dict[str, Any]:
|
1849
|
+
"""'siglip_classification' is a tool that can classify an image or a cropped detection given a list
|
1850
|
+
of input labels or tags. It returns the same list of the input labels along with
|
1851
|
+
their probability scores based on image content.
|
1852
|
+
|
1853
|
+
Parameters:
|
1854
|
+
image (np.ndarray): The image to classify or tag
|
1855
|
+
labels (List[str]): The list of candidate labels or tags to score against the image
|
1856
|
+
|
1857
|
+
Returns:
|
1858
|
+
Dict[str, Any]: A single dictionary with two keys: "labels" holds the list
|
1859
|
+
of given labels and "scores" holds the corresponding list of scores.
|
1860
|
+
|
1861
|
+
Example
|
1862
|
+
-------
|
1863
|
+
>>> siglip_classification(image, ['dog', 'cat', 'bird'])
|
1864
|
+
{"labels": ["dog", "cat", "bird"], "scores": [0.68, 0.30, 0.02]}
|
1865
|
+
"""
|
1866
|
+
|
1867
|
+
if image.shape[0] < 1 or image.shape[1] < 1:
|
1868
|
+
return {"labels": [], "scores": []}
|
1869
|
+
|
1870
|
+
image_file = numpy_to_bytes(image)
|
1871
|
+
|
1872
|
+
files = [("image", image_file)]
|
1873
|
+
|
1874
|
+
payload = {
|
1875
|
+
"model": "siglip",
|
1876
|
+
"labels": labels,
|
1877
|
+
}
|
1878
|
+
|
1879
|
+
response: dict[str, Any] = send_inference_request(
|
1880
|
+
payload=payload,
|
1881
|
+
endpoint_name="classification",
|
1882
|
+
files=files,
|
1883
|
+
v2=True,
|
1884
|
+
metadata_payload={"function_name": "siglip_classification"},
|
1885
|
+
)
|
1886
|
+
|
1887
|
+
return response
|
1888
|
+
|
1889
|
+
|
1848
1890
|
# Utility and visualization functions
|
1849
1891
|
|
1850
1892
|
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
{vision_agent-0.2.189 → vision_agent-0.2.190}/vision_agent/agent/vision_agent_coder_prompts.py
RENAMED
File without changes
|
File without changes
|
{vision_agent-0.2.189 → vision_agent-0.2.190}/vision_agent/agent/vision_agent_planner_prompts.py
RENAMED
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|